diff --git "a/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" "b/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" --- "a/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" +++ "b/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.3047, "train/learning_rate": 2.982e-05, "train/epoch": 0.84, "train/global_step": 500, "_runtime": 4780, "_timestamp": 1646135707, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 25.0, 89.0, 201.0, 274.0, 207.0, 129.0, 61.0, 14.0, 2.0, 3.0], "bins": [-159.7316436767578, -156.95663452148438, -154.181640625, -151.40663146972656, -148.63162231445312, -145.8566131591797, -143.0816192626953, -140.30661010742188, -137.53160095214844, -134.756591796875, -131.98159790039062, -129.2065887451172, -126.43157958984375, -123.65657806396484, -120.88157653808594, -118.1065673828125, -115.3315658569336, -112.55656433105469, -109.78155517578125, -107.00655364990234, -104.2315444946289, -101.45654296875, -98.68153381347656, -95.90653228759766, -93.13153076171875, -90.35652923583984, -87.5815200805664, -84.8065185546875, -82.03150939941406, -79.25650787353516, -76.48150634765625, -73.70649719238281, -70.93148803710938, -68.15648651123047, -65.38147735595703, -62.606475830078125, -59.83146667480469, -57.05646514892578, -54.28145980834961, -51.50645446777344, -48.731449127197266, -45.956443786621094, -43.18143844604492, -40.40643310546875, -37.631431579589844, -34.856422424316406, -32.0814208984375, -29.306415557861328, -26.531410217285156, -23.756404876708984, -20.981399536132812, -18.206396102905273, -15.431390762329102, -12.65638542175293, -9.88138198852539, -7.106376647949219, -4.331371307373047, -1.5563664436340332, 1.2186384201049805, 3.993642807006836, 6.768648147583008, 9.54365348815918, 12.318656921386719, 15.09366226196289, 17.868667602539062]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 7.0, 11.0, 11.0, 13.0, 14.0, 12.0, 23.0, 21.0, 23.0, 42.0, 37.0, 53.0, 48.0, 58.0, 57.0, 72.0, 58.0, 64.0, 50.0, 41.0, 47.0, 42.0, 27.0, 30.0, 26.0, 21.0, 22.0, 19.0, 14.0, 6.0, 3.0, 13.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.47561645507812, -69.17546081542969, -66.87531280517578, -64.57515716552734, -62.275001525878906, -59.974849700927734, -57.67469787597656, -55.374542236328125, -53.07438659667969, -50.774234771728516, -48.47407913208008, -46.173927307128906, -43.87377166748047, -41.5736198425293, -39.273468017578125, -36.97331237792969, -34.673160552978516, -32.373008728027344, -30.072853088378906, -27.772701263427734, -25.472545623779297, -23.172393798828125, -20.87224006652832, -18.572086334228516, -16.27193260192871, -13.971778869628906, -11.671625137329102, -9.371472358703613, -7.071318626403809, -4.771164894104004, -2.4710121154785156, -0.17085838317871094, 2.1292953491210938, 4.429449081420898, 6.729602336883545, 9.029755592346191, 11.329909324645996, 13.6300630569458, 15.930215835571289, 18.230369567871094, 20.5305233001709, 22.830677032470703, 25.130830764770508, 27.430984497070312, 29.731136322021484, 32.03129196166992, 34.331443786621094, 36.63159942626953, 38.9317512512207, 41.231903076171875, 43.53205871582031, 45.832210540771484, 48.13236618041992, 50.432518005371094, 52.73267364501953, 55.0328254699707, 57.332977294921875, 59.63312911987305, 61.933284759521484, 64.23343658447266, 66.5335922241211, 68.83374786376953, 71.13389587402344, 73.43405151367188, 75.73420715332031]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 7.0, 11.0, 15.0, 13.0, 14.0, 25.0, 22.0, 24.0, 30.0, 37.0, 49.0, 57.0, 48.0, 48.0, 64.0, 60.0, 52.0, 51.0, 51.0, 52.0, 36.0, 28.0, 30.0, 21.0, 33.0, 10.0, 18.0, 12.0, 11.0, 16.0, 11.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.72955322265625, -3.5919189453125, -3.45428466796875, -3.316650390625, -3.17901611328125, -3.0413818359375, -2.90374755859375, -2.76611328125, -2.62847900390625, -2.4908447265625, -2.35321044921875, -2.215576171875, -2.07794189453125, -1.9403076171875, -1.80267333984375, -1.6650390625, -1.52740478515625, -1.3897705078125, -1.25213623046875, -1.114501953125, -0.97686767578125, -0.8392333984375, -0.70159912109375, -0.56396484375, -0.42633056640625, -0.2886962890625, -0.15106201171875, -0.013427734375, 0.12420654296875, 0.2618408203125, 0.39947509765625, 0.537109375, 0.67474365234375, 0.8123779296875, 0.95001220703125, 1.087646484375, 1.22528076171875, 1.3629150390625, 1.50054931640625, 1.63818359375, 1.77581787109375, 1.9134521484375, 2.05108642578125, 2.188720703125, 2.32635498046875, 2.4639892578125, 2.60162353515625, 2.7392578125, 2.87689208984375, 3.0145263671875, 3.15216064453125, 3.289794921875, 3.42742919921875, 3.5650634765625, 3.70269775390625, 3.84033203125, 3.97796630859375, 4.1156005859375, 4.25323486328125, 4.390869140625, 4.52850341796875, 4.6661376953125, 4.80377197265625, 4.94140625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 14.0, 13.0, 16.0, 23.0, 27.0, 43.0, 59.0, 83.0, 124.0, 207.0, 315.0, 496.0, 859.0, 1490.0, 2865.0, 6509.0, 18137.0, 74813.0, 592136.0, 2777785.0, 611157.0, 75542.0, 18610.0, 6385.0, 2814.0, 1469.0, 858.0, 482.0, 329.0, 198.0, 114.0, 81.0, 65.0, 56.0, 30.0, 19.0, 18.0, 15.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.2989501953125, -10.902587890625, -10.5062255859375, -10.10986328125, -9.7135009765625, -9.317138671875, -8.9207763671875, -8.5244140625, -8.1280517578125, -7.731689453125, -7.3353271484375, -6.93896484375, -6.5426025390625, -6.146240234375, -5.7498779296875, -5.353515625, -4.9571533203125, -4.560791015625, -4.1644287109375, -3.76806640625, -3.3717041015625, -2.975341796875, -2.5789794921875, -2.1826171875, -1.7862548828125, -1.389892578125, -0.9935302734375, -0.59716796875, -0.2008056640625, 0.195556640625, 0.5919189453125, 0.98828125, 1.3846435546875, 1.781005859375, 2.1773681640625, 2.57373046875, 2.9700927734375, 3.366455078125, 3.7628173828125, 4.1591796875, 4.5555419921875, 4.951904296875, 5.3482666015625, 5.74462890625, 6.1409912109375, 6.537353515625, 6.9337158203125, 7.330078125, 7.7264404296875, 8.122802734375, 8.5191650390625, 8.91552734375, 9.3118896484375, 9.708251953125, 10.1046142578125, 10.5009765625, 10.8973388671875, 11.293701171875, 11.6900634765625, 12.08642578125, 12.4827880859375, 12.879150390625, 13.2755126953125, 13.671875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 11.0, 8.0, 16.0, 33.0, 30.0, 84.0, 112.0, 214.0, 400.0, 631.0, 878.0, 714.0, 427.0, 227.0, 132.0, 65.0, 44.0, 27.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-37.90625, -37.126953125, -36.34765625, -35.568359375, -34.7890625, -34.009765625, -33.23046875, -32.451171875, -31.671875, -30.892578125, -30.11328125, -29.333984375, -28.5546875, -27.775390625, -26.99609375, -26.216796875, -25.4375, -24.658203125, -23.87890625, -23.099609375, -22.3203125, -21.541015625, -20.76171875, -19.982421875, -19.203125, -18.423828125, -17.64453125, -16.865234375, -16.0859375, -15.306640625, -14.52734375, -13.748046875, -12.96875, -12.189453125, -11.41015625, -10.630859375, -9.8515625, -9.072265625, -8.29296875, -7.513671875, -6.734375, -5.955078125, -5.17578125, -4.396484375, -3.6171875, -2.837890625, -2.05859375, -1.279296875, -0.5, 0.279296875, 1.05859375, 1.837890625, 2.6171875, 3.396484375, 4.17578125, 4.955078125, 5.734375, 6.513671875, 7.29296875, 8.072265625, 8.8515625, 9.630859375, 10.41015625, 11.189453125, 11.96875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 15.0, 47.0, 96.0, 204.0, 550.0, 1421.0, 15083.0, 4158904.0, 15713.0, 1382.0, 476.0, 230.0, 71.0, 46.0, 23.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.0625, -120.466796875, -116.87109375, -113.275390625, -109.6796875, -106.083984375, -102.48828125, -98.892578125, -95.296875, -91.701171875, -88.10546875, -84.509765625, -80.9140625, -77.318359375, -73.72265625, -70.126953125, -66.53125, -62.935546875, -59.33984375, -55.744140625, -52.1484375, -48.552734375, -44.95703125, -41.361328125, -37.765625, -34.169921875, -30.57421875, -26.978515625, -23.3828125, -19.787109375, -16.19140625, -12.595703125, -9.0, -5.404296875, -1.80859375, 1.787109375, 5.3828125, 8.978515625, 12.57421875, 16.169921875, 19.765625, 23.361328125, 26.95703125, 30.552734375, 34.1484375, 37.744140625, 41.33984375, 44.935546875, 48.53125, 52.126953125, 55.72265625, 59.318359375, 62.9140625, 66.509765625, 70.10546875, 73.701171875, 77.296875, 80.892578125, 84.48828125, 88.083984375, 91.6796875, 95.275390625, 98.87109375, 102.466796875, 106.0625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 74.0, 443.0, 436.0, 56.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.867191314697266, -27.192401885986328, -20.51761245727539, -13.842823028564453, -7.168033599853516, -0.4932441711425781, 6.181545257568359, 12.856334686279297, 19.531124114990234, 26.205913543701172, 32.88070297241211, 39.55549240112305, 46.230281829833984, 52.90507125854492, 59.57986068725586, 66.25465393066406, 72.929443359375, 79.60423278808594, 86.27902221679688, 92.95381164550781, 99.62860107421875, 106.30339050292969, 112.97817993164062, 119.65296936035156, 126.3277587890625, 133.00254821777344, 139.67733764648438, 146.3521270751953, 153.02691650390625, 159.7017059326172, 166.37649536132812, 173.05128479003906, 179.72607421875, 186.40086364746094, 193.07565307617188, 199.7504425048828, 206.42523193359375, 213.1000213623047, 219.77481079101562, 226.44960021972656, 233.1243896484375, 239.79917907714844, 246.47396850585938, 253.1487579345703, 259.82354736328125, 266.49835205078125, 273.1731262207031, 279.847900390625, 286.522705078125, 293.197509765625, 299.8722839355469, 306.54705810546875, 313.22186279296875, 319.89666748046875, 326.5714416503906, 333.2462158203125, 339.9210205078125, 346.5958251953125, 353.2705993652344, 359.94537353515625, 366.62017822265625, 373.29498291015625, 379.9697570800781, 386.64453125, 393.3193359375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 11.0, 10.0, 10.0, 14.0, 12.0, 9.0, 18.0, 18.0, 15.0, 22.0, 27.0, 28.0, 25.0, 44.0, 38.0, 33.0, 38.0, 38.0, 28.0, 48.0, 46.0, 42.0, 44.0, 36.0, 37.0, 36.0, 34.0, 31.0, 27.0, 18.0, 21.0, 21.0, 15.0, 10.0, 18.0, 11.0, 9.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-45.879852294921875, -44.38687515258789, -42.893898010253906, -41.40092468261719, -39.9079475402832, -38.41497039794922, -36.921993255615234, -35.42901611328125, -33.93604278564453, -32.44306564331055, -30.950090408325195, -29.45711326599121, -27.96413803100586, -26.471160888671875, -24.97818374633789, -23.485206604003906, -21.992229461669922, -20.499252319335938, -19.006277084350586, -17.5132999420166, -16.02032470703125, -14.527347564697266, -13.034370422363281, -11.541394233703613, -10.048418045043945, -8.555441856384277, -7.062465190887451, -5.569488525390625, -4.076512336730957, -2.583536148071289, -1.0905590057373047, 0.4024171829223633, 1.8953933715820312, 3.3883697986602783, 4.881346225738525, 6.374322891235352, 7.8672990798950195, 9.360275268554688, 10.853252410888672, 12.34622859954834, 13.839204788208008, 15.332180976867676, 16.825157165527344, 18.318134307861328, 19.811111450195312, 21.304086685180664, 22.79706382751465, 24.2900390625, 25.783016204833984, 27.27599334716797, 28.76896858215332, 30.261945724487305, 31.754920959472656, 33.24789810180664, 34.740875244140625, 36.23385238647461, 37.726829528808594, 39.21980667114258, 40.71278381347656, 42.20575714111328, 43.698734283447266, 45.19171142578125, 46.684688568115234, 48.17766571044922, 49.67063903808594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 10.0, 18.0, 13.0, 16.0, 20.0, 25.0, 24.0, 38.0, 34.0, 36.0, 62.0, 54.0, 55.0, 50.0, 47.0, 36.0, 59.0, 61.0, 44.0, 41.0, 42.0, 33.0, 33.0, 19.0, 21.0, 20.0, 20.0, 12.0, 7.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.03729248046875, -3.8792724609375, -3.72125244140625, -3.563232421875, -3.40521240234375, -3.2471923828125, -3.08917236328125, -2.93115234375, -2.77313232421875, -2.6151123046875, -2.45709228515625, -2.299072265625, -2.14105224609375, -1.9830322265625, -1.82501220703125, -1.6669921875, -1.50897216796875, -1.3509521484375, -1.19293212890625, -1.034912109375, -0.87689208984375, -0.7188720703125, -0.56085205078125, -0.40283203125, -0.24481201171875, -0.0867919921875, 0.07122802734375, 0.229248046875, 0.38726806640625, 0.5452880859375, 0.70330810546875, 0.861328125, 1.01934814453125, 1.1773681640625, 1.33538818359375, 1.493408203125, 1.65142822265625, 1.8094482421875, 1.96746826171875, 2.12548828125, 2.28350830078125, 2.4415283203125, 2.59954833984375, 2.757568359375, 2.91558837890625, 3.0736083984375, 3.23162841796875, 3.3896484375, 3.54766845703125, 3.7056884765625, 3.86370849609375, 4.021728515625, 4.17974853515625, 4.3377685546875, 4.49578857421875, 4.65380859375, 4.81182861328125, 4.9698486328125, 5.12786865234375, 5.285888671875, 5.44390869140625, 5.6019287109375, 5.75994873046875, 5.91796875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 2.0, 10.0, 16.0, 15.0, 23.0, 36.0, 57.0, 74.0, 105.0, 166.0, 245.0, 340.0, 484.0, 727.0, 1017.0, 1491.0, 2208.0, 3170.0, 4774.0, 7450.0, 10913.0, 16759.0, 26201.0, 41521.0, 68118.0, 115393.0, 197867.0, 217434.0, 127913.0, 75315.0, 45886.0, 28763.0, 18210.0, 11897.0, 7671.0, 5239.0, 3419.0, 2344.0, 1664.0, 1139.0, 742.0, 563.0, 393.0, 252.0, 175.0, 115.0, 71.0, 59.0, 36.0, 28.0, 14.0, 14.0, 11.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5127487182617188, -0.4957122802734375, -0.47867584228515625, -0.461639404296875, -0.44460296630859375, -0.4275665283203125, -0.41053009033203125, -0.39349365234375, -0.37645721435546875, -0.3594207763671875, -0.34238433837890625, -0.325347900390625, -0.30831146240234375, -0.2912750244140625, -0.27423858642578125, -0.2572021484375, -0.24016571044921875, -0.2231292724609375, -0.20609283447265625, -0.189056396484375, -0.17201995849609375, -0.1549835205078125, -0.13794708251953125, -0.12091064453125, -0.10387420654296875, -0.0868377685546875, -0.06980133056640625, -0.052764892578125, -0.03572845458984375, -0.0186920166015625, -0.00165557861328125, 0.015380859375, 0.03241729736328125, 0.0494537353515625, 0.06649017333984375, 0.083526611328125, 0.10056304931640625, 0.1175994873046875, 0.13463592529296875, 0.15167236328125, 0.16870880126953125, 0.1857452392578125, 0.20278167724609375, 0.219818115234375, 0.23685455322265625, 0.2538909912109375, 0.27092742919921875, 0.2879638671875, 0.30500030517578125, 0.3220367431640625, 0.33907318115234375, 0.356109619140625, 0.37314605712890625, 0.3901824951171875, 0.40721893310546875, 0.42425537109375, 0.44129180908203125, 0.4583282470703125, 0.47536468505859375, 0.492401123046875, 0.5094375610351562, 0.5264739990234375, 0.5435104370117188, 0.560546875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 4.0, 7.0, 11.0, 20.0, 11.0, 16.0, 19.0, 10.0, 20.0, 17.0, 20.0, 24.0, 30.0, 28.0, 37.0, 27.0, 24.0, 44.0, 35.0, 23.0, 1067.0, 41.0, 41.0, 41.0, 33.0, 19.0, 33.0, 34.0, 34.0, 24.0, 24.0, 22.0, 22.0, 24.0, 17.0, 18.0, 16.0, 10.0, 16.0, 8.0, 9.0, 12.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-2.318359375, -2.248077392578125, -2.17779541015625, -2.107513427734375, -2.0372314453125, -1.966949462890625, -1.89666748046875, -1.826385498046875, -1.756103515625, -1.685821533203125, -1.61553955078125, -1.545257568359375, -1.4749755859375, -1.404693603515625, -1.33441162109375, -1.264129638671875, -1.19384765625, -1.123565673828125, -1.05328369140625, -0.983001708984375, -0.9127197265625, -0.842437744140625, -0.77215576171875, -0.701873779296875, -0.631591796875, -0.561309814453125, -0.49102783203125, -0.420745849609375, -0.3504638671875, -0.280181884765625, -0.20989990234375, -0.139617919921875, -0.0693359375, 0.000946044921875, 0.07122802734375, 0.141510009765625, 0.2117919921875, 0.282073974609375, 0.35235595703125, 0.422637939453125, 0.492919921875, 0.563201904296875, 0.63348388671875, 0.703765869140625, 0.7740478515625, 0.844329833984375, 0.91461181640625, 0.984893798828125, 1.05517578125, 1.125457763671875, 1.19573974609375, 1.266021728515625, 1.3363037109375, 1.406585693359375, 1.47686767578125, 1.547149658203125, 1.617431640625, 1.687713623046875, 1.75799560546875, 1.828277587890625, 1.8985595703125, 1.968841552734375, 2.03912353515625, 2.109405517578125, 2.1796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 15.0, 15.0, 32.0, 34.0, 58.0, 108.0, 123.0, 184.0, 297.0, 419.0, 654.0, 970.0, 1463.0, 2271.0, 3451.0, 5468.0, 8719.0, 14275.0, 23806.0, 40975.0, 73270.0, 139815.0, 1304336.0, 218335.0, 111604.0, 59760.0, 33617.0, 19958.0, 11942.0, 7446.0, 4740.0, 3014.0, 2027.0, 1307.0, 873.0, 583.0, 399.0, 244.0, 177.0, 120.0, 76.0, 50.0, 38.0, 22.0, 12.0, 10.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.55419921875, -0.5378189086914062, -0.5214385986328125, -0.5050582885742188, -0.488677978515625, -0.47229766845703125, -0.4559173583984375, -0.43953704833984375, -0.42315673828125, -0.40677642822265625, -0.3903961181640625, -0.37401580810546875, -0.357635498046875, -0.34125518798828125, -0.3248748779296875, -0.30849456787109375, -0.2921142578125, -0.27573394775390625, -0.2593536376953125, -0.24297332763671875, -0.226593017578125, -0.21021270751953125, -0.1938323974609375, -0.17745208740234375, -0.16107177734375, -0.14469146728515625, -0.1283111572265625, -0.11193084716796875, -0.095550537109375, -0.07917022705078125, -0.0627899169921875, -0.04640960693359375, -0.030029296875, -0.01364898681640625, 0.0027313232421875, 0.01911163330078125, 0.035491943359375, 0.05187225341796875, 0.0682525634765625, 0.08463287353515625, 0.10101318359375, 0.11739349365234375, 0.1337738037109375, 0.15015411376953125, 0.166534423828125, 0.18291473388671875, 0.1992950439453125, 0.21567535400390625, 0.2320556640625, 0.24843597412109375, 0.2648162841796875, 0.28119659423828125, 0.297576904296875, 0.31395721435546875, 0.3303375244140625, 0.34671783447265625, 0.36309814453125, 0.37947845458984375, 0.3958587646484375, 0.41223907470703125, 0.428619384765625, 0.44499969482421875, 0.4613800048828125, 0.47776031494140625, 0.494140625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 6.0, 13.0, 15.0, 21.0, 22.0, 25.0, 32.0, 45.0, 46.0, 60.0, 76.0, 76.0, 73.0, 65.0, 73.0, 59.0, 52.0, 38.0, 41.0, 27.0, 25.0, 18.0, 15.0, 14.0, 6.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015745162963867188, -0.0015187114477157593, -0.0014629065990447998, -0.0014071017503738403, -0.0013512969017028809, -0.0012954920530319214, -0.001239687204360962, -0.0011838823556900024, -0.001128077507019043, -0.0010722726583480835, -0.001016467809677124, -0.0009606629610061646, -0.0009048581123352051, -0.0008490532636642456, -0.0007932484149932861, -0.0007374435663223267, -0.0006816387176513672, -0.0006258338689804077, -0.0005700290203094482, -0.0005142241716384888, -0.0004584193229675293, -0.0004026144742965698, -0.00034680962562561035, -0.0002910047769546509, -0.0002351999282836914, -0.00017939507961273193, -0.00012359023094177246, -6.778538227081299e-05, -1.1980533599853516e-05, 4.382431507110596e-05, 9.962916374206543e-05, 0.0001554340124130249, 0.00021123886108398438, 0.00026704370975494385, 0.0003228485584259033, 0.0003786534070968628, 0.00043445825576782227, 0.0004902631044387817, 0.0005460679531097412, 0.0006018728017807007, 0.0006576776504516602, 0.0007134824991226196, 0.0007692873477935791, 0.0008250921964645386, 0.000880897045135498, 0.0009367018938064575, 0.000992506742477417, 0.0010483115911483765, 0.001104116439819336, 0.0011599212884902954, 0.0012157261371612549, 0.0012715309858322144, 0.0013273358345031738, 0.0013831406831741333, 0.0014389455318450928, 0.0014947503805160522, 0.0015505552291870117, 0.0016063600778579712, 0.0016621649265289307, 0.0017179697751998901, 0.0017737746238708496, 0.001829579472541809, 0.0018853843212127686, 0.001941189169883728, 0.0019969940185546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 4.0, 12.0, 14.0, 13.0, 22.0, 28.0, 41.0, 42.0, 52.0, 84.0, 112.0, 161.0, 234.0, 353.0, 656.0, 25155.0, 1019249.0, 901.0, 418.0, 261.0, 206.0, 129.0, 113.0, 67.0, 62.0, 39.0, 30.0, 17.0, 14.0, 17.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03896045684814453, -0.03782081604003906, -0.036681175231933594, -0.035541534423828125, -0.034401893615722656, -0.03326225280761719, -0.03212261199951172, -0.03098297119140625, -0.02984333038330078, -0.028703689575195312, -0.027564048767089844, -0.026424407958984375, -0.025284767150878906, -0.024145126342773438, -0.02300548553466797, -0.0218658447265625, -0.02072620391845703, -0.019586563110351562, -0.018446922302246094, -0.017307281494140625, -0.016167640686035156, -0.015027999877929688, -0.013888359069824219, -0.01274871826171875, -0.011609077453613281, -0.010469436645507812, -0.009329795837402344, -0.008190155029296875, -0.007050514221191406, -0.0059108734130859375, -0.004771232604980469, -0.003631591796875, -0.0024919509887695312, -0.0013523101806640625, -0.00021266937255859375, 0.000926971435546875, 0.0020666122436523438, 0.0032062530517578125, 0.004345893859863281, 0.00548553466796875, 0.006625175476074219, 0.0077648162841796875, 0.008904457092285156, 0.010044097900390625, 0.011183738708496094, 0.012323379516601562, 0.013463020324707031, 0.0146026611328125, 0.01574230194091797, 0.016881942749023438, 0.018021583557128906, 0.019161224365234375, 0.020300865173339844, 0.021440505981445312, 0.02258014678955078, 0.02371978759765625, 0.02485942840576172, 0.025999069213867188, 0.027138710021972656, 0.028278350830078125, 0.029417991638183594, 0.030557632446289062, 0.03169727325439453, 0.0328369140625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 18.0, 610.0, 383.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008214879781007767, -0.008067880757153034, -0.007920882664620876, -0.007773883640766144, -0.007626885082572699, -0.007479886524379253, -0.007332887966185808, -0.007185889407992363, -0.0070388903841376305, -0.006891891825944185, -0.00674489326775074, -0.0065978942438960075, -0.006450895685702562, -0.006303897127509117, -0.006156898569315672, -0.006009900011122227, -0.0058629014529287815, -0.005715902894735336, -0.005568904336541891, -0.005421905312687159, -0.005274906754493713, -0.005127908196300268, -0.004980909638106823, -0.004833911079913378, -0.0046869125217199326, -0.004539913963526487, -0.004392915405333042, -0.00424591638147831, -0.004098917823284864, -0.003951919265091419, -0.003804920706897974, -0.003657922148704529, -0.0035109235905110836, -0.0033639250323176384, -0.0032169262412935495, -0.0030699276831001043, -0.0029229288920760155, -0.0027759303338825703, -0.002628931775689125, -0.00248193321749568, -0.0023349341936409473, -0.002187935635447502, -0.0020409368444234133, -0.001893938286229968, -0.001746939611621201, -0.001599940937012434, -0.0014529423788189888, -0.0013059437042102218, -0.0011589451460167766, -0.0010119464714080095, -0.0008649478550069034, -0.0007179492386057973, -0.0005709505639970303, -0.0004239518893882632, -0.0002769532729871571, -0.000129954656586051, 1.7044018022716045e-05, 0.00016404266352765262, 0.0003110413090325892, 0.0004580399545375258, 0.0006050386000424623, 0.0007520372746512294, 0.0008990358910523355, 0.0010460345074534416, 0.0011930331820622087]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 15.0, 6.0, 13.0, 14.0, 12.0, 9.0, 22.0, 23.0, 24.0, 26.0, 34.0, 37.0, 35.0, 45.0, 38.0, 35.0, 34.0, 39.0, 44.0, 37.0, 39.0, 39.0, 36.0, 33.0, 34.0, 36.0, 33.0, 22.0, 19.0, 18.0, 17.0, 15.0, 16.0, 12.0, 13.0, 16.0, 7.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007455945014953613, -0.0007216371595859528, -0.0006976798176765442, -0.0006737224757671356, -0.000649765133857727, -0.0006258077919483185, -0.0006018504500389099, -0.0005778931081295013, -0.0005539357662200928, -0.0005299784243106842, -0.0005060210824012756, -0.00048206374049186707, -0.0004581063985824585, -0.0004341490566730499, -0.00041019171476364136, -0.0003862343728542328, -0.0003622770309448242, -0.00033831968903541565, -0.0003143623471260071, -0.0002904050052165985, -0.00026644766330718994, -0.00024249032139778137, -0.0002185329794883728, -0.00019457563757896423, -0.00017061829566955566, -0.0001466609537601471, -0.00012270361185073853, -9.874626994132996e-05, -7.478892803192139e-05, -5.083158612251282e-05, -2.6874244213104248e-05, -2.9169023036956787e-06, 2.104043960571289e-05, 4.499778151512146e-05, 6.895512342453003e-05, 9.29124653339386e-05, 0.00011686980724334717, 0.00014082714915275574, 0.0001647844910621643, 0.00018874183297157288, 0.00021269917488098145, 0.00023665651679039001, 0.0002606138586997986, 0.00028457120060920715, 0.0003085285425186157, 0.0003324858844280243, 0.00035644322633743286, 0.00038040056824684143, 0.00040435791015625, 0.00042831525206565857, 0.00045227259397506714, 0.0004762299358844757, 0.0005001872777938843, 0.0005241446197032928, 0.0005481019616127014, 0.00057205930352211, 0.0005960166454315186, 0.0006199739873409271, 0.0006439313292503357, 0.0006678886711597443, 0.0006918460130691528, 0.0007158033549785614, 0.00073976069688797, 0.0007637180387973785, 0.0007876753807067871]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 10.0, 18.0, 13.0, 16.0, 20.0, 25.0, 24.0, 38.0, 34.0, 36.0, 62.0, 54.0, 55.0, 50.0, 47.0, 36.0, 59.0, 61.0, 44.0, 41.0, 42.0, 33.0, 33.0, 19.0, 21.0, 20.0, 20.0, 12.0, 7.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.03729248046875, -3.8792724609375, -3.72125244140625, -3.563232421875, -3.40521240234375, -3.2471923828125, -3.08917236328125, -2.93115234375, -2.77313232421875, -2.6151123046875, -2.45709228515625, -2.299072265625, -2.14105224609375, -1.9830322265625, -1.82501220703125, -1.6669921875, -1.50897216796875, -1.3509521484375, -1.19293212890625, -1.034912109375, -0.87689208984375, -0.7188720703125, -0.56085205078125, -0.40283203125, -0.24481201171875, -0.0867919921875, 0.07122802734375, 0.229248046875, 0.38726806640625, 0.5452880859375, 0.70330810546875, 0.861328125, 1.01934814453125, 1.1773681640625, 1.33538818359375, 1.493408203125, 1.65142822265625, 1.8094482421875, 1.96746826171875, 2.12548828125, 2.28350830078125, 2.4415283203125, 2.59954833984375, 2.757568359375, 2.91558837890625, 3.0736083984375, 3.23162841796875, 3.3896484375, 3.54766845703125, 3.7056884765625, 3.86370849609375, 4.021728515625, 4.17974853515625, 4.3377685546875, 4.49578857421875, 4.65380859375, 4.81182861328125, 4.9698486328125, 5.12786865234375, 5.285888671875, 5.44390869140625, 5.6019287109375, 5.75994873046875, 5.91796875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 6.0, 3.0, 7.0, 12.0, 4.0, 10.0, 16.0, 23.0, 31.0, 30.0, 47.0, 69.0, 113.0, 120.0, 165.0, 243.0, 294.0, 445.0, 604.0, 901.0, 1186.0, 1815.0, 2793.0, 4624.0, 8302.0, 18227.0, 81378.0, 784044.0, 100324.0, 19676.0, 8918.0, 4844.0, 2862.0, 1878.0, 1328.0, 895.0, 638.0, 453.0, 318.0, 219.0, 190.0, 128.0, 108.0, 73.0, 49.0, 42.0, 24.0, 24.0, 16.0, 9.0, 7.0, 9.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-20.515625, -19.865234375, -19.21484375, -18.564453125, -17.9140625, -17.263671875, -16.61328125, -15.962890625, -15.3125, -14.662109375, -14.01171875, -13.361328125, -12.7109375, -12.060546875, -11.41015625, -10.759765625, -10.109375, -9.458984375, -8.80859375, -8.158203125, -7.5078125, -6.857421875, -6.20703125, -5.556640625, -4.90625, -4.255859375, -3.60546875, -2.955078125, -2.3046875, -1.654296875, -1.00390625, -0.353515625, 0.296875, 0.947265625, 1.59765625, 2.248046875, 2.8984375, 3.548828125, 4.19921875, 4.849609375, 5.5, 6.150390625, 6.80078125, 7.451171875, 8.1015625, 8.751953125, 9.40234375, 10.052734375, 10.703125, 11.353515625, 12.00390625, 12.654296875, 13.3046875, 13.955078125, 14.60546875, 15.255859375, 15.90625, 16.556640625, 17.20703125, 17.857421875, 18.5078125, 19.158203125, 19.80859375, 20.458984375, 21.109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 10.0, 10.0, 11.0, 16.0, 18.0, 17.0, 17.0, 26.0, 31.0, 36.0, 45.0, 30.0, 32.0, 41.0, 53.0, 91.0, 343.0, 1636.0, 163.0, 68.0, 49.0, 41.0, 33.0, 37.0, 37.0, 28.0, 21.0, 19.0, 23.0, 18.0, 9.0, 12.0, 11.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6796875, -15.221923828125, -14.76416015625, -14.306396484375, -13.8486328125, -13.390869140625, -12.93310546875, -12.475341796875, -12.017578125, -11.559814453125, -11.10205078125, -10.644287109375, -10.1865234375, -9.728759765625, -9.27099609375, -8.813232421875, -8.35546875, -7.897705078125, -7.43994140625, -6.982177734375, -6.5244140625, -6.066650390625, -5.60888671875, -5.151123046875, -4.693359375, -4.235595703125, -3.77783203125, -3.320068359375, -2.8623046875, -2.404541015625, -1.94677734375, -1.489013671875, -1.03125, -0.573486328125, -0.11572265625, 0.342041015625, 0.7998046875, 1.257568359375, 1.71533203125, 2.173095703125, 2.630859375, 3.088623046875, 3.54638671875, 4.004150390625, 4.4619140625, 4.919677734375, 5.37744140625, 5.835205078125, 6.29296875, 6.750732421875, 7.20849609375, 7.666259765625, 8.1240234375, 8.581787109375, 9.03955078125, 9.497314453125, 9.955078125, 10.412841796875, 10.87060546875, 11.328369140625, 11.7861328125, 12.243896484375, 12.70166015625, 13.159423828125, 13.6171875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 7.0, 11.0, 10.0, 15.0, 14.0, 19.0, 22.0, 21.0, 35.0, 47.0, 47.0, 49.0, 114.0, 233.0, 1158.0, 2380208.0, 761988.0, 999.0, 261.0, 109.0, 60.0, 39.0, 44.0, 34.0, 34.0, 21.0, 20.0, 12.0, 17.0, 15.0, 13.0, 12.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.15625, -61.04931640625, -58.9423828125, -56.83544921875, -54.728515625, -52.62158203125, -50.5146484375, -48.40771484375, -46.30078125, -44.19384765625, -42.0869140625, -39.97998046875, -37.873046875, -35.76611328125, -33.6591796875, -31.55224609375, -29.4453125, -27.33837890625, -25.2314453125, -23.12451171875, -21.017578125, -18.91064453125, -16.8037109375, -14.69677734375, -12.58984375, -10.48291015625, -8.3759765625, -6.26904296875, -4.162109375, -2.05517578125, 0.0517578125, 2.15869140625, 4.265625, 6.37255859375, 8.4794921875, 10.58642578125, 12.693359375, 14.80029296875, 16.9072265625, 19.01416015625, 21.12109375, 23.22802734375, 25.3349609375, 27.44189453125, 29.548828125, 31.65576171875, 33.7626953125, 35.86962890625, 37.9765625, 40.08349609375, 42.1904296875, 44.29736328125, 46.404296875, 48.51123046875, 50.6181640625, 52.72509765625, 54.83203125, 56.93896484375, 59.0458984375, 61.15283203125, 63.259765625, 65.36669921875, 67.4736328125, 69.58056640625, 71.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 360.0, 648.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-225.95680236816406, -221.44615173339844, -216.93551635742188, -212.42486572265625, -207.9142303466797, -203.40357971191406, -198.8929443359375, -194.38229370117188, -189.87164306640625, -185.36099243164062, -180.85035705566406, -176.33970642089844, -171.82907104492188, -167.31842041015625, -162.8077850341797, -158.29713439941406, -153.7864990234375, -149.27584838867188, -144.7652130126953, -140.2545623779297, -135.74392700195312, -131.2332763671875, -126.7226333618164, -122.21199035644531, -117.70134735107422, -113.19070434570312, -108.68006134033203, -104.16941833496094, -99.65876770019531, -95.14813232421875, -90.63748168945312, -86.12683868408203, -81.61618041992188, -77.10553741455078, -72.59489440917969, -68.0842514038086, -63.573604583740234, -59.06296157836914, -54.55231475830078, -50.04167175292969, -45.531028747558594, -41.0203857421875, -36.509742736816406, -31.999095916748047, -27.488452911376953, -22.97780990600586, -18.467164993286133, -13.956520080566406, -9.445877075195312, -4.935233116149902, -0.4245891571044922, 4.086054801940918, 8.596698760986328, 13.107341766357422, 17.61798667907715, 22.128631591796875, 26.63927459716797, 31.149917602539062, 35.660560607910156, 40.171207427978516, 44.68185043334961, 49.1924934387207, 53.70314025878906, 58.213783264160156, 62.72442626953125]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 3.0, 7.0, 5.0, 3.0, 12.0, 8.0, 19.0, 19.0, 27.0, 29.0, 30.0, 32.0, 36.0, 26.0, 35.0, 27.0, 46.0, 39.0, 40.0, 36.0, 49.0, 39.0, 36.0, 39.0, 38.0, 40.0, 28.0, 41.0, 26.0, 26.0, 17.0, 22.0, 20.0, 15.0, 12.0, 10.0, 7.0, 11.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.54457092285156, -41.331809997558594, -40.11905288696289, -38.90629196166992, -37.69353103637695, -36.48077392578125, -35.26801300048828, -34.05525207519531, -32.842491149902344, -31.629732131958008, -30.41697120666504, -29.204212188720703, -27.991451263427734, -26.7786922454834, -25.565933227539062, -24.353172302246094, -23.14041519165039, -21.927656173706055, -20.714895248413086, -19.50213623046875, -18.28937530517578, -17.076616287231445, -15.86385726928711, -14.651097297668457, -13.438337326049805, -12.225577354431152, -11.0128173828125, -9.800058364868164, -8.587298393249512, -7.374538421630859, -6.161778926849365, -4.949019432067871, -3.736255645751953, -2.52349591255188, -1.3107361793518066, -0.0979764461517334, 1.1147832870483398, 2.327543258666992, 3.5403027534484863, 4.7530622482299805, 5.965822219848633, 7.178582191467285, 8.391342163085938, 9.604101181030273, 10.816861152648926, 12.029621124267578, 13.242380142211914, 14.455140113830566, 15.667900085449219, 16.880659103393555, 18.093420028686523, 19.30617904663086, 20.518939971923828, 21.731698989868164, 22.9444580078125, 24.15721893310547, 25.369977951049805, 26.58273696899414, 27.79549789428711, 29.008256912231445, 30.22101593017578, 31.43377685546875, 32.64653778076172, 33.85929489135742, 35.07205581665039]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 8.0, 13.0, 8.0, 14.0, 12.0, 16.0, 15.0, 29.0, 25.0, 33.0, 35.0, 37.0, 40.0, 65.0, 42.0, 45.0, 49.0, 57.0, 52.0, 42.0, 50.0, 47.0, 43.0, 34.0, 23.0, 37.0, 24.0, 23.0, 14.0, 19.0, 11.0, 8.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.2213134765625, -4.059814453125, -3.8983154296875, -3.73681640625, -3.5753173828125, -3.413818359375, -3.2523193359375, -3.0908203125, -2.9293212890625, -2.767822265625, -2.6063232421875, -2.44482421875, -2.2833251953125, -2.121826171875, -1.9603271484375, -1.798828125, -1.6373291015625, -1.475830078125, -1.3143310546875, -1.15283203125, -0.9913330078125, -0.829833984375, -0.6683349609375, -0.5068359375, -0.3453369140625, -0.183837890625, -0.0223388671875, 0.13916015625, 0.3006591796875, 0.462158203125, 0.6236572265625, 0.78515625, 0.9466552734375, 1.108154296875, 1.2696533203125, 1.43115234375, 1.5926513671875, 1.754150390625, 1.9156494140625, 2.0771484375, 2.2386474609375, 2.400146484375, 2.5616455078125, 2.72314453125, 2.8846435546875, 3.046142578125, 3.2076416015625, 3.369140625, 3.5306396484375, 3.692138671875, 3.8536376953125, 4.01513671875, 4.1766357421875, 4.338134765625, 4.4996337890625, 4.6611328125, 4.8226318359375, 4.984130859375, 5.1456298828125, 5.30712890625, 5.4686279296875, 5.630126953125, 5.7916259765625, 5.953125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 18.0, 16.0, 16.0, 35.0, 64.0, 62.0, 85.0, 103.0, 158.0, 276.0, 446.0, 760.0, 1307.0, 2500.0, 5521.0, 14235.0, 51918.0, 532794.0, 3236930.0, 287815.0, 37828.0, 11430.0, 4666.0, 2235.0, 1148.0, 649.0, 395.0, 258.0, 158.0, 122.0, 82.0, 58.0, 39.0, 39.0, 21.0, 22.0, 11.0, 9.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.421875, -20.7607421875, -20.099609375, -19.4384765625, -18.77734375, -18.1162109375, -17.455078125, -16.7939453125, -16.1328125, -15.4716796875, -14.810546875, -14.1494140625, -13.48828125, -12.8271484375, -12.166015625, -11.5048828125, -10.84375, -10.1826171875, -9.521484375, -8.8603515625, -8.19921875, -7.5380859375, -6.876953125, -6.2158203125, -5.5546875, -4.8935546875, -4.232421875, -3.5712890625, -2.91015625, -2.2490234375, -1.587890625, -0.9267578125, -0.265625, 0.3955078125, 1.056640625, 1.7177734375, 2.37890625, 3.0400390625, 3.701171875, 4.3623046875, 5.0234375, 5.6845703125, 6.345703125, 7.0068359375, 7.66796875, 8.3291015625, 8.990234375, 9.6513671875, 10.3125, 10.9736328125, 11.634765625, 12.2958984375, 12.95703125, 13.6181640625, 14.279296875, 14.9404296875, 15.6015625, 16.2626953125, 16.923828125, 17.5849609375, 18.24609375, 18.9072265625, 19.568359375, 20.2294921875, 20.890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 15.0, 15.0, 25.0, 32.0, 45.0, 76.0, 115.0, 160.0, 229.0, 327.0, 466.0, 593.0, 601.0, 455.0, 289.0, 192.0, 148.0, 78.0, 61.0, 36.0, 32.0, 20.0, 17.0, 11.0, 15.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.97021484375, -25.2841796875, -24.59814453125, -23.912109375, -23.22607421875, -22.5400390625, -21.85400390625, -21.16796875, -20.48193359375, -19.7958984375, -19.10986328125, -18.423828125, -17.73779296875, -17.0517578125, -16.36572265625, -15.6796875, -14.99365234375, -14.3076171875, -13.62158203125, -12.935546875, -12.24951171875, -11.5634765625, -10.87744140625, -10.19140625, -9.50537109375, -8.8193359375, -8.13330078125, -7.447265625, -6.76123046875, -6.0751953125, -5.38916015625, -4.703125, -4.01708984375, -3.3310546875, -2.64501953125, -1.958984375, -1.27294921875, -0.5869140625, 0.09912109375, 0.78515625, 1.47119140625, 2.1572265625, 2.84326171875, 3.529296875, 4.21533203125, 4.9013671875, 5.58740234375, 6.2734375, 6.95947265625, 7.6455078125, 8.33154296875, 9.017578125, 9.70361328125, 10.3896484375, 11.07568359375, 11.76171875, 12.44775390625, 13.1337890625, 13.81982421875, 14.505859375, 15.19189453125, 15.8779296875, 16.56396484375, 17.25]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 19.0, 32.0, 26.0, 59.0, 67.0, 107.0, 196.0, 440.0, 1759.0, 221504.0, 3961356.0, 7254.0, 685.0, 286.0, 162.0, 97.0, 85.0, 34.0, 31.0, 16.0, 17.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -62.2353515625, -59.158203125, -56.0810546875, -53.00390625, -49.9267578125, -46.849609375, -43.7724609375, -40.6953125, -37.6181640625, -34.541015625, -31.4638671875, -28.38671875, -25.3095703125, -22.232421875, -19.1552734375, -16.078125, -13.0009765625, -9.923828125, -6.8466796875, -3.76953125, -0.6923828125, 2.384765625, 5.4619140625, 8.5390625, 11.6162109375, 14.693359375, 17.7705078125, 20.84765625, 23.9248046875, 27.001953125, 30.0791015625, 33.15625, 36.2333984375, 39.310546875, 42.3876953125, 45.46484375, 48.5419921875, 51.619140625, 54.6962890625, 57.7734375, 60.8505859375, 63.927734375, 67.0048828125, 70.08203125, 73.1591796875, 76.236328125, 79.3134765625, 82.390625, 85.4677734375, 88.544921875, 91.6220703125, 94.69921875, 97.7763671875, 100.853515625, 103.9306640625, 107.0078125, 110.0849609375, 113.162109375, 116.2392578125, 119.31640625, 122.3935546875, 125.470703125, 128.5478515625, 131.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 31.0, 36.0, 69.0, 150.0, 188.0, 188.0, 161.0, 98.0, 46.0, 27.0, 9.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-108.53904724121094, -106.02537536621094, -103.5116958618164, -100.9980239868164, -98.48434448242188, -95.97067260742188, -93.45699310302734, -90.94332122802734, -88.42964172363281, -85.91596984863281, -83.40229034423828, -80.88861846923828, -78.37493896484375, -75.86126708984375, -73.34758758544922, -70.83391571044922, -68.32024383544922, -65.80657196044922, -63.29289245605469, -60.77921676635742, -58.265541076660156, -55.751869201660156, -53.23819351196289, -50.724517822265625, -48.21084213256836, -45.697166442871094, -43.18349075317383, -40.66981506347656, -38.15614318847656, -35.64246368408203, -33.12879180908203, -30.615116119384766, -28.10143280029297, -25.587757110595703, -23.074081420898438, -20.560407638549805, -18.04673194885254, -15.533056259155273, -13.019381523132324, -10.505706787109375, -7.992031097412109, -5.478355884552002, -2.9646806716918945, -0.4510054588317871, 2.0626697540283203, 4.576345443725586, 7.090020179748535, 9.603694915771484, 12.11737060546875, 14.631046295166016, 17.14472198486328, 19.658395767211914, 22.17207145690918, 24.685747146606445, 27.199420928955078, 29.713096618652344, 32.22677230834961, 34.740447998046875, 37.25412368774414, 39.767799377441406, 42.281471252441406, 44.79515075683594, 47.30882263183594, 49.8224983215332, 52.33617401123047]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 14.0, 9.0, 22.0, 16.0, 10.0, 25.0, 27.0, 23.0, 36.0, 29.0, 43.0, 36.0, 42.0, 45.0, 34.0, 45.0, 41.0, 44.0, 37.0, 45.0, 36.0, 46.0, 31.0, 35.0, 31.0, 31.0, 22.0, 19.0, 15.0, 15.0, 20.0, 10.0, 10.0, 5.0, 4.0, 9.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-61.119720458984375, -59.25748825073242, -57.395259857177734, -55.53302764892578, -53.670799255371094, -51.80856704711914, -49.94633483886719, -48.0841064453125, -46.22187805175781, -44.35964584350586, -42.49741744995117, -40.63518524169922, -38.77295684814453, -36.91072463989258, -35.048492431640625, -33.18626403808594, -31.324031829833984, -29.461801528930664, -27.599571228027344, -25.73733901977539, -23.875110626220703, -22.01287841796875, -20.15064811706543, -18.28841781616211, -16.42618751525879, -14.563957214355469, -12.701726913452148, -10.839495658874512, -8.977265357971191, -7.115035057067871, -5.252803802490234, -3.390573501586914, -1.5283432006835938, 0.33388733863830566, 2.196117877960205, 4.058348655700684, 5.920578956604004, 7.782809257507324, 9.645040512084961, 11.507270812988281, 13.369501113891602, 15.231731414794922, 17.093961715698242, 18.956192016601562, 20.818424224853516, 22.680652618408203, 24.542884826660156, 26.405115127563477, 28.267345428466797, 30.129575729370117, 31.991806030273438, 33.85403823852539, 35.71626663208008, 37.57849884033203, 39.44072723388672, 41.30295944213867, 43.165191650390625, 45.02742385864258, 46.889652252197266, 48.75188446044922, 50.614112854003906, 52.47634506225586, 54.33857727050781, 56.2008056640625, 58.06303405761719]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 17.0, 10.0, 15.0, 20.0, 28.0, 30.0, 27.0, 27.0, 46.0, 46.0, 49.0, 49.0, 47.0, 52.0, 64.0, 44.0, 50.0, 59.0, 44.0, 43.0, 35.0, 32.0, 33.0, 28.0, 21.0, 17.0, 15.0, 15.0, 6.0, 5.0, 11.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.3717041015625, -4.192626953125, -4.0135498046875, -3.83447265625, -3.6553955078125, -3.476318359375, -3.2972412109375, -3.1181640625, -2.9390869140625, -2.760009765625, -2.5809326171875, -2.40185546875, -2.2227783203125, -2.043701171875, -1.8646240234375, -1.685546875, -1.5064697265625, -1.327392578125, -1.1483154296875, -0.96923828125, -0.7901611328125, -0.611083984375, -0.4320068359375, -0.2529296875, -0.0738525390625, 0.105224609375, 0.2843017578125, 0.46337890625, 0.6424560546875, 0.821533203125, 1.0006103515625, 1.1796875, 1.3587646484375, 1.537841796875, 1.7169189453125, 1.89599609375, 2.0750732421875, 2.254150390625, 2.4332275390625, 2.6123046875, 2.7913818359375, 2.970458984375, 3.1495361328125, 3.32861328125, 3.5076904296875, 3.686767578125, 3.8658447265625, 4.044921875, 4.2239990234375, 4.403076171875, 4.5821533203125, 4.76123046875, 4.9403076171875, 5.119384765625, 5.2984619140625, 5.4775390625, 5.6566162109375, 5.835693359375, 6.0147705078125, 6.19384765625, 6.3729248046875, 6.552001953125, 6.7310791015625, 6.91015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 12.0, 19.0, 25.0, 40.0, 53.0, 92.0, 123.0, 197.0, 291.0, 404.0, 611.0, 1005.0, 1421.0, 2100.0, 3203.0, 4584.0, 7100.0, 10726.0, 16314.0, 24382.0, 37641.0, 59341.0, 99184.0, 189008.0, 244981.0, 134869.0, 74973.0, 46511.0, 30332.0, 19974.0, 13270.0, 8488.0, 5606.0, 3793.0, 2575.0, 1769.0, 1150.0, 805.0, 510.0, 369.0, 230.0, 180.0, 104.0, 66.0, 47.0, 23.0, 15.0, 12.0, 11.0, 9.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6250152587890625, -0.605010986328125, -0.5850067138671875, -0.56500244140625, -0.5449981689453125, -0.524993896484375, -0.5049896240234375, -0.4849853515625, -0.4649810791015625, -0.444976806640625, -0.4249725341796875, -0.40496826171875, -0.3849639892578125, -0.364959716796875, -0.3449554443359375, -0.324951171875, -0.3049468994140625, -0.284942626953125, -0.2649383544921875, -0.24493408203125, -0.2249298095703125, -0.204925537109375, -0.1849212646484375, -0.1649169921875, -0.1449127197265625, -0.124908447265625, -0.1049041748046875, -0.08489990234375, -0.0648956298828125, -0.044891357421875, -0.0248870849609375, -0.0048828125, 0.0151214599609375, 0.035125732421875, 0.0551300048828125, 0.07513427734375, 0.0951385498046875, 0.115142822265625, 0.1351470947265625, 0.1551513671875, 0.1751556396484375, 0.195159912109375, 0.2151641845703125, 0.23516845703125, 0.2551727294921875, 0.275177001953125, 0.2951812744140625, 0.315185546875, 0.3351898193359375, 0.355194091796875, 0.3751983642578125, 0.39520263671875, 0.4152069091796875, 0.435211181640625, 0.4552154541015625, 0.4752197265625, 0.4952239990234375, 0.515228271484375, 0.5352325439453125, 0.55523681640625, 0.5752410888671875, 0.595245361328125, 0.6152496337890625, 0.63525390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 2.0, 6.0, 11.0, 14.0, 7.0, 13.0, 23.0, 25.0, 12.0, 27.0, 25.0, 28.0, 35.0, 30.0, 35.0, 47.0, 49.0, 44.0, 1071.0, 38.0, 42.0, 41.0, 38.0, 37.0, 48.0, 45.0, 36.0, 29.0, 22.0, 24.0, 24.0, 16.0, 13.0, 17.0, 15.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.7645263671875, -2.665771484375, -2.5670166015625, -2.46826171875, -2.3695068359375, -2.270751953125, -2.1719970703125, -2.0732421875, -1.9744873046875, -1.875732421875, -1.7769775390625, -1.67822265625, -1.5794677734375, -1.480712890625, -1.3819580078125, -1.283203125, -1.1844482421875, -1.085693359375, -0.9869384765625, -0.88818359375, -0.7894287109375, -0.690673828125, -0.5919189453125, -0.4931640625, -0.3944091796875, -0.295654296875, -0.1968994140625, -0.09814453125, 0.0006103515625, 0.099365234375, 0.1981201171875, 0.296875, 0.3956298828125, 0.494384765625, 0.5931396484375, 0.69189453125, 0.7906494140625, 0.889404296875, 0.9881591796875, 1.0869140625, 1.1856689453125, 1.284423828125, 1.3831787109375, 1.48193359375, 1.5806884765625, 1.679443359375, 1.7781982421875, 1.876953125, 1.9757080078125, 2.074462890625, 2.1732177734375, 2.27197265625, 2.3707275390625, 2.469482421875, 2.5682373046875, 2.6669921875, 2.7657470703125, 2.864501953125, 2.9632568359375, 3.06201171875, 3.1607666015625, 3.259521484375, 3.3582763671875, 3.45703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 10.0, 12.0, 22.0, 25.0, 57.0, 75.0, 83.0, 173.0, 218.0, 320.0, 497.0, 742.0, 1057.0, 1553.0, 2387.0, 3498.0, 5372.0, 8524.0, 13331.0, 21903.0, 35762.0, 60741.0, 109742.0, 204946.0, 1291006.0, 142387.0, 75721.0, 44189.0, 26412.0, 16570.0, 10269.0, 6639.0, 4273.0, 2852.0, 1882.0, 1217.0, 847.0, 590.0, 404.0, 255.0, 189.0, 118.0, 82.0, 64.0, 42.0, 16.0, 16.0, 12.0, 4.0, 12.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.52978515625, -0.5128097534179688, -0.4958343505859375, -0.47885894775390625, -0.461883544921875, -0.44490814208984375, -0.4279327392578125, -0.41095733642578125, -0.39398193359375, -0.37700653076171875, -0.3600311279296875, -0.34305572509765625, -0.326080322265625, -0.30910491943359375, -0.2921295166015625, -0.27515411376953125, -0.2581787109375, -0.24120330810546875, -0.2242279052734375, -0.20725250244140625, -0.190277099609375, -0.17330169677734375, -0.1563262939453125, -0.13935089111328125, -0.12237548828125, -0.10540008544921875, -0.0884246826171875, -0.07144927978515625, -0.054473876953125, -0.03749847412109375, -0.0205230712890625, -0.00354766845703125, 0.013427734375, 0.03040313720703125, 0.0473785400390625, 0.06435394287109375, 0.081329345703125, 0.09830474853515625, 0.1152801513671875, 0.13225555419921875, 0.14923095703125, 0.16620635986328125, 0.1831817626953125, 0.20015716552734375, 0.217132568359375, 0.23410797119140625, 0.2510833740234375, 0.26805877685546875, 0.2850341796875, 0.30200958251953125, 0.3189849853515625, 0.33596038818359375, 0.352935791015625, 0.36991119384765625, 0.3868865966796875, 0.40386199951171875, 0.42083740234375, 0.43781280517578125, 0.4547882080078125, 0.47176361083984375, 0.488739013671875, 0.5057144165039062, 0.5226898193359375, 0.5396652221679688, 0.556640625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 19.0, 20.0, 24.0, 29.0, 40.0, 63.0, 85.0, 107.0, 98.0, 100.0, 78.0, 78.0, 54.0, 45.0, 34.0, 24.0, 20.0, 9.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0031032562255859375, -0.003019392490386963, -0.0029355287551879883, -0.0028516650199890137, -0.002767801284790039, -0.0026839375495910645, -0.00260007381439209, -0.0025162100791931152, -0.0024323463439941406, -0.002348482608795166, -0.0022646188735961914, -0.002180755138397217, -0.002096891403198242, -0.0020130276679992676, -0.001929163932800293, -0.0018453001976013184, -0.0017614364624023438, -0.0016775727272033691, -0.0015937089920043945, -0.00150984525680542, -0.0014259815216064453, -0.0013421177864074707, -0.001258254051208496, -0.0011743903160095215, -0.0010905265808105469, -0.0010066628456115723, -0.0009227991104125977, -0.000838935375213623, -0.0007550716400146484, -0.0006712079048156738, -0.0005873441696166992, -0.0005034804344177246, -0.00041961669921875, -0.0003357529640197754, -0.0002518892288208008, -0.00016802549362182617, -8.416175842285156e-05, -2.980232238769531e-07, 8.356571197509766e-05, 0.00016742944717407227, 0.0002512931823730469, 0.0003351569175720215, 0.0004190206527709961, 0.0005028843879699707, 0.0005867481231689453, 0.0006706118583679199, 0.0007544755935668945, 0.0008383393287658691, 0.0009222030639648438, 0.0010060667991638184, 0.001089930534362793, 0.0011737942695617676, 0.0012576580047607422, 0.0013415217399597168, 0.0014253854751586914, 0.001509249210357666, 0.0015931129455566406, 0.0016769766807556152, 0.0017608404159545898, 0.0018447041511535645, 0.001928567886352539, 0.0020124316215515137, 0.0020962953567504883, 0.002180159091949463, 0.0022640228271484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 18.0, 14.0, 36.0, 92.0, 122.0, 222.0, 515.0, 14835.0, 1031260.0, 748.0, 269.0, 159.0, 85.0, 52.0, 25.0, 25.0, 11.0, 11.0, 10.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0589599609375, -0.05679035186767578, -0.05462074279785156, -0.052451133728027344, -0.050281524658203125, -0.048111915588378906, -0.04594230651855469, -0.04377269744873047, -0.04160308837890625, -0.03943347930908203, -0.03726387023925781, -0.035094261169433594, -0.032924652099609375, -0.030755043029785156, -0.028585433959960938, -0.02641582489013672, -0.0242462158203125, -0.02207660675048828, -0.019906997680664062, -0.017737388610839844, -0.015567779541015625, -0.013398170471191406, -0.011228561401367188, -0.009058952331542969, -0.00688934326171875, -0.004719734191894531, -0.0025501251220703125, -0.00038051605224609375, 0.001789093017578125, 0.003958702087402344, 0.0061283111572265625, 0.008297920227050781, 0.010467529296875, 0.012637138366699219, 0.014806747436523438, 0.016976356506347656, 0.019145965576171875, 0.021315574645996094, 0.023485183715820312, 0.02565479278564453, 0.02782440185546875, 0.02999401092529297, 0.03216361999511719, 0.034333229064941406, 0.036502838134765625, 0.038672447204589844, 0.04084205627441406, 0.04301166534423828, 0.0451812744140625, 0.04735088348388672, 0.04952049255371094, 0.051690101623535156, 0.053859710693359375, 0.056029319763183594, 0.05819892883300781, 0.06036853790283203, 0.06253814697265625, 0.06470775604248047, 0.06687736511230469, 0.0690469741821289, 0.07121658325195312, 0.07338619232177734, 0.07555580139160156, 0.07772541046142578, 0.07989501953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 751.0, 259.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004929606337100267, -0.004597438033670187, -0.004265269264578819, -0.003933100961148739, -0.0036009326577186584, -0.003268764354288578, -0.002936595818027854, -0.00260442728176713, -0.0022722589783370495, -0.0019400905584916472, -0.001607922138646245, -0.0012757537188008428, -0.0009435852989554405, -0.0006114168791100383, -0.00027924845926463604, 5.292007699608803e-05, 0.00038508838042616844, 0.0007172568002715707, 0.001049425220116973, 0.0013815936399623752, 0.0017137620598077774, 0.002045930363237858, 0.002378098899498582, 0.002710267435759306, 0.0030424357391893864, 0.0033746040426194668, 0.003706772578880191, 0.004038941115140915, 0.004371109418570995, 0.004703277722001076, 0.005035446025431156, 0.005367614794522524, 0.005699783563613892, 0.006031951867043972, 0.006364120170474052, 0.00669628893956542, 0.0070284572429955006, 0.007360625546425581, 0.007692794315516949, 0.008024962618947029, 0.00835713092237711, 0.00868929922580719, 0.00902146752923727, 0.00935363583266735, 0.009685805067420006, 0.010017973370850086, 0.010350141674280167, 0.010682309977710247, 0.011014478281140327, 0.011346646584570408, 0.011678814888000488, 0.012010983191430569, 0.012343151494860649, 0.012675320729613304, 0.013007489033043385, 0.013339657336473465, 0.013671825639903545, 0.014003993943333626, 0.014336162246763706, 0.014668330550193787, 0.015000499784946442, 0.015332668088376522, 0.015664836391806602, 0.01599700376391411, 0.016329172998666763]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 13.0, 22.0, 16.0, 14.0, 32.0, 23.0, 34.0, 20.0, 36.0, 34.0, 43.0, 27.0, 38.0, 48.0, 37.0, 33.0, 37.0, 41.0, 48.0, 39.0, 47.0, 38.0, 33.0, 32.0, 22.0, 18.0, 24.0, 15.0, 21.0, 15.0, 11.0, 9.0, 11.0, 8.0, 6.0, 8.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008952021598815918, -0.000864262692630291, -0.0008333232253789902, -0.0008023837581276894, -0.0007714442908763885, -0.0007405048236250877, -0.0007095653563737869, -0.0006786258891224861, -0.0006476864218711853, -0.0006167469546198845, -0.0005858074873685837, -0.0005548680201172829, -0.0005239285528659821, -0.0004929890856146812, -0.00046204961836338043, -0.0004311101511120796, -0.0004001706838607788, -0.000369231216609478, -0.0003382917493581772, -0.0003073522821068764, -0.00027641281485557556, -0.00024547334760427475, -0.00021453388035297394, -0.00018359441310167313, -0.00015265494585037231, -0.0001217154785990715, -9.077601134777069e-05, -5.983654409646988e-05, -2.8897076845169067e-05, 2.0423904061317444e-06, 3.2981857657432556e-05, 6.392132490873337e-05, 9.486079216003418e-05, 0.000125800259411335, 0.0001567397266626358, 0.00018767919391393661, 0.00021861866116523743, 0.00024955812841653824, 0.00028049759566783905, 0.00031143706291913986, 0.0003423765301704407, 0.0003733159974217415, 0.0004042554646730423, 0.0004351949319243431, 0.0004661343991756439, 0.0004970738664269447, 0.0005280133336782455, 0.0005589528009295464, 0.0005898922681808472, 0.000620831735432148, 0.0006517712026834488, 0.0006827106699347496, 0.0007136501371860504, 0.0007445896044373512, 0.000775529071688652, 0.0008064685389399529, 0.0008374080061912537, 0.0008683474734425545, 0.0008992869406938553, 0.0009302264079451561, 0.0009611658751964569, 0.0009921053424477577, 0.0010230448096990585, 0.0010539842769503593, 0.0010849237442016602]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 17.0, 10.0, 15.0, 20.0, 28.0, 30.0, 27.0, 27.0, 46.0, 46.0, 49.0, 49.0, 47.0, 52.0, 64.0, 44.0, 50.0, 59.0, 44.0, 43.0, 35.0, 33.0, 32.0, 28.0, 21.0, 17.0, 15.0, 15.0, 6.0, 5.0, 11.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.3717041015625, -4.192626953125, -4.0135498046875, -3.83447265625, -3.6553955078125, -3.476318359375, -3.2972412109375, -3.1181640625, -2.9390869140625, -2.760009765625, -2.5809326171875, -2.40185546875, -2.2227783203125, -2.043701171875, -1.8646240234375, -1.685546875, -1.5064697265625, -1.327392578125, -1.1483154296875, -0.96923828125, -0.7901611328125, -0.611083984375, -0.4320068359375, -0.2529296875, -0.0738525390625, 0.105224609375, 0.2843017578125, 0.46337890625, 0.6424560546875, 0.821533203125, 1.0006103515625, 1.1796875, 1.3587646484375, 1.537841796875, 1.7169189453125, 1.89599609375, 2.0750732421875, 2.254150390625, 2.4332275390625, 2.6123046875, 2.7913818359375, 2.970458984375, 3.1495361328125, 3.32861328125, 3.5076904296875, 3.686767578125, 3.8658447265625, 4.044921875, 4.2239990234375, 4.403076171875, 4.5821533203125, 4.76123046875, 4.9403076171875, 5.119384765625, 5.2984619140625, 5.4775390625, 5.6566162109375, 5.835693359375, 6.0147705078125, 6.19384765625, 6.3729248046875, 6.552001953125, 6.7310791015625, 6.91015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 10.0, 13.0, 42.0, 37.0, 58.0, 90.0, 142.0, 240.0, 341.0, 618.0, 1182.0, 2902.0, 9064.0, 38158.0, 227534.0, 616703.0, 118428.0, 22690.0, 6034.0, 2024.0, 918.0, 499.0, 281.0, 186.0, 122.0, 70.0, 70.0, 29.0, 19.0, 21.0, 7.0, 8.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.6246337890625, -5.432861328125, -5.2410888671875, -5.04931640625, -4.8575439453125, -4.665771484375, -4.4739990234375, -4.2822265625, -4.0904541015625, -3.898681640625, -3.7069091796875, -3.51513671875, -3.3233642578125, -3.131591796875, -2.9398193359375, -2.748046875, -2.5562744140625, -2.364501953125, -2.1727294921875, -1.98095703125, -1.7891845703125, -1.597412109375, -1.4056396484375, -1.2138671875, -1.0220947265625, -0.830322265625, -0.6385498046875, -0.44677734375, -0.2550048828125, -0.063232421875, 0.1285400390625, 0.3203125, 0.5120849609375, 0.703857421875, 0.8956298828125, 1.08740234375, 1.2791748046875, 1.470947265625, 1.6627197265625, 1.8544921875, 2.0462646484375, 2.238037109375, 2.4298095703125, 2.62158203125, 2.8133544921875, 3.005126953125, 3.1968994140625, 3.388671875, 3.5804443359375, 3.772216796875, 3.9639892578125, 4.15576171875, 4.3475341796875, 4.539306640625, 4.7310791015625, 4.9228515625, 5.1146240234375, 5.306396484375, 5.4981689453125, 5.68994140625, 5.8817138671875, 6.073486328125, 6.2652587890625, 6.45703125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 4.0, 14.0, 9.0, 15.0, 20.0, 24.0, 22.0, 26.0, 29.0, 43.0, 43.0, 47.0, 45.0, 50.0, 76.0, 1677.0, 452.0, 62.0, 52.0, 50.0, 36.0, 47.0, 33.0, 33.0, 30.0, 25.0, 18.0, 20.0, 20.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.745849609375, -17.13232421875, -16.518798828125, -15.9052734375, -15.291748046875, -14.67822265625, -14.064697265625, -13.451171875, -12.837646484375, -12.22412109375, -11.610595703125, -10.9970703125, -10.383544921875, -9.77001953125, -9.156494140625, -8.54296875, -7.929443359375, -7.31591796875, -6.702392578125, -6.0888671875, -5.475341796875, -4.86181640625, -4.248291015625, -3.634765625, -3.021240234375, -2.40771484375, -1.794189453125, -1.1806640625, -0.567138671875, 0.04638671875, 0.659912109375, 1.2734375, 1.886962890625, 2.50048828125, 3.114013671875, 3.7275390625, 4.341064453125, 4.95458984375, 5.568115234375, 6.181640625, 6.795166015625, 7.40869140625, 8.022216796875, 8.6357421875, 9.249267578125, 9.86279296875, 10.476318359375, 11.08984375, 11.703369140625, 12.31689453125, 12.930419921875, 13.5439453125, 14.157470703125, 14.77099609375, 15.384521484375, 15.998046875, 16.611572265625, 17.22509765625, 17.838623046875, 18.4521484375, 19.065673828125, 19.67919921875, 20.292724609375, 20.90625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 24.0, 18.0, 14.0, 24.0, 21.0, 41.0, 38.0, 56.0, 86.0, 111.0, 233.0, 756.0, 24542.0, 3116530.0, 2161.0, 443.0, 164.0, 120.0, 71.0, 44.0, 43.0, 24.0, 32.0, 17.0, 27.0, 12.0, 12.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.84375, -47.4189453125, -45.994140625, -44.5693359375, -43.14453125, -41.7197265625, -40.294921875, -38.8701171875, -37.4453125, -36.0205078125, -34.595703125, -33.1708984375, -31.74609375, -30.3212890625, -28.896484375, -27.4716796875, -26.046875, -24.6220703125, -23.197265625, -21.7724609375, -20.34765625, -18.9228515625, -17.498046875, -16.0732421875, -14.6484375, -13.2236328125, -11.798828125, -10.3740234375, -8.94921875, -7.5244140625, -6.099609375, -4.6748046875, -3.25, -1.8251953125, -0.400390625, 1.0244140625, 2.44921875, 3.8740234375, 5.298828125, 6.7236328125, 8.1484375, 9.5732421875, 10.998046875, 12.4228515625, 13.84765625, 15.2724609375, 16.697265625, 18.1220703125, 19.546875, 20.9716796875, 22.396484375, 23.8212890625, 25.24609375, 26.6708984375, 28.095703125, 29.5205078125, 30.9453125, 32.3701171875, 33.794921875, 35.2197265625, 36.64453125, 38.0693359375, 39.494140625, 40.9189453125, 42.34375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 10.0, 34.0, 140.0, 359.0, 319.0, 129.0, 20.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.795841217041016, -43.94947052001953, -43.10310363769531, -42.25673294067383, -41.41036605834961, -40.563995361328125, -39.717628479003906, -38.87125778198242, -38.02488708496094, -37.17851638793945, -36.332149505615234, -35.48577880859375, -34.63941192626953, -33.79304122924805, -32.94667053222656, -32.100303649902344, -31.253936767578125, -30.407567977905273, -29.561199188232422, -28.714828491210938, -27.868459701538086, -27.022090911865234, -26.175722122192383, -25.32935333251953, -24.482982635498047, -23.636613845825195, -22.790245056152344, -21.94387435913086, -21.097505569458008, -20.251136779785156, -19.404767990112305, -18.558399200439453, -17.7120304107666, -16.86566162109375, -16.0192928314209, -15.17292308807373, -14.326554298400879, -13.480184555053711, -12.63381576538086, -11.787446975708008, -10.941078186035156, -10.094709396362305, -9.248339653015137, -8.401970863342285, -7.555602073669434, -6.709232807159424, -5.862863540649414, -5.0164947509765625, -4.1701250076293945, -3.323755979537964, -2.477386951446533, -1.6310176849365234, -0.7846486568450928, 0.06172037124633789, 0.9080896377563477, 1.7544584274291992, 2.600827693939209, 3.4471967220306396, 4.29356575012207, 5.13993501663208, 5.98630428314209, 6.832673072814941, 7.679042339324951, 8.525411605834961, 9.371780395507812]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 10.0, 10.0, 13.0, 15.0, 18.0, 25.0, 29.0, 20.0, 23.0, 28.0, 20.0, 22.0, 40.0, 43.0, 39.0, 41.0, 49.0, 34.0, 31.0, 40.0, 47.0, 36.0, 38.0, 31.0, 28.0, 31.0, 34.0, 24.0, 29.0, 25.0, 19.0, 19.0, 15.0, 17.0, 5.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.77581024169922, -46.37089920043945, -44.96598815917969, -43.561073303222656, -42.15616226196289, -40.751251220703125, -39.34634017944336, -37.941429138183594, -36.53651809692383, -35.13160705566406, -33.7266960144043, -32.32178497314453, -30.916872024536133, -29.511959075927734, -28.10704803466797, -26.702136993408203, -25.297224044799805, -23.89231300354004, -22.48740005493164, -21.082489013671875, -19.67757797241211, -18.272666931152344, -16.867753982543945, -15.46284294128418, -14.057930946350098, -12.653018951416016, -11.24810791015625, -9.843195915222168, -8.438283920288086, -7.03337287902832, -5.628460884094238, -4.223549842834473, -2.8186378479003906, -1.4137262105941772, -0.008814573287963867, 1.396097183227539, 2.801008701324463, 4.205920219421387, 5.610832214355469, 7.015743255615234, 8.420655250549316, 9.825567245483398, 11.230478286743164, 12.635390281677246, 14.040302276611328, 15.445213317871094, 16.85012435913086, 18.255035400390625, 19.659948348999023, 21.06485939025879, 22.469772338867188, 23.874683380126953, 25.27959442138672, 26.684505462646484, 28.089418411254883, 29.49432945251465, 30.899242401123047, 32.30415344238281, 33.70906448364258, 35.113975524902344, 36.518890380859375, 37.92380142211914, 39.328712463378906, 40.73362350463867, 42.13853454589844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 18.0, 13.0, 16.0, 24.0, 34.0, 24.0, 34.0, 29.0, 42.0, 53.0, 52.0, 50.0, 57.0, 55.0, 52.0, 50.0, 52.0, 56.0, 46.0, 42.0, 20.0, 35.0, 29.0, 25.0, 17.0, 15.0, 15.0, 7.0, 7.0, 13.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.5914306640625, -4.405517578125, -4.2196044921875, -4.03369140625, -3.8477783203125, -3.661865234375, -3.4759521484375, -3.2900390625, -3.1041259765625, -2.918212890625, -2.7322998046875, -2.54638671875, -2.3604736328125, -2.174560546875, -1.9886474609375, -1.802734375, -1.6168212890625, -1.430908203125, -1.2449951171875, -1.05908203125, -0.8731689453125, -0.687255859375, -0.5013427734375, -0.3154296875, -0.1295166015625, 0.056396484375, 0.2423095703125, 0.42822265625, 0.6141357421875, 0.800048828125, 0.9859619140625, 1.171875, 1.3577880859375, 1.543701171875, 1.7296142578125, 1.91552734375, 2.1014404296875, 2.287353515625, 2.4732666015625, 2.6591796875, 2.8450927734375, 3.031005859375, 3.2169189453125, 3.40283203125, 3.5887451171875, 3.774658203125, 3.9605712890625, 4.146484375, 4.3323974609375, 4.518310546875, 4.7042236328125, 4.89013671875, 5.0760498046875, 5.261962890625, 5.4478759765625, 5.6337890625, 5.8197021484375, 6.005615234375, 6.1915283203125, 6.37744140625, 6.5633544921875, 6.749267578125, 6.9351806640625, 7.12109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 10.0, 8.0, 15.0, 16.0, 16.0, 37.0, 41.0, 54.0, 60.0, 86.0, 134.0, 187.0, 391.0, 1109.0, 5878.0, 49594.0, 983174.0, 2953329.0, 180793.0, 15546.0, 2336.0, 601.0, 281.0, 151.0, 88.0, 66.0, 61.0, 43.0, 41.0, 29.0, 24.0, 25.0, 14.0, 8.0, 4.0, 9.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.307373046875, -14.72412109375, -14.140869140625, -13.5576171875, -12.974365234375, -12.39111328125, -11.807861328125, -11.224609375, -10.641357421875, -10.05810546875, -9.474853515625, -8.8916015625, -8.308349609375, -7.72509765625, -7.141845703125, -6.55859375, -5.975341796875, -5.39208984375, -4.808837890625, -4.2255859375, -3.642333984375, -3.05908203125, -2.475830078125, -1.892578125, -1.309326171875, -0.72607421875, -0.142822265625, 0.4404296875, 1.023681640625, 1.60693359375, 2.190185546875, 2.7734375, 3.356689453125, 3.93994140625, 4.523193359375, 5.1064453125, 5.689697265625, 6.27294921875, 6.856201171875, 7.439453125, 8.022705078125, 8.60595703125, 9.189208984375, 9.7724609375, 10.355712890625, 10.93896484375, 11.522216796875, 12.10546875, 12.688720703125, 13.27197265625, 13.855224609375, 14.4384765625, 15.021728515625, 15.60498046875, 16.188232421875, 16.771484375, 17.354736328125, 17.93798828125, 18.521240234375, 19.1044921875, 19.687744140625, 20.27099609375, 20.854248046875, 21.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 18.0, 16.0, 49.0, 51.0, 81.0, 99.0, 140.0, 238.0, 338.0, 456.0, 582.0, 571.0, 428.0, 314.0, 215.0, 141.0, 119.0, 64.0, 43.0, 27.0, 25.0, 17.0, 8.0, 10.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.740966796875, -19.12255859375, -18.504150390625, -17.8857421875, -17.267333984375, -16.64892578125, -16.030517578125, -15.412109375, -14.793701171875, -14.17529296875, -13.556884765625, -12.9384765625, -12.320068359375, -11.70166015625, -11.083251953125, -10.46484375, -9.846435546875, -9.22802734375, -8.609619140625, -7.9912109375, -7.372802734375, -6.75439453125, -6.135986328125, -5.517578125, -4.899169921875, -4.28076171875, -3.662353515625, -3.0439453125, -2.425537109375, -1.80712890625, -1.188720703125, -0.5703125, 0.048095703125, 0.66650390625, 1.284912109375, 1.9033203125, 2.521728515625, 3.14013671875, 3.758544921875, 4.376953125, 4.995361328125, 5.61376953125, 6.232177734375, 6.8505859375, 7.468994140625, 8.08740234375, 8.705810546875, 9.32421875, 9.942626953125, 10.56103515625, 11.179443359375, 11.7978515625, 12.416259765625, 13.03466796875, 13.653076171875, 14.271484375, 14.889892578125, 15.50830078125, 16.126708984375, 16.7451171875, 17.363525390625, 17.98193359375, 18.600341796875, 19.21875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 9.0, 3.0, 11.0, 17.0, 28.0, 33.0, 60.0, 93.0, 99.0, 198.0, 386.0, 1267.0, 19728.0, 2883027.0, 1276009.0, 11421.0, 1047.0, 349.0, 179.0, 115.0, 57.0, 48.0, 23.0, 31.0, 14.0, 4.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25, -42.400390625, -40.55078125, -38.701171875, -36.8515625, -35.001953125, -33.15234375, -31.302734375, -29.453125, -27.603515625, -25.75390625, -23.904296875, -22.0546875, -20.205078125, -18.35546875, -16.505859375, -14.65625, -12.806640625, -10.95703125, -9.107421875, -7.2578125, -5.408203125, -3.55859375, -1.708984375, 0.140625, 1.990234375, 3.83984375, 5.689453125, 7.5390625, 9.388671875, 11.23828125, 13.087890625, 14.9375, 16.787109375, 18.63671875, 20.486328125, 22.3359375, 24.185546875, 26.03515625, 27.884765625, 29.734375, 31.583984375, 33.43359375, 35.283203125, 37.1328125, 38.982421875, 40.83203125, 42.681640625, 44.53125, 46.380859375, 48.23046875, 50.080078125, 51.9296875, 53.779296875, 55.62890625, 57.478515625, 59.328125, 61.177734375, 63.02734375, 64.876953125, 66.7265625, 68.576171875, 70.42578125, 72.275390625, 74.125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 20.0, 62.0, 131.0, 261.0, 267.0, 170.0, 65.0, 22.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.441036224365234, -42.25052261352539, -38.06000900268555, -33.86949157714844, -29.678979873657227, -25.488466262817383, -21.297950744628906, -17.107437133789062, -12.916923522949219, -8.726409912109375, -4.535895347595215, -0.3453807830810547, 3.845132827758789, 8.035646438598633, 12.22616195678711, 16.416675567626953, 20.607189178466797, 24.79770278930664, 28.988216400146484, 33.178733825683594, 37.36924743652344, 41.55976104736328, 45.750274658203125, 49.94078826904297, 54.13130187988281, 58.321815490722656, 62.5123291015625, 66.70284271240234, 70.89335632324219, 75.08386993408203, 79.27438354492188, 83.46490478515625, 87.65541076660156, 91.8459243774414, 96.03643798828125, 100.2269515991211, 104.41746520996094, 108.60797882080078, 112.79849243164062, 116.989013671875, 121.17951965332031, 125.37003326416016, 129.560546875, 133.75106811523438, 137.9415740966797, 142.13209533691406, 146.32260131835938, 150.51312255859375, 154.70364379882812, 158.8941650390625, 163.0846710205078, 167.2751922607422, 171.4656982421875, 175.65621948242188, 179.8467254638672, 184.03724670410156, 188.22775268554688, 192.41827392578125, 196.60877990722656, 200.79930114746094, 204.98980712890625, 209.18032836914062, 213.37083435058594, 217.5613555908203, 221.75186157226562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 4.0, 10.0, 4.0, 8.0, 6.0, 12.0, 15.0, 11.0, 21.0, 23.0, 23.0, 37.0, 35.0, 27.0, 31.0, 41.0, 42.0, 43.0, 42.0, 40.0, 46.0, 29.0, 42.0, 50.0, 36.0, 50.0, 31.0, 37.0, 26.0, 33.0, 27.0, 14.0, 14.0, 18.0, 16.0, 18.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.21797180175781, -48.60258102416992, -46.9871940612793, -45.371803283691406, -43.75641632080078, -42.14102554321289, -40.525638580322266, -38.910247802734375, -37.29486083984375, -35.67947006225586, -34.064083099365234, -32.448692321777344, -30.83330535888672, -29.217914581298828, -27.602527618408203, -25.987136840820312, -24.371747970581055, -22.756359100341797, -21.14097023010254, -19.52558135986328, -17.910192489624023, -16.294803619384766, -14.679413795471191, -13.064024925231934, -11.448636054992676, -9.833247184753418, -8.21785831451416, -6.602468967437744, -4.987080097198486, -3.3716907501220703, -1.7563018798828125, -0.1409130096435547, 1.4744758605957031, 3.089864730834961, 4.705253601074219, 6.320642948150635, 7.936031818389893, 9.551421165466309, 11.166810035705566, 12.782198905944824, 14.397587776184082, 16.012977600097656, 17.628366470336914, 19.243755340576172, 20.85914421081543, 22.474533081054688, 24.089921951293945, 25.705310821533203, 27.32069969177246, 28.93608856201172, 30.551477432250977, 32.166866302490234, 33.782257080078125, 35.39764404296875, 37.01303482055664, 38.628421783447266, 40.243812561035156, 41.85920333862305, 43.47459030151367, 45.08998107910156, 46.70536804199219, 48.32075881958008, 49.9361457824707, 51.551536560058594, 53.16692352294922]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 14.0, 19.0, 16.0, 25.0, 38.0, 29.0, 42.0, 34.0, 43.0, 35.0, 52.0, 46.0, 82.0, 62.0, 54.0, 52.0, 41.0, 39.0, 52.0, 30.0, 28.0, 27.0, 30.0, 26.0, 24.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.76910400390625, -4.5733642578125, -4.37762451171875, -4.181884765625, -3.98614501953125, -3.7904052734375, -3.59466552734375, -3.39892578125, -3.20318603515625, -3.0074462890625, -2.81170654296875, -2.615966796875, -2.42022705078125, -2.2244873046875, -2.02874755859375, -1.8330078125, -1.63726806640625, -1.4415283203125, -1.24578857421875, -1.050048828125, -0.85430908203125, -0.6585693359375, -0.46282958984375, -0.26708984375, -0.07135009765625, 0.1243896484375, 0.32012939453125, 0.515869140625, 0.71160888671875, 0.9073486328125, 1.10308837890625, 1.298828125, 1.49456787109375, 1.6903076171875, 1.88604736328125, 2.081787109375, 2.27752685546875, 2.4732666015625, 2.66900634765625, 2.86474609375, 3.06048583984375, 3.2562255859375, 3.45196533203125, 3.647705078125, 3.84344482421875, 4.0391845703125, 4.23492431640625, 4.4306640625, 4.62640380859375, 4.8221435546875, 5.01788330078125, 5.213623046875, 5.40936279296875, 5.6051025390625, 5.80084228515625, 5.99658203125, 6.19232177734375, 6.3880615234375, 6.58380126953125, 6.779541015625, 6.97528076171875, 7.1710205078125, 7.36676025390625, 7.5625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 12.0, 8.0, 19.0, 35.0, 36.0, 62.0, 109.0, 149.0, 245.0, 324.0, 516.0, 770.0, 1203.0, 1898.0, 2879.0, 4353.0, 7006.0, 10990.0, 18114.0, 30249.0, 52365.0, 95024.0, 186375.0, 275900.0, 159569.0, 83228.0, 46020.0, 27136.0, 16240.0, 10057.0, 6240.0, 3919.0, 2587.0, 1661.0, 1133.0, 766.0, 461.0, 302.0, 203.0, 152.0, 95.0, 56.0, 29.0, 13.0, 21.0, 16.0, 2.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7273178100585938, -0.7041473388671875, -0.6809768676757812, -0.657806396484375, -0.6346359252929688, -0.6114654541015625, -0.5882949829101562, -0.56512451171875, -0.5419540405273438, -0.5187835693359375, -0.49561309814453125, -0.472442626953125, -0.44927215576171875, -0.4261016845703125, -0.40293121337890625, -0.3797607421875, -0.35659027099609375, -0.3334197998046875, -0.31024932861328125, -0.287078857421875, -0.26390838623046875, -0.2407379150390625, -0.21756744384765625, -0.19439697265625, -0.17122650146484375, -0.1480560302734375, -0.12488555908203125, -0.101715087890625, -0.07854461669921875, -0.0553741455078125, -0.03220367431640625, -0.009033203125, 0.01413726806640625, 0.0373077392578125, 0.06047821044921875, 0.083648681640625, 0.10681915283203125, 0.1299896240234375, 0.15316009521484375, 0.17633056640625, 0.19950103759765625, 0.2226715087890625, 0.24584197998046875, 0.269012451171875, 0.29218292236328125, 0.3153533935546875, 0.33852386474609375, 0.3616943359375, 0.38486480712890625, 0.4080352783203125, 0.43120574951171875, 0.454376220703125, 0.47754669189453125, 0.5007171630859375, 0.5238876342773438, 0.54705810546875, 0.5702285766601562, 0.5933990478515625, 0.6165695190429688, 0.639739990234375, 0.6629104614257812, 0.6860809326171875, 0.7092514038085938, 0.732421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 10.0, 4.0, 5.0, 9.0, 14.0, 11.0, 11.0, 21.0, 18.0, 30.0, 21.0, 32.0, 36.0, 30.0, 47.0, 50.0, 32.0, 52.0, 50.0, 1072.0, 60.0, 44.0, 37.0, 23.0, 29.0, 47.0, 26.0, 26.0, 21.0, 15.0, 11.0, 23.0, 20.0, 15.0, 12.0, 7.0, 12.0, 4.0, 7.0, 4.0, 11.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.091796875, -2.996337890625, -2.90087890625, -2.805419921875, -2.7099609375, -2.614501953125, -2.51904296875, -2.423583984375, -2.328125, -2.232666015625, -2.13720703125, -2.041748046875, -1.9462890625, -1.850830078125, -1.75537109375, -1.659912109375, -1.564453125, -1.468994140625, -1.37353515625, -1.278076171875, -1.1826171875, -1.087158203125, -0.99169921875, -0.896240234375, -0.80078125, -0.705322265625, -0.60986328125, -0.514404296875, -0.4189453125, -0.323486328125, -0.22802734375, -0.132568359375, -0.037109375, 0.058349609375, 0.15380859375, 0.249267578125, 0.3447265625, 0.440185546875, 0.53564453125, 0.631103515625, 0.7265625, 0.822021484375, 0.91748046875, 1.012939453125, 1.1083984375, 1.203857421875, 1.29931640625, 1.394775390625, 1.490234375, 1.585693359375, 1.68115234375, 1.776611328125, 1.8720703125, 1.967529296875, 2.06298828125, 2.158447265625, 2.25390625, 2.349365234375, 2.44482421875, 2.540283203125, 2.6357421875, 2.731201171875, 2.82666015625, 2.922119140625, 3.017578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 6.0, 8.0, 8.0, 14.0, 11.0, 26.0, 28.0, 29.0, 51.0, 87.0, 115.0, 149.0, 214.0, 326.0, 468.0, 691.0, 1031.0, 1421.0, 2158.0, 3080.0, 4880.0, 7158.0, 11244.0, 17447.0, 27868.0, 45717.0, 78739.0, 146662.0, 1297425.0, 195314.0, 102404.0, 57229.0, 34061.0, 21028.0, 13575.0, 8690.0, 5768.0, 3704.0, 2588.0, 1783.0, 1208.0, 844.0, 575.0, 417.0, 261.0, 193.0, 126.0, 94.0, 69.0, 41.0, 32.0, 30.0, 21.0, 7.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0], "bins": [-0.57763671875, -0.5599822998046875, -0.542327880859375, -0.5246734619140625, -0.50701904296875, -0.4893646240234375, -0.471710205078125, -0.4540557861328125, -0.4364013671875, -0.4187469482421875, -0.401092529296875, -0.3834381103515625, -0.36578369140625, -0.3481292724609375, -0.330474853515625, -0.3128204345703125, -0.295166015625, -0.2775115966796875, -0.259857177734375, -0.2422027587890625, -0.22454833984375, -0.2068939208984375, -0.189239501953125, -0.1715850830078125, -0.1539306640625, -0.1362762451171875, -0.118621826171875, -0.1009674072265625, -0.08331298828125, -0.0656585693359375, -0.048004150390625, -0.0303497314453125, -0.0126953125, 0.0049591064453125, 0.022613525390625, 0.0402679443359375, 0.05792236328125, 0.0755767822265625, 0.093231201171875, 0.1108856201171875, 0.1285400390625, 0.1461944580078125, 0.163848876953125, 0.1815032958984375, 0.19915771484375, 0.2168121337890625, 0.234466552734375, 0.2521209716796875, 0.269775390625, 0.2874298095703125, 0.305084228515625, 0.3227386474609375, 0.34039306640625, 0.3580474853515625, 0.375701904296875, 0.3933563232421875, 0.4110107421875, 0.4286651611328125, 0.446319580078125, 0.4639739990234375, 0.48162841796875, 0.4992828369140625, 0.516937255859375, 0.5345916748046875, 0.55224609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 6.0, 4.0, 8.0, 11.0, 17.0, 18.0, 28.0, 32.0, 24.0, 35.0, 45.0, 55.0, 67.0, 83.0, 99.0, 62.0, 75.0, 62.0, 56.0, 42.0, 35.0, 31.0, 14.0, 16.0, 15.0, 11.0, 11.0, 9.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0019378662109375, -0.0018814951181411743, -0.0018251240253448486, -0.001768752932548523, -0.0017123818397521973, -0.0016560107469558716, -0.001599639654159546, -0.0015432685613632202, -0.0014868974685668945, -0.0014305263757705688, -0.0013741552829742432, -0.0013177841901779175, -0.0012614130973815918, -0.0012050420045852661, -0.0011486709117889404, -0.0010922998189926147, -0.001035928726196289, -0.0009795576333999634, -0.0009231865406036377, -0.000866815447807312, -0.0008104443550109863, -0.0007540732622146606, -0.000697702169418335, -0.0006413310766220093, -0.0005849599838256836, -0.0005285888910293579, -0.0004722177982330322, -0.00041584670543670654, -0.00035947561264038086, -0.0003031045198440552, -0.0002467334270477295, -0.0001903623342514038, -0.00013399124145507812, -7.762014865875244e-05, -2.1249055862426758e-05, 3.5122036933898926e-05, 9.149312973022461e-05, 0.0001478642225265503, 0.00020423531532287598, 0.00026060640811920166, 0.00031697750091552734, 0.00037334859371185303, 0.0004297196865081787, 0.0004860907793045044, 0.0005424618721008301, 0.0005988329648971558, 0.0006552040576934814, 0.0007115751504898071, 0.0007679462432861328, 0.0008243173360824585, 0.0008806884288787842, 0.0009370595216751099, 0.0009934306144714355, 0.0010498017072677612, 0.001106172800064087, 0.0011625438928604126, 0.0012189149856567383, 0.001275286078453064, 0.0013316571712493896, 0.0013880282640457153, 0.001444399356842041, 0.0015007704496383667, 0.0015571415424346924, 0.001613512635231018, 0.0016698837280273438]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 7.0, 16.0, 14.0, 26.0, 26.0, 32.0, 46.0, 87.0, 128.0, 149.0, 251.0, 446.0, 1738.0, 1023206.0, 20807.0, 665.0, 304.0, 170.0, 114.0, 82.0, 68.0, 41.0, 30.0, 22.0, 14.0, 8.0, 8.0, 6.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.032946109771728516, -0.03171253204345703, -0.030478954315185547, -0.029245376586914062, -0.028011798858642578, -0.026778221130371094, -0.02554464340209961, -0.024311065673828125, -0.02307748794555664, -0.021843910217285156, -0.020610332489013672, -0.019376754760742188, -0.018143177032470703, -0.01690959930419922, -0.015676021575927734, -0.01444244384765625, -0.013208866119384766, -0.011975288391113281, -0.010741710662841797, -0.009508132934570312, -0.008274555206298828, -0.007040977478027344, -0.005807399749755859, -0.004573822021484375, -0.0033402442932128906, -0.0021066665649414062, -0.0008730888366699219, 0.0003604888916015625, 0.0015940666198730469, 0.0028276443481445312, 0.004061222076416016, 0.0052947998046875, 0.006528377532958984, 0.007761955261230469, 0.008995532989501953, 0.010229110717773438, 0.011462688446044922, 0.012696266174316406, 0.01392984390258789, 0.015163421630859375, 0.01639699935913086, 0.017630577087402344, 0.018864154815673828, 0.020097732543945312, 0.021331310272216797, 0.02256488800048828, 0.023798465728759766, 0.02503204345703125, 0.026265621185302734, 0.02749919891357422, 0.028732776641845703, 0.029966354370117188, 0.031199932098388672, 0.032433509826660156, 0.03366708755493164, 0.034900665283203125, 0.03613424301147461, 0.037367820739746094, 0.03860139846801758, 0.03983497619628906, 0.04106855392456055, 0.04230213165283203, 0.043535709381103516, 0.044769287109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 26.0, 620.0, 364.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008985470049083233, -0.008765552192926407, -0.00854563433676958, -0.008325716480612755, -0.008105798624455929, -0.007885880768299103, -0.007665962912142277, -0.007446045055985451, -0.007226127199828625, -0.007006209343671799, -0.006786291487514973, -0.006566373631358147, -0.006346455775201321, -0.006126537919044495, -0.005906620062887669, -0.005686702206730843, -0.005466783884912729, -0.005246866028755903, -0.005026948172599077, -0.004807030316442251, -0.004587112460285425, -0.004367194604128599, -0.004147276282310486, -0.00392735842615366, -0.0037074408028274775, -0.0034875229466706514, -0.0032676050905138254, -0.0030476870015263557, -0.0028277691453695297, -0.0026078512892127037, -0.0023879334330558777, -0.0021680155768990517, -0.0019480977207422256, -0.0017281798645853996, -0.0015082620084285736, -0.0012883440358564258, -0.0010684261796995997, -0.0008485083235427737, -0.0006285903509706259, -0.00040867249481379986, -0.00018875463865697384, 3.116324660368264e-05, 0.0002510811318643391, 0.00047099904622882605, 0.0006909169023856521, 0.0009108347585424781, 0.001130752731114626, 0.001350670587271452, 0.001570588443428278, 0.001790506299585104, 0.00201042415574193, 0.002230342011898756, 0.002450259868055582, 0.002670177724212408, 0.0028900958131998777, 0.0031100136693567038, 0.0033299315255135298, 0.003549849381670356, 0.003769767237827182, 0.0039896853268146515, 0.0042096031829714775, 0.0044295210391283035, 0.0046494388952851295, 0.004869356751441956, 0.005089274607598782]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 14.0, 9.0, 13.0, 11.0, 14.0, 16.0, 12.0, 14.0, 26.0, 12.0, 24.0, 31.0, 33.0, 39.0, 40.0, 41.0, 45.0, 39.0, 39.0, 30.0, 43.0, 30.0, 43.0, 35.0, 34.0, 30.0, 36.0, 34.0, 30.0, 22.0, 20.0, 20.0, 21.0, 17.0, 13.0, 16.0, 11.0, 8.0, 10.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000735938549041748, -0.0007114782929420471, -0.0006870180368423462, -0.0006625577807426453, -0.0006380975246429443, -0.0006136372685432434, -0.0005891770124435425, -0.0005647167563438416, -0.0005402565002441406, -0.0005157962441444397, -0.0004913359880447388, -0.00046687573194503784, -0.0004424154758453369, -0.000417955219745636, -0.00039349496364593506, -0.00036903470754623413, -0.0003445744514465332, -0.0003201141953468323, -0.00029565393924713135, -0.0002711936831474304, -0.0002467334270477295, -0.00022227317094802856, -0.00019781291484832764, -0.0001733526587486267, -0.00014889240264892578, -0.00012443214654922485, -9.997189044952393e-05, -7.5511634349823e-05, -5.105137825012207e-05, -2.6591122150421143e-05, -2.130866050720215e-06, 2.2329390048980713e-05, 4.678964614868164e-05, 7.124990224838257e-05, 9.57101583480835e-05, 0.00012017041444778442, 0.00014463067054748535, 0.00016909092664718628, 0.0001935511827468872, 0.00021801143884658813, 0.00024247169494628906, 0.00026693195104599, 0.0002913922071456909, 0.00031585246324539185, 0.0003403127193450928, 0.0003647729754447937, 0.00038923323154449463, 0.00041369348764419556, 0.0004381537437438965, 0.0004626139998435974, 0.00048707425594329834, 0.0005115345120429993, 0.0005359947681427002, 0.0005604550242424011, 0.000584915280342102, 0.000609375536441803, 0.0006338357925415039, 0.0006582960486412048, 0.0006827563047409058, 0.0007072165608406067, 0.0007316768169403076, 0.0007561370730400085, 0.0007805973291397095, 0.0008050575852394104, 0.0008295178413391113]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 14.0, 19.0, 16.0, 25.0, 38.0, 29.0, 42.0, 34.0, 43.0, 35.0, 52.0, 46.0, 82.0, 62.0, 54.0, 52.0, 41.0, 39.0, 52.0, 30.0, 28.0, 27.0, 30.0, 26.0, 24.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.76910400390625, -4.5733642578125, -4.37762451171875, -4.181884765625, -3.98614501953125, -3.7904052734375, -3.59466552734375, -3.39892578125, -3.20318603515625, -3.0074462890625, -2.81170654296875, -2.615966796875, -2.42022705078125, -2.2244873046875, -2.02874755859375, -1.8330078125, -1.63726806640625, -1.4415283203125, -1.24578857421875, -1.050048828125, -0.85430908203125, -0.6585693359375, -0.46282958984375, -0.26708984375, -0.07135009765625, 0.1243896484375, 0.32012939453125, 0.515869140625, 0.71160888671875, 0.9073486328125, 1.10308837890625, 1.298828125, 1.49456787109375, 1.6903076171875, 1.88604736328125, 2.081787109375, 2.27752685546875, 2.4732666015625, 2.66900634765625, 2.86474609375, 3.06048583984375, 3.2562255859375, 3.45196533203125, 3.647705078125, 3.84344482421875, 4.0391845703125, 4.23492431640625, 4.4306640625, 4.62640380859375, 4.8221435546875, 5.01788330078125, 5.213623046875, 5.40936279296875, 5.6051025390625, 5.80084228515625, 5.99658203125, 6.19232177734375, 6.3880615234375, 6.58380126953125, 6.779541015625, 6.97528076171875, 7.1710205078125, 7.36676025390625, 7.5625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 11.0, 16.0, 26.0, 34.0, 52.0, 95.0, 113.0, 193.0, 320.0, 500.0, 829.0, 1452.0, 2397.0, 4298.0, 8166.0, 17234.0, 43438.0, 138707.0, 481179.0, 234452.0, 66866.0, 24641.0, 10686.0, 5473.0, 2954.0, 1744.0, 995.0, 612.0, 396.0, 258.0, 144.0, 91.0, 62.0, 41.0, 24.0, 15.0, 13.0, 7.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.96209716796875, -2.8421630859375, -2.72222900390625, -2.602294921875, -2.48236083984375, -2.3624267578125, -2.24249267578125, -2.12255859375, -2.00262451171875, -1.8826904296875, -1.76275634765625, -1.642822265625, -1.52288818359375, -1.4029541015625, -1.28302001953125, -1.1630859375, -1.04315185546875, -0.9232177734375, -0.80328369140625, -0.683349609375, -0.56341552734375, -0.4434814453125, -0.32354736328125, -0.20361328125, -0.08367919921875, 0.0362548828125, 0.15618896484375, 0.276123046875, 0.39605712890625, 0.5159912109375, 0.63592529296875, 0.755859375, 0.87579345703125, 0.9957275390625, 1.11566162109375, 1.235595703125, 1.35552978515625, 1.4754638671875, 1.59539794921875, 1.71533203125, 1.83526611328125, 1.9552001953125, 2.07513427734375, 2.195068359375, 2.31500244140625, 2.4349365234375, 2.55487060546875, 2.6748046875, 2.79473876953125, 2.9146728515625, 3.03460693359375, 3.154541015625, 3.27447509765625, 3.3944091796875, 3.51434326171875, 3.63427734375, 3.75421142578125, 3.8741455078125, 3.99407958984375, 4.114013671875, 4.23394775390625, 4.3538818359375, 4.47381591796875, 4.59375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 9.0, 13.0, 11.0, 9.0, 15.0, 25.0, 19.0, 27.0, 16.0, 34.0, 35.0, 47.0, 44.0, 52.0, 69.0, 56.0, 168.0, 1830.0, 123.0, 53.0, 54.0, 43.0, 39.0, 44.0, 32.0, 27.0, 23.0, 20.0, 19.0, 17.0, 17.0, 11.0, 9.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.640625, -22.051513671875, -21.46240234375, -20.873291015625, -20.2841796875, -19.695068359375, -19.10595703125, -18.516845703125, -17.927734375, -17.338623046875, -16.74951171875, -16.160400390625, -15.5712890625, -14.982177734375, -14.39306640625, -13.803955078125, -13.21484375, -12.625732421875, -12.03662109375, -11.447509765625, -10.8583984375, -10.269287109375, -9.68017578125, -9.091064453125, -8.501953125, -7.912841796875, -7.32373046875, -6.734619140625, -6.1455078125, -5.556396484375, -4.96728515625, -4.378173828125, -3.7890625, -3.199951171875, -2.61083984375, -2.021728515625, -1.4326171875, -0.843505859375, -0.25439453125, 0.334716796875, 0.923828125, 1.512939453125, 2.10205078125, 2.691162109375, 3.2802734375, 3.869384765625, 4.45849609375, 5.047607421875, 5.63671875, 6.225830078125, 6.81494140625, 7.404052734375, 7.9931640625, 8.582275390625, 9.17138671875, 9.760498046875, 10.349609375, 10.938720703125, 11.52783203125, 12.116943359375, 12.7060546875, 13.295166015625, 13.88427734375, 14.473388671875, 15.0625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 3.0, 3.0, 8.0, 7.0, 14.0, 18.0, 15.0, 21.0, 18.0, 33.0, 19.0, 55.0, 67.0, 87.0, 165.0, 307.0, 775.0, 5448.0, 2483315.0, 649781.0, 3920.0, 729.0, 283.0, 180.0, 105.0, 77.0, 39.0, 37.0, 36.0, 21.0, 17.0, 21.0, 14.0, 14.0, 11.0, 11.0, 7.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.859375, -24.899658203125, -23.93994140625, -22.980224609375, -22.0205078125, -21.060791015625, -20.10107421875, -19.141357421875, -18.181640625, -17.221923828125, -16.26220703125, -15.302490234375, -14.3427734375, -13.383056640625, -12.42333984375, -11.463623046875, -10.50390625, -9.544189453125, -8.58447265625, -7.624755859375, -6.6650390625, -5.705322265625, -4.74560546875, -3.785888671875, -2.826171875, -1.866455078125, -0.90673828125, 0.052978515625, 1.0126953125, 1.972412109375, 2.93212890625, 3.891845703125, 4.8515625, 5.811279296875, 6.77099609375, 7.730712890625, 8.6904296875, 9.650146484375, 10.60986328125, 11.569580078125, 12.529296875, 13.489013671875, 14.44873046875, 15.408447265625, 16.3681640625, 17.327880859375, 18.28759765625, 19.247314453125, 20.20703125, 21.166748046875, 22.12646484375, 23.086181640625, 24.0458984375, 25.005615234375, 25.96533203125, 26.925048828125, 27.884765625, 28.844482421875, 29.80419921875, 30.763916015625, 31.7236328125, 32.683349609375, 33.64306640625, 34.602783203125, 35.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 312.0, 675.0, 26.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.09268188476562, -233.99868774414062, -229.90469360351562, -225.81068420410156, -221.71669006347656, -217.62269592285156, -213.5286865234375, -209.4346923828125, -205.3406982421875, -201.2467041015625, -197.1527099609375, -193.05870056152344, -188.96470642089844, -184.87071228027344, -180.77670288085938, -176.68270874023438, -172.58871459960938, -168.49472045898438, -164.40072631835938, -160.3067169189453, -156.2127227783203, -152.1187286376953, -148.02471923828125, -143.93072509765625, -139.83673095703125, -135.74273681640625, -131.64874267578125, -127.55473327636719, -123.46073913574219, -119.36674499511719, -115.27274322509766, -111.17874145507812, -107.08473205566406, -102.99073791503906, -98.89673614501953, -94.802734375, -90.708740234375, -86.61474609375, -82.52074432373047, -78.42674255371094, -74.33274841308594, -70.23875427246094, -66.1447525024414, -62.05075454711914, -57.956756591796875, -53.86275863647461, -49.768760681152344, -45.67476272583008, -41.58076858520508, -37.48677062988281, -33.39277267456055, -29.29877471923828, -25.204776763916016, -21.11077880859375, -17.016780853271484, -12.922782897949219, -8.828784942626953, -4.7347869873046875, -0.6407890319824219, 3.4532089233398438, 7.547206878662109, 11.641204833984375, 15.73520278930664, 19.829200744628906, 23.923198699951172]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 3.0, 9.0, 11.0, 12.0, 21.0, 23.0, 28.0, 32.0, 26.0, 26.0, 27.0, 28.0, 34.0, 37.0, 29.0, 35.0, 49.0, 48.0, 59.0, 43.0, 36.0, 39.0, 39.0, 35.0, 26.0, 24.0, 34.0, 25.0, 22.0, 17.0, 18.0, 13.0, 11.0, 10.0, 14.0, 3.0, 13.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-58.52305221557617, -56.78562545776367, -55.04820251464844, -53.31077575683594, -51.5733528137207, -49.8359260559082, -48.09850311279297, -46.36107635498047, -44.62364959716797, -42.88622283935547, -41.148799896240234, -39.411373138427734, -37.6739501953125, -35.9365234375, -34.1990966796875, -32.461673736572266, -30.7242488861084, -28.98682403564453, -27.249399185180664, -25.511974334716797, -23.774547576904297, -22.03712272644043, -20.299697875976562, -18.562271118164062, -16.824848175048828, -15.087423324584961, -13.349997520446777, -11.61257266998291, -9.875146865844727, -8.13772201538086, -6.400297164916992, -4.662871360778809, -2.925445556640625, -1.1880203485488892, 0.5494048595428467, 2.286829948425293, 4.024255275726318, 5.761680603027344, 7.499105453491211, 9.236531257629395, 10.973956108093262, 12.711380958557129, 14.448806762695312, 16.18623161315918, 17.923656463623047, 19.661083221435547, 21.39850616455078, 23.13593292236328, 24.87335777282715, 26.610782623291016, 28.348207473754883, 30.08563232421875, 31.82305908203125, 33.56048583984375, 35.297908782958984, 37.035335540771484, 38.77275848388672, 40.51018524169922, 42.24760818481445, 43.98503494262695, 45.72245788574219, 47.45988464355469, 49.19731140136719, 50.93473434448242, 52.67216110229492]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 3.0, 12.0, 13.0, 17.0, 15.0, 23.0, 28.0, 44.0, 31.0, 41.0, 38.0, 39.0, 42.0, 57.0, 64.0, 62.0, 62.0, 51.0, 34.0, 43.0, 49.0, 37.0, 28.0, 25.0, 27.0, 24.0, 29.0, 17.0, 13.0, 14.0, 4.0, 9.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.6964111328125, -4.498291015625, -4.3001708984375, -4.10205078125, -3.9039306640625, -3.705810546875, -3.5076904296875, -3.3095703125, -3.1114501953125, -2.913330078125, -2.7152099609375, -2.51708984375, -2.3189697265625, -2.120849609375, -1.9227294921875, -1.724609375, -1.5264892578125, -1.328369140625, -1.1302490234375, -0.93212890625, -0.7340087890625, -0.535888671875, -0.3377685546875, -0.1396484375, 0.0584716796875, 0.256591796875, 0.4547119140625, 0.65283203125, 0.8509521484375, 1.049072265625, 1.2471923828125, 1.4453125, 1.6434326171875, 1.841552734375, 2.0396728515625, 2.23779296875, 2.4359130859375, 2.634033203125, 2.8321533203125, 3.0302734375, 3.2283935546875, 3.426513671875, 3.6246337890625, 3.82275390625, 4.0208740234375, 4.218994140625, 4.4171142578125, 4.615234375, 4.8133544921875, 5.011474609375, 5.2095947265625, 5.40771484375, 5.6058349609375, 5.803955078125, 6.0020751953125, 6.2001953125, 6.3983154296875, 6.596435546875, 6.7945556640625, 6.99267578125, 7.1907958984375, 7.388916015625, 7.5870361328125, 7.78515625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 11.0, 20.0, 17.0, 15.0, 22.0, 29.0, 31.0, 36.0, 43.0, 43.0, 74.0, 208.0, 1589.0, 46972.0, 3794128.0, 345340.0, 4921.0, 371.0, 110.0, 53.0, 50.0, 33.0, 30.0, 22.0, 28.0, 17.0, 20.0, 11.0, 10.0, 14.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.28125, -27.1806640625, -26.080078125, -24.9794921875, -23.87890625, -22.7783203125, -21.677734375, -20.5771484375, -19.4765625, -18.3759765625, -17.275390625, -16.1748046875, -15.07421875, -13.9736328125, -12.873046875, -11.7724609375, -10.671875, -9.5712890625, -8.470703125, -7.3701171875, -6.26953125, -5.1689453125, -4.068359375, -2.9677734375, -1.8671875, -0.7666015625, 0.333984375, 1.4345703125, 2.53515625, 3.6357421875, 4.736328125, 5.8369140625, 6.9375, 8.0380859375, 9.138671875, 10.2392578125, 11.33984375, 12.4404296875, 13.541015625, 14.6416015625, 15.7421875, 16.8427734375, 17.943359375, 19.0439453125, 20.14453125, 21.2451171875, 22.345703125, 23.4462890625, 24.546875, 25.6474609375, 26.748046875, 27.8486328125, 28.94921875, 30.0498046875, 31.150390625, 32.2509765625, 33.3515625, 34.4521484375, 35.552734375, 36.6533203125, 37.75390625, 38.8544921875, 39.955078125, 41.0556640625, 42.15625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 10.0, 8.0, 23.0, 35.0, 58.0, 84.0, 125.0, 183.0, 262.0, 440.0, 635.0, 672.0, 559.0, 351.0, 237.0, 158.0, 97.0, 55.0, 37.0, 12.0, 9.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-28.125, -27.4727783203125, -26.820556640625, -26.1683349609375, -25.51611328125, -24.8638916015625, -24.211669921875, -23.5594482421875, -22.9072265625, -22.2550048828125, -21.602783203125, -20.9505615234375, -20.29833984375, -19.6461181640625, -18.993896484375, -18.3416748046875, -17.689453125, -17.0372314453125, -16.385009765625, -15.7327880859375, -15.08056640625, -14.4283447265625, -13.776123046875, -13.1239013671875, -12.4716796875, -11.8194580078125, -11.167236328125, -10.5150146484375, -9.86279296875, -9.2105712890625, -8.558349609375, -7.9061279296875, -7.25390625, -6.6016845703125, -5.949462890625, -5.2972412109375, -4.64501953125, -3.9927978515625, -3.340576171875, -2.6883544921875, -2.0361328125, -1.3839111328125, -0.731689453125, -0.0794677734375, 0.57275390625, 1.2249755859375, 1.877197265625, 2.5294189453125, 3.181640625, 3.8338623046875, 4.486083984375, 5.1383056640625, 5.79052734375, 6.4427490234375, 7.094970703125, 7.7471923828125, 8.3994140625, 9.0516357421875, 9.703857421875, 10.3560791015625, 11.00830078125, 11.6605224609375, 12.312744140625, 12.9649658203125, 13.6171875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 14.0, 38.0, 60.0, 66.0, 100.0, 165.0, 241.0, 535.0, 1951.0, 33829.0, 3722275.0, 426683.0, 6500.0, 902.0, 334.0, 174.0, 144.0, 92.0, 37.0, 26.0, 31.0, 23.0, 15.0, 10.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.31982421875, -39.4208984375, -37.52197265625, -35.623046875, -33.72412109375, -31.8251953125, -29.92626953125, -28.02734375, -26.12841796875, -24.2294921875, -22.33056640625, -20.431640625, -18.53271484375, -16.6337890625, -14.73486328125, -12.8359375, -10.93701171875, -9.0380859375, -7.13916015625, -5.240234375, -3.34130859375, -1.4423828125, 0.45654296875, 2.35546875, 4.25439453125, 6.1533203125, 8.05224609375, 9.951171875, 11.85009765625, 13.7490234375, 15.64794921875, 17.546875, 19.44580078125, 21.3447265625, 23.24365234375, 25.142578125, 27.04150390625, 28.9404296875, 30.83935546875, 32.73828125, 34.63720703125, 36.5361328125, 38.43505859375, 40.333984375, 42.23291015625, 44.1318359375, 46.03076171875, 47.9296875, 49.82861328125, 51.7275390625, 53.62646484375, 55.525390625, 57.42431640625, 59.3232421875, 61.22216796875, 63.12109375, 65.02001953125, 66.9189453125, 68.81787109375, 70.716796875, 72.61572265625, 74.5146484375, 76.41357421875, 78.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 21.0, 42.0, 95.0, 191.0, 224.0, 183.0, 163.0, 61.0, 20.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.32640075683594, -131.41815185546875, -127.50990295410156, -123.60165405273438, -119.69340515136719, -115.78515625, -111.87689971923828, -107.9686508178711, -104.0604019165039, -100.15215301513672, -96.24390411376953, -92.33565521240234, -88.42739868164062, -84.51914978027344, -80.61090087890625, -76.70265197753906, -72.79440307617188, -68.88615417480469, -64.9779052734375, -61.06965255737305, -57.16140365600586, -53.25315475463867, -49.34490203857422, -45.43665313720703, -41.528404235839844, -37.620155334472656, -33.71190643310547, -29.803653717041016, -25.895404815673828, -21.98715591430664, -18.07890510559082, -14.170654296875, -10.262405395507812, -6.354155540466309, -2.4459056854248047, 1.4623441696166992, 5.370594024658203, 9.27884292602539, 13.187093734741211, 17.09534454345703, 21.00359344482422, 24.911842346191406, 28.820093154907227, 32.72834396362305, 36.636592864990234, 40.54484176635742, 44.453094482421875, 48.36134338378906, 52.26959228515625, 56.17784118652344, 60.086090087890625, 63.99434280395508, 67.902587890625, 71.81083679199219, 75.7190933227539, 79.6273422241211, 83.53559112548828, 87.44384002685547, 91.35208892822266, 95.26033782958984, 99.16859436035156, 103.07684326171875, 106.98509216308594, 110.89334106445312, 114.80158996582031]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 12.0, 11.0, 15.0, 21.0, 23.0, 21.0, 27.0, 20.0, 22.0, 26.0, 36.0, 44.0, 48.0, 44.0, 34.0, 39.0, 32.0, 43.0, 35.0, 42.0, 45.0, 45.0, 33.0, 27.0, 25.0, 28.0, 30.0, 25.0, 19.0, 18.0, 12.0, 18.0, 13.0, 6.0, 8.0, 10.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.94775390625, -48.38202667236328, -46.81629943847656, -45.250572204589844, -43.684844970703125, -42.119117736816406, -40.55339050292969, -38.987667083740234, -37.421939849853516, -35.8562126159668, -34.29048538208008, -32.72475814819336, -31.159032821655273, -29.593305587768555, -28.027578353881836, -26.46185302734375, -24.8961238861084, -23.33039665222168, -21.76466941833496, -20.198944091796875, -18.633216857910156, -17.067489624023438, -15.501762390136719, -13.936036109924316, -12.370308876037598, -10.804581642150879, -9.238855361938477, -7.673128128051758, -6.107401371002197, -4.541674613952637, -2.975947380065918, -1.4102210998535156, 0.15550613403320312, 1.7212330102920532, 3.2869598865509033, 4.852686882019043, 6.4184136390686035, 7.984140396118164, 9.549867630004883, 11.115593910217285, 12.681321144104004, 14.247048377990723, 15.812774658203125, 17.378501892089844, 18.944229125976562, 20.50995635986328, 22.07568359375, 23.641408920288086, 25.207136154174805, 26.772863388061523, 28.338590621948242, 29.904315948486328, 31.470043182373047, 33.035770416259766, 34.601497650146484, 36.1672248840332, 37.73295211791992, 39.29867935180664, 40.86440658569336, 42.43013381958008, 43.9958610534668, 45.56158447265625, 47.12731170654297, 48.69303894042969, 50.258766174316406]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 10.0, 11.0, 16.0, 19.0, 29.0, 26.0, 36.0, 36.0, 32.0, 47.0, 49.0, 49.0, 53.0, 58.0, 52.0, 50.0, 47.0, 48.0, 47.0, 42.0, 36.0, 35.0, 31.0, 30.0, 24.0, 22.0, 21.0, 9.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.398681640625, -5.19580078125, -4.992919921875, -4.7900390625, -4.587158203125, -4.38427734375, -4.181396484375, -3.978515625, -3.775634765625, -3.57275390625, -3.369873046875, -3.1669921875, -2.964111328125, -2.76123046875, -2.558349609375, -2.35546875, -2.152587890625, -1.94970703125, -1.746826171875, -1.5439453125, -1.341064453125, -1.13818359375, -0.935302734375, -0.732421875, -0.529541015625, -0.32666015625, -0.123779296875, 0.0791015625, 0.281982421875, 0.48486328125, 0.687744140625, 0.890625, 1.093505859375, 1.29638671875, 1.499267578125, 1.7021484375, 1.905029296875, 2.10791015625, 2.310791015625, 2.513671875, 2.716552734375, 2.91943359375, 3.122314453125, 3.3251953125, 3.528076171875, 3.73095703125, 3.933837890625, 4.13671875, 4.339599609375, 4.54248046875, 4.745361328125, 4.9482421875, 5.151123046875, 5.35400390625, 5.556884765625, 5.759765625, 5.962646484375, 6.16552734375, 6.368408203125, 6.5712890625, 6.774169921875, 6.97705078125, 7.179931640625, 7.3828125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 16.0, 18.0, 27.0, 35.0, 70.0, 95.0, 117.0, 210.0, 281.0, 431.0, 632.0, 861.0, 1244.0, 1826.0, 2584.0, 3694.0, 5313.0, 7710.0, 11284.0, 16473.0, 24970.0, 38245.0, 61931.0, 105045.0, 193042.0, 230087.0, 131638.0, 74678.0, 45339.0, 29054.0, 19337.0, 13075.0, 9039.0, 6240.0, 4252.0, 2962.0, 2053.0, 1427.0, 1028.0, 661.0, 463.0, 347.0, 220.0, 174.0, 126.0, 56.0, 46.0, 38.0, 19.0, 15.0, 11.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66748046875, -0.6467437744140625, -0.626007080078125, -0.6052703857421875, -0.58453369140625, -0.5637969970703125, -0.543060302734375, -0.5223236083984375, -0.5015869140625, -0.4808502197265625, -0.460113525390625, -0.4393768310546875, -0.41864013671875, -0.3979034423828125, -0.377166748046875, -0.3564300537109375, -0.335693359375, -0.3149566650390625, -0.294219970703125, -0.2734832763671875, -0.25274658203125, -0.2320098876953125, -0.211273193359375, -0.1905364990234375, -0.1697998046875, -0.1490631103515625, -0.128326416015625, -0.1075897216796875, -0.08685302734375, -0.0661163330078125, -0.045379638671875, -0.0246429443359375, -0.00390625, 0.0168304443359375, 0.037567138671875, 0.0583038330078125, 0.07904052734375, 0.0997772216796875, 0.120513916015625, 0.1412506103515625, 0.1619873046875, 0.1827239990234375, 0.203460693359375, 0.2241973876953125, 0.24493408203125, 0.2656707763671875, 0.286407470703125, 0.3071441650390625, 0.327880859375, 0.3486175537109375, 0.369354248046875, 0.3900909423828125, 0.41082763671875, 0.4315643310546875, 0.452301025390625, 0.4730377197265625, 0.4937744140625, 0.5145111083984375, 0.535247802734375, 0.5559844970703125, 0.57672119140625, 0.5974578857421875, 0.618194580078125, 0.6389312744140625, 0.65966796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 11.0, 9.0, 24.0, 20.0, 21.0, 29.0, 36.0, 27.0, 35.0, 37.0, 41.0, 43.0, 33.0, 48.0, 39.0, 1069.0, 46.0, 45.0, 44.0, 42.0, 36.0, 35.0, 33.0, 30.0, 21.0, 34.0, 22.0, 12.0, 5.0, 15.0, 15.0, 7.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.703125, -3.5986328125, -3.494140625, -3.3896484375, -3.28515625, -3.1806640625, -3.076171875, -2.9716796875, -2.8671875, -2.7626953125, -2.658203125, -2.5537109375, -2.44921875, -2.3447265625, -2.240234375, -2.1357421875, -2.03125, -1.9267578125, -1.822265625, -1.7177734375, -1.61328125, -1.5087890625, -1.404296875, -1.2998046875, -1.1953125, -1.0908203125, -0.986328125, -0.8818359375, -0.77734375, -0.6728515625, -0.568359375, -0.4638671875, -0.359375, -0.2548828125, -0.150390625, -0.0458984375, 0.05859375, 0.1630859375, 0.267578125, 0.3720703125, 0.4765625, 0.5810546875, 0.685546875, 0.7900390625, 0.89453125, 0.9990234375, 1.103515625, 1.2080078125, 1.3125, 1.4169921875, 1.521484375, 1.6259765625, 1.73046875, 1.8349609375, 1.939453125, 2.0439453125, 2.1484375, 2.2529296875, 2.357421875, 2.4619140625, 2.56640625, 2.6708984375, 2.775390625, 2.8798828125, 2.984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 5.0, 13.0, 15.0, 19.0, 19.0, 43.0, 63.0, 87.0, 111.0, 159.0, 224.0, 279.0, 461.0, 591.0, 858.0, 1192.0, 1709.0, 2434.0, 3497.0, 5213.0, 7864.0, 12040.0, 18247.0, 28876.0, 46007.0, 78072.0, 139917.0, 1277014.0, 194291.0, 108090.0, 61731.0, 37869.0, 23532.0, 15545.0, 10085.0, 6460.0, 4392.0, 3056.0, 2060.0, 1494.0, 1060.0, 702.0, 481.0, 397.0, 222.0, 203.0, 137.0, 86.0, 78.0, 49.0, 29.0, 22.0, 20.0, 6.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54443359375, -0.5267486572265625, -0.509063720703125, -0.4913787841796875, -0.47369384765625, -0.4560089111328125, -0.438323974609375, -0.4206390380859375, -0.4029541015625, -0.3852691650390625, -0.367584228515625, -0.3498992919921875, -0.33221435546875, -0.3145294189453125, -0.296844482421875, -0.2791595458984375, -0.261474609375, -0.2437896728515625, -0.226104736328125, -0.2084197998046875, -0.19073486328125, -0.1730499267578125, -0.155364990234375, -0.1376800537109375, -0.1199951171875, -0.1023101806640625, -0.084625244140625, -0.0669403076171875, -0.04925537109375, -0.0315704345703125, -0.013885498046875, 0.0037994384765625, 0.021484375, 0.0391693115234375, 0.056854248046875, 0.0745391845703125, 0.09222412109375, 0.1099090576171875, 0.127593994140625, 0.1452789306640625, 0.1629638671875, 0.1806488037109375, 0.198333740234375, 0.2160186767578125, 0.23370361328125, 0.2513885498046875, 0.269073486328125, 0.2867584228515625, 0.304443359375, 0.3221282958984375, 0.339813232421875, 0.3574981689453125, 0.37518310546875, 0.3928680419921875, 0.410552978515625, 0.4282379150390625, 0.4459228515625, 0.4636077880859375, 0.481292724609375, 0.4989776611328125, 0.51666259765625, 0.5343475341796875, 0.552032470703125, 0.5697174072265625, 0.58740234375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 20.0, 17.0, 10.0, 22.0, 26.0, 48.0, 34.0, 54.0, 65.0, 58.0, 55.0, 76.0, 77.0, 72.0, 66.0, 55.0, 44.0, 41.0, 28.0, 26.0, 17.0, 21.0, 13.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021991729736328125, -0.002132803201675415, -0.0020664334297180176, -0.00200006365776062, -0.0019336938858032227, -0.0018673241138458252, -0.0018009543418884277, -0.0017345845699310303, -0.0016682147979736328, -0.0016018450260162354, -0.0015354752540588379, -0.0014691054821014404, -0.001402735710144043, -0.0013363659381866455, -0.001269996166229248, -0.0012036263942718506, -0.0011372566223144531, -0.0010708868503570557, -0.0010045170783996582, -0.0009381473064422607, -0.0008717775344848633, -0.0008054077625274658, -0.0007390379905700684, -0.0006726682186126709, -0.0006062984466552734, -0.000539928674697876, -0.0004735589027404785, -0.00040718913078308105, -0.0003408193588256836, -0.00027444958686828613, -0.00020807981491088867, -0.0001417100429534912, -7.534027099609375e-05, -8.970499038696289e-06, 5.739927291870117e-05, 0.00012376904487609863, 0.0001901388168334961, 0.00025650858879089355, 0.000322878360748291, 0.0003892481327056885, 0.00045561790466308594, 0.0005219876766204834, 0.0005883574485778809, 0.0006547272205352783, 0.0007210969924926758, 0.0007874667644500732, 0.0008538365364074707, 0.0009202063083648682, 0.0009865760803222656, 0.001052945852279663, 0.0011193156242370605, 0.001185685396194458, 0.0012520551681518555, 0.001318424940109253, 0.0013847947120666504, 0.0014511644840240479, 0.0015175342559814453, 0.0015839040279388428, 0.0016502737998962402, 0.0017166435718536377, 0.0017830133438110352, 0.0018493831157684326, 0.00191575288772583, 0.0019821226596832275, 0.002048492431640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 12.0, 23.0, 30.0, 42.0, 47.0, 75.0, 104.0, 176.0, 278.0, 559.0, 6904.0, 1037004.0, 2080.0, 475.0, 244.0, 145.0, 83.0, 69.0, 50.0, 39.0, 33.0, 22.0, 12.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04803466796875, -0.04655170440673828, -0.04506874084472656, -0.043585777282714844, -0.042102813720703125, -0.040619850158691406, -0.03913688659667969, -0.03765392303466797, -0.03617095947265625, -0.03468799591064453, -0.03320503234863281, -0.031722068786621094, -0.030239105224609375, -0.028756141662597656, -0.027273178100585938, -0.02579021453857422, -0.0243072509765625, -0.02282428741455078, -0.021341323852539062, -0.019858360290527344, -0.018375396728515625, -0.016892433166503906, -0.015409469604492188, -0.013926506042480469, -0.01244354248046875, -0.010960578918457031, -0.009477615356445312, -0.007994651794433594, -0.006511688232421875, -0.005028724670410156, -0.0035457611083984375, -0.0020627975463867188, -0.000579833984375, 0.0009031295776367188, 0.0023860931396484375, 0.0038690567016601562, 0.005352020263671875, 0.006834983825683594, 0.008317947387695312, 0.009800910949707031, 0.01128387451171875, 0.012766838073730469, 0.014249801635742188, 0.015732765197753906, 0.017215728759765625, 0.018698692321777344, 0.020181655883789062, 0.02166461944580078, 0.0231475830078125, 0.02463054656982422, 0.026113510131835938, 0.027596473693847656, 0.029079437255859375, 0.030562400817871094, 0.03204536437988281, 0.03352832794189453, 0.03501129150390625, 0.03649425506591797, 0.03797721862792969, 0.039460182189941406, 0.040943145751953125, 0.042426109313964844, 0.04390907287597656, 0.04539203643798828, 0.046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 54.0, 275.0, 412.0, 216.0, 32.0, 12.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0056892018765211105, -0.005578573327511549, -0.0054679447785019875, -0.005357316695153713, -0.005246688146144152, -0.00513605959713459, -0.005025431048125029, -0.004914802499115467, -0.004804174415767193, -0.004693545866757631, -0.00458291731774807, -0.0044722892343997955, -0.004361660685390234, -0.0042510321363806725, -0.004140403587371111, -0.004029775038361549, -0.003919146955013275, -0.0038085184060037136, -0.0036978900898247957, -0.003587261540815234, -0.0034766332246363163, -0.0033660046756267548, -0.0032553761266171932, -0.0031447478104382753, -0.00303411902859807, -0.0029234904795885086, -0.0028128621634095907, -0.002702233614400029, -0.0025916052982211113, -0.0024809767492115498, -0.0023703482002019882, -0.0022597198840230703, -0.0021490915678441525, -0.002038463018834591, -0.001927834702655673, -0.0018172061536461115, -0.0017065778374671936, -0.001595949288457632, -0.0014853208558633924, -0.0013746924232691526, -0.001264063874259591, -0.0011534354416653514, -0.0010428070090711117, -0.000932178518269211, -0.0008215500856749713, -0.0007109216530807316, -0.000600293162278831, -0.0004896647296845913, -0.0003790362970903516, -0.00026840786449611187, -0.0001577794027980417, -4.715094109997153e-05, 6.347749149426818e-05, 0.0001741059240885079, 0.0002847344148904085, 0.00039536284748464823, 0.0005059912800788879, 0.0006166197126731277, 0.0007272481452673674, 0.000837876636069268, 0.0009485050686635077, 0.0010591335594654083, 0.001169761992059648, 0.0012803904246538877, 0.0013910188572481275]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 12.0, 16.0, 18.0, 9.0, 15.0, 14.0, 17.0, 15.0, 23.0, 21.0, 24.0, 30.0, 28.0, 20.0, 32.0, 40.0, 40.0, 29.0, 40.0, 43.0, 46.0, 44.0, 39.0, 36.0, 29.0, 40.0, 21.0, 32.0, 35.0, 25.0, 21.0, 14.0, 21.0, 13.0, 9.0, 13.0, 6.0, 6.0, 8.0, 8.0, 1.0, 4.0, 4.0, 9.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0008816123008728027, -0.0008549988269805908, -0.0008283853530883789, -0.000801771879196167, -0.0007751584053039551, -0.0007485449314117432, -0.0007219314575195312, -0.0006953179836273193, -0.0006687045097351074, -0.0006420910358428955, -0.0006154775619506836, -0.0005888640880584717, -0.0005622506141662598, -0.0005356371402740479, -0.0005090236663818359, -0.000482410192489624, -0.0004557967185974121, -0.0004291832447052002, -0.0004025697708129883, -0.00037595629692077637, -0.00034934282302856445, -0.00032272934913635254, -0.0002961158752441406, -0.0002695024013519287, -0.0002428889274597168, -0.00021627545356750488, -0.00018966197967529297, -0.00016304850578308105, -0.00013643503189086914, -0.00010982155799865723, -8.320808410644531e-05, -5.65946102142334e-05, -2.9981136322021484e-05, -3.3676624298095703e-06, 2.3245811462402344e-05, 4.985928535461426e-05, 7.647275924682617e-05, 0.00010308623313903809, 0.00012969970703125, 0.00015631318092346191, 0.00018292665481567383, 0.00020954012870788574, 0.00023615360260009766, 0.00026276707649230957, 0.0002893805503845215, 0.0003159940242767334, 0.0003426074981689453, 0.0003692209720611572, 0.00039583444595336914, 0.00042244791984558105, 0.00044906139373779297, 0.0004756748676300049, 0.0005022883415222168, 0.0005289018154144287, 0.0005555152893066406, 0.0005821287631988525, 0.0006087422370910645, 0.0006353557109832764, 0.0006619691848754883, 0.0006885826587677002, 0.0007151961326599121, 0.000741809606552124, 0.0007684230804443359, 0.0007950365543365479, 0.0008216500282287598]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 10.0, 11.0, 16.0, 19.0, 29.0, 26.0, 36.0, 36.0, 32.0, 47.0, 49.0, 49.0, 53.0, 58.0, 52.0, 50.0, 47.0, 48.0, 47.0, 42.0, 36.0, 35.0, 31.0, 30.0, 24.0, 22.0, 21.0, 9.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.398681640625, -5.19580078125, -4.992919921875, -4.7900390625, -4.587158203125, -4.38427734375, -4.181396484375, -3.978515625, -3.775634765625, -3.57275390625, -3.369873046875, -3.1669921875, -2.964111328125, -2.76123046875, -2.558349609375, -2.35546875, -2.152587890625, -1.94970703125, -1.746826171875, -1.5439453125, -1.341064453125, -1.13818359375, -0.935302734375, -0.732421875, -0.529541015625, -0.32666015625, -0.123779296875, 0.0791015625, 0.281982421875, 0.48486328125, 0.687744140625, 0.890625, 1.093505859375, 1.29638671875, 1.499267578125, 1.7021484375, 1.905029296875, 2.10791015625, 2.310791015625, 2.513671875, 2.716552734375, 2.91943359375, 3.122314453125, 3.3251953125, 3.528076171875, 3.73095703125, 3.933837890625, 4.13671875, 4.339599609375, 4.54248046875, 4.745361328125, 4.9482421875, 5.151123046875, 5.35400390625, 5.556884765625, 5.759765625, 5.962646484375, 6.16552734375, 6.368408203125, 6.5712890625, 6.774169921875, 6.97705078125, 7.179931640625, 7.3828125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 4.0, 15.0, 26.0, 24.0, 34.0, 56.0, 75.0, 135.0, 175.0, 298.0, 464.0, 668.0, 1178.0, 2165.0, 4293.0, 9651.0, 27111.0, 109613.0, 533540.0, 274326.0, 54937.0, 16114.0, 6384.0, 3109.0, 1641.0, 927.0, 553.0, 357.0, 204.0, 143.0, 108.0, 68.0, 42.0, 32.0, 22.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.708984375, -3.575408935546875, -3.44183349609375, -3.308258056640625, -3.1746826171875, -3.041107177734375, -2.90753173828125, -2.773956298828125, -2.640380859375, -2.506805419921875, -2.37322998046875, -2.239654541015625, -2.1060791015625, -1.972503662109375, -1.83892822265625, -1.705352783203125, -1.57177734375, -1.438201904296875, -1.30462646484375, -1.171051025390625, -1.0374755859375, -0.903900146484375, -0.77032470703125, -0.636749267578125, -0.503173828125, -0.369598388671875, -0.23602294921875, -0.102447509765625, 0.0311279296875, 0.164703369140625, 0.29827880859375, 0.431854248046875, 0.5654296875, 0.699005126953125, 0.83258056640625, 0.966156005859375, 1.0997314453125, 1.233306884765625, 1.36688232421875, 1.500457763671875, 1.634033203125, 1.767608642578125, 1.90118408203125, 2.034759521484375, 2.1683349609375, 2.301910400390625, 2.43548583984375, 2.569061279296875, 2.70263671875, 2.836212158203125, 2.96978759765625, 3.103363037109375, 3.2369384765625, 3.370513916015625, 3.50408935546875, 3.637664794921875, 3.771240234375, 3.904815673828125, 4.03839111328125, 4.171966552734375, 4.3055419921875, 4.439117431640625, 4.57269287109375, 4.706268310546875, 4.83984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 8.0, 8.0, 10.0, 10.0, 13.0, 17.0, 18.0, 20.0, 22.0, 32.0, 31.0, 24.0, 31.0, 30.0, 39.0, 40.0, 36.0, 54.0, 328.0, 1726.0, 86.0, 54.0, 34.0, 45.0, 36.0, 40.0, 18.0, 26.0, 19.0, 25.0, 20.0, 22.0, 13.0, 19.0, 8.0, 13.0, 16.0, 12.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7734375, -14.2667236328125, -13.760009765625, -13.2532958984375, -12.74658203125, -12.2398681640625, -11.733154296875, -11.2264404296875, -10.7197265625, -10.2130126953125, -9.706298828125, -9.1995849609375, -8.69287109375, -8.1861572265625, -7.679443359375, -7.1727294921875, -6.666015625, -6.1593017578125, -5.652587890625, -5.1458740234375, -4.63916015625, -4.1324462890625, -3.625732421875, -3.1190185546875, -2.6123046875, -2.1055908203125, -1.598876953125, -1.0921630859375, -0.58544921875, -0.0787353515625, 0.427978515625, 0.9346923828125, 1.44140625, 1.9481201171875, 2.454833984375, 2.9615478515625, 3.46826171875, 3.9749755859375, 4.481689453125, 4.9884033203125, 5.4951171875, 6.0018310546875, 6.508544921875, 7.0152587890625, 7.52197265625, 8.0286865234375, 8.535400390625, 9.0421142578125, 9.548828125, 10.0555419921875, 10.562255859375, 11.0689697265625, 11.57568359375, 12.0823974609375, 12.589111328125, 13.0958251953125, 13.6025390625, 14.1092529296875, 14.615966796875, 15.1226806640625, 15.62939453125, 16.1361083984375, 16.642822265625, 17.1495361328125, 17.65625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 14.0, 6.0, 13.0, 17.0, 12.0, 10.0, 15.0, 15.0, 28.0, 20.0, 24.0, 31.0, 37.0, 66.0, 107.0, 154.0, 234.0, 353.0, 990.0, 9216.0, 3054018.0, 76953.0, 1926.0, 558.0, 256.0, 161.0, 108.0, 88.0, 41.0, 36.0, 42.0, 27.0, 21.0, 20.0, 17.0, 9.0, 12.0, 10.0, 5.0, 8.0, 9.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-29.171875, -28.33154296875, -27.4912109375, -26.65087890625, -25.810546875, -24.97021484375, -24.1298828125, -23.28955078125, -22.44921875, -21.60888671875, -20.7685546875, -19.92822265625, -19.087890625, -18.24755859375, -17.4072265625, -16.56689453125, -15.7265625, -14.88623046875, -14.0458984375, -13.20556640625, -12.365234375, -11.52490234375, -10.6845703125, -9.84423828125, -9.00390625, -8.16357421875, -7.3232421875, -6.48291015625, -5.642578125, -4.80224609375, -3.9619140625, -3.12158203125, -2.28125, -1.44091796875, -0.6005859375, 0.23974609375, 1.080078125, 1.92041015625, 2.7607421875, 3.60107421875, 4.44140625, 5.28173828125, 6.1220703125, 6.96240234375, 7.802734375, 8.64306640625, 9.4833984375, 10.32373046875, 11.1640625, 12.00439453125, 12.8447265625, 13.68505859375, 14.525390625, 15.36572265625, 16.2060546875, 17.04638671875, 17.88671875, 18.72705078125, 19.5673828125, 20.40771484375, 21.248046875, 22.08837890625, 22.9287109375, 23.76904296875, 24.609375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 200.0, 581.0, 209.0, 17.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.26148986816406, -94.39361572265625, -92.5257339477539, -90.6578598022461, -88.78998565673828, -86.92210388183594, -85.05422973632812, -83.18635559082031, -81.3184814453125, -79.45060729980469, -77.58272552490234, -75.71485137939453, -73.84697723388672, -71.97909545898438, -70.11122131347656, -68.24334716796875, -66.3754653930664, -64.5075912475586, -62.639713287353516, -60.77183532714844, -58.903961181640625, -57.03608322143555, -55.16820526123047, -53.300331115722656, -51.43245315551758, -49.5645751953125, -47.69670104980469, -45.82882308959961, -43.96094512939453, -42.09307098388672, -40.22519302368164, -38.35731506347656, -36.489437103271484, -34.621559143066406, -32.753684997558594, -30.885807037353516, -29.01793098449707, -27.150054931640625, -25.282176971435547, -23.4143009185791, -21.546424865722656, -19.67854881286621, -17.810672760009766, -15.942794799804688, -14.074918746948242, -12.207042694091797, -10.339165687561035, -8.471288681030273, -6.603412628173828, -4.735536098480225, -2.867659568786621, -0.9997830390930176, 0.8680934906005859, 2.7359695434570312, 4.603846549987793, 6.471723556518555, 8.339599609375, 10.207475662231445, 12.075352668762207, 13.943229675292969, 15.811105728149414, 17.67898178100586, 19.546859741210938, 21.414735794067383, 23.282611846923828]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 9.0, 4.0, 7.0, 10.0, 12.0, 10.0, 6.0, 24.0, 12.0, 22.0, 21.0, 25.0, 28.0, 33.0, 39.0, 37.0, 31.0, 44.0, 38.0, 45.0, 44.0, 47.0, 33.0, 42.0, 32.0, 38.0, 34.0, 38.0, 29.0, 30.0, 17.0, 25.0, 19.0, 29.0, 18.0, 8.0, 8.0, 9.0, 10.0, 4.0, 11.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.57497787475586, -45.91034698486328, -44.24571990966797, -42.58108901977539, -40.91645812988281, -39.2518310546875, -37.58720016479492, -35.922569274902344, -34.25794219970703, -32.59331130981445, -30.928682327270508, -29.264053344726562, -27.599422454833984, -25.93479347229004, -24.270164489746094, -22.605533599853516, -20.940902709960938, -19.276273727416992, -17.611642837524414, -15.947013854980469, -14.282383918762207, -12.617753982543945, -10.953125, -9.288495063781738, -7.623865127563477, -5.959235191345215, -4.294605731964111, -2.629976272583008, -0.9653463363647461, 0.6992835998535156, 2.363912582397461, 4.028542518615723, 5.693168640136719, 7.3577985763549805, 9.022428512573242, 10.687057495117188, 12.35168743133545, 14.016317367553711, 15.680946350097656, 17.345577239990234, 19.01020622253418, 20.674835205078125, 22.339466094970703, 24.00409507751465, 25.668724060058594, 27.333354949951172, 28.997983932495117, 30.662612915039062, 32.32724380493164, 33.99187469482422, 35.65650177001953, 37.32113265991211, 38.98576354980469, 40.650390625, 42.31502151489258, 43.979652404785156, 45.64427947998047, 47.30891036987305, 48.97353744506836, 50.63816833496094, 52.302799224853516, 53.967430114746094, 55.632057189941406, 57.296688079833984, 58.96131896972656]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 17.0, 13.0, 26.0, 25.0, 33.0, 37.0, 34.0, 35.0, 52.0, 43.0, 51.0, 63.0, 47.0, 55.0, 53.0, 33.0, 45.0, 62.0, 37.0, 27.0, 35.0, 31.0, 31.0, 25.0, 17.0, 20.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.53131103515625, -5.3282470703125, -5.12518310546875, -4.922119140625, -4.71905517578125, -4.5159912109375, -4.31292724609375, -4.10986328125, -3.90679931640625, -3.7037353515625, -3.50067138671875, -3.297607421875, -3.09454345703125, -2.8914794921875, -2.68841552734375, -2.4853515625, -2.28228759765625, -2.0792236328125, -1.87615966796875, -1.673095703125, -1.47003173828125, -1.2669677734375, -1.06390380859375, -0.86083984375, -0.65777587890625, -0.4547119140625, -0.25164794921875, -0.048583984375, 0.15447998046875, 0.3575439453125, 0.56060791015625, 0.763671875, 0.96673583984375, 1.1697998046875, 1.37286376953125, 1.575927734375, 1.77899169921875, 1.9820556640625, 2.18511962890625, 2.38818359375, 2.59124755859375, 2.7943115234375, 2.99737548828125, 3.200439453125, 3.40350341796875, 3.6065673828125, 3.80963134765625, 4.0126953125, 4.21575927734375, 4.4188232421875, 4.62188720703125, 4.824951171875, 5.02801513671875, 5.2310791015625, 5.43414306640625, 5.63720703125, 5.84027099609375, 6.0433349609375, 6.24639892578125, 6.449462890625, 6.65252685546875, 6.8555908203125, 7.05865478515625, 7.26171875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 7.0, 5.0, 7.0, 24.0, 16.0, 31.0, 45.0, 68.0, 101.0, 209.0, 449.0, 1090.0, 3314.0, 11765.0, 52944.0, 373463.0, 2314531.0, 1259168.0, 141137.0, 25830.0, 6537.0, 2049.0, 742.0, 300.0, 160.0, 86.0, 52.0, 33.0, 25.0, 16.0, 20.0, 8.0, 6.0, 6.0, 8.0, 6.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7384033203125, -10.351806640625, -9.9652099609375, -9.57861328125, -9.1920166015625, -8.805419921875, -8.4188232421875, -8.0322265625, -7.6456298828125, -7.259033203125, -6.8724365234375, -6.48583984375, -6.0992431640625, -5.712646484375, -5.3260498046875, -4.939453125, -4.5528564453125, -4.166259765625, -3.7796630859375, -3.39306640625, -3.0064697265625, -2.619873046875, -2.2332763671875, -1.8466796875, -1.4600830078125, -1.073486328125, -0.6868896484375, -0.30029296875, 0.0863037109375, 0.472900390625, 0.8594970703125, 1.24609375, 1.6326904296875, 2.019287109375, 2.4058837890625, 2.79248046875, 3.1790771484375, 3.565673828125, 3.9522705078125, 4.3388671875, 4.7254638671875, 5.112060546875, 5.4986572265625, 5.88525390625, 6.2718505859375, 6.658447265625, 7.0450439453125, 7.431640625, 7.8182373046875, 8.204833984375, 8.5914306640625, 8.97802734375, 9.3646240234375, 9.751220703125, 10.1378173828125, 10.5244140625, 10.9110107421875, 11.297607421875, 11.6842041015625, 12.07080078125, 12.4573974609375, 12.843994140625, 13.2305908203125, 13.6171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 7.0, 7.0, 16.0, 17.0, 14.0, 23.0, 21.0, 37.0, 42.0, 70.0, 72.0, 103.0, 114.0, 140.0, 193.0, 220.0, 300.0, 358.0, 384.0, 342.0, 305.0, 252.0, 214.0, 160.0, 152.0, 116.0, 85.0, 63.0, 54.0, 29.0, 30.0, 29.0, 21.0, 10.0, 14.0, 14.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.21875, -10.8651123046875, -10.511474609375, -10.1578369140625, -9.80419921875, -9.4505615234375, -9.096923828125, -8.7432861328125, -8.3896484375, -8.0360107421875, -7.682373046875, -7.3287353515625, -6.97509765625, -6.6214599609375, -6.267822265625, -5.9141845703125, -5.560546875, -5.2069091796875, -4.853271484375, -4.4996337890625, -4.14599609375, -3.7923583984375, -3.438720703125, -3.0850830078125, -2.7314453125, -2.3778076171875, -2.024169921875, -1.6705322265625, -1.31689453125, -0.9632568359375, -0.609619140625, -0.2559814453125, 0.09765625, 0.4512939453125, 0.804931640625, 1.1585693359375, 1.51220703125, 1.8658447265625, 2.219482421875, 2.5731201171875, 2.9267578125, 3.2803955078125, 3.634033203125, 3.9876708984375, 4.34130859375, 4.6949462890625, 5.048583984375, 5.4022216796875, 5.755859375, 6.1094970703125, 6.463134765625, 6.8167724609375, 7.17041015625, 7.5240478515625, 7.877685546875, 8.2313232421875, 8.5849609375, 8.9385986328125, 9.292236328125, 9.6458740234375, 9.99951171875, 10.3531494140625, 10.706787109375, 11.0604248046875, 11.4140625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 11.0, 12.0, 19.0, 29.0, 45.0, 57.0, 69.0, 101.0, 164.0, 281.0, 711.0, 3474.0, 80223.0, 3784969.0, 314229.0, 7927.0, 1038.0, 327.0, 176.0, 110.0, 72.0, 52.0, 39.0, 35.0, 17.0, 21.0, 18.0, 10.0, 6.0, 7.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.96875, -42.37890625, -40.7890625, -39.19921875, -37.609375, -36.01953125, -34.4296875, -32.83984375, -31.25, -29.66015625, -28.0703125, -26.48046875, -24.890625, -23.30078125, -21.7109375, -20.12109375, -18.53125, -16.94140625, -15.3515625, -13.76171875, -12.171875, -10.58203125, -8.9921875, -7.40234375, -5.8125, -4.22265625, -2.6328125, -1.04296875, 0.546875, 2.13671875, 3.7265625, 5.31640625, 6.90625, 8.49609375, 10.0859375, 11.67578125, 13.265625, 14.85546875, 16.4453125, 18.03515625, 19.625, 21.21484375, 22.8046875, 24.39453125, 25.984375, 27.57421875, 29.1640625, 30.75390625, 32.34375, 33.93359375, 35.5234375, 37.11328125, 38.703125, 40.29296875, 41.8828125, 43.47265625, 45.0625, 46.65234375, 48.2421875, 49.83203125, 51.421875, 53.01171875, 54.6015625, 56.19140625, 57.78125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [25.0, 103.0, 294.0, 350.0, 188.0, 50.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.158655166625977, -13.8875093460083, -7.616363525390625, -1.3452167510986328, 4.925928115844727, 11.197072982788086, 17.46822166442871, 23.73936653137207, 30.01051139831543, 36.28165817260742, 42.55280303955078, 48.823951721191406, 55.0950927734375, 61.366241455078125, 67.63739013671875, 73.90853118896484, 80.17967987060547, 86.4508285522461, 92.72196960449219, 98.99311828613281, 105.26426696777344, 111.53540802001953, 117.80655670166016, 124.07769775390625, 130.34884643554688, 136.6199951171875, 142.89114379882812, 149.16229248046875, 155.4334259033203, 161.70457458496094, 167.97572326660156, 174.2468719482422, 180.51800537109375, 186.78915405273438, 193.060302734375, 199.33145141601562, 205.6025848388672, 211.8737335205078, 218.14488220214844, 224.41603088378906, 230.68716430664062, 236.95831298828125, 243.22946166992188, 249.5006103515625, 255.77174377441406, 262.04290771484375, 268.31402587890625, 274.5851745605469, 280.8563232421875, 287.1274719238281, 293.39862060546875, 299.6697692871094, 305.94091796875, 312.2120361328125, 318.48321533203125, 324.75433349609375, 331.0255126953125, 337.2966613769531, 343.56781005859375, 349.8389587402344, 356.110107421875, 362.3812255859375, 368.65240478515625, 374.92352294921875, 381.1946716308594]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 14.0, 15.0, 12.0, 18.0, 26.0, 25.0, 26.0, 25.0, 21.0, 26.0, 32.0, 34.0, 35.0, 35.0, 38.0, 36.0, 36.0, 23.0, 34.0, 42.0, 41.0, 40.0, 28.0, 36.0, 28.0, 27.0, 17.0, 22.0, 22.0, 15.0, 18.0, 17.0, 18.0, 20.0, 12.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.127525329589844, -39.811710357666016, -38.49589538574219, -37.18008041381836, -35.86426544189453, -34.54844665527344, -33.232635498046875, -31.91681671142578, -30.601001739501953, -29.285186767578125, -27.969371795654297, -26.65355682373047, -25.337739944458008, -24.02192497253418, -22.70611000061035, -21.39029312133789, -20.074480056762695, -18.758665084838867, -17.44285011291504, -16.127033233642578, -14.81121826171875, -13.495403289794922, -12.179588317871094, -10.86377239227295, -9.547957420349121, -8.232142448425293, -6.916326522827148, -5.60051155090332, -4.284696102142334, -2.9688806533813477, -1.6530656814575195, -0.337249755859375, 0.9785652160644531, 2.2943806648254395, 3.6101958751678467, 4.926011085510254, 6.24182653427124, 7.557641983032227, 8.873456954956055, 10.1892728805542, 11.505087852478027, 12.820902824401855, 14.13671875, 15.452533721923828, 16.768348693847656, 18.084163665771484, 19.399978637695312, 20.715795516967773, 22.0316104888916, 23.34742546081543, 24.663240432739258, 25.97905731201172, 27.294872283935547, 28.610687255859375, 29.926502227783203, 31.24231719970703, 32.55813217163086, 33.87394714355469, 35.189762115478516, 36.505577087402344, 37.82139205932617, 39.13720703125, 40.453025817871094, 41.76884078979492, 43.08465576171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 13.0, 11.0, 23.0, 27.0, 33.0, 39.0, 46.0, 35.0, 46.0, 45.0, 50.0, 46.0, 54.0, 48.0, 52.0, 58.0, 42.0, 39.0, 40.0, 40.0, 29.0, 35.0, 28.0, 21.0, 15.0, 10.0, 20.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.72491455078125, -5.5201416015625, -5.31536865234375, -5.110595703125, -4.90582275390625, -4.7010498046875, -4.49627685546875, -4.29150390625, -4.08673095703125, -3.8819580078125, -3.67718505859375, -3.472412109375, -3.26763916015625, -3.0628662109375, -2.85809326171875, -2.6533203125, -2.44854736328125, -2.2437744140625, -2.03900146484375, -1.834228515625, -1.62945556640625, -1.4246826171875, -1.21990966796875, -1.01513671875, -0.81036376953125, -0.6055908203125, -0.40081787109375, -0.196044921875, 0.00872802734375, 0.2135009765625, 0.41827392578125, 0.623046875, 0.82781982421875, 1.0325927734375, 1.23736572265625, 1.442138671875, 1.64691162109375, 1.8516845703125, 2.05645751953125, 2.26123046875, 2.46600341796875, 2.6707763671875, 2.87554931640625, 3.080322265625, 3.28509521484375, 3.4898681640625, 3.69464111328125, 3.8994140625, 4.10418701171875, 4.3089599609375, 4.51373291015625, 4.718505859375, 4.92327880859375, 5.1280517578125, 5.33282470703125, 5.53759765625, 5.74237060546875, 5.9471435546875, 6.15191650390625, 6.356689453125, 6.56146240234375, 6.7662353515625, 6.97100830078125, 7.17578125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 17.0, 18.0, 29.0, 45.0, 89.0, 95.0, 176.0, 237.0, 319.0, 457.0, 672.0, 962.0, 1387.0, 1962.0, 2792.0, 4023.0, 5742.0, 8281.0, 11973.0, 17406.0, 26136.0, 40403.0, 64095.0, 109601.0, 197621.0, 220800.0, 125596.0, 72522.0, 44546.0, 28792.0, 19338.0, 12896.0, 8879.0, 6196.0, 4345.0, 3045.0, 2126.0, 1524.0, 1027.0, 747.0, 507.0, 352.0, 254.0, 157.0, 123.0, 80.0, 47.0, 36.0, 18.0, 25.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.68701171875, -0.665618896484375, -0.64422607421875, -0.622833251953125, -0.6014404296875, -0.580047607421875, -0.55865478515625, -0.537261962890625, -0.515869140625, -0.494476318359375, -0.47308349609375, -0.451690673828125, -0.4302978515625, -0.408905029296875, -0.38751220703125, -0.366119384765625, -0.3447265625, -0.323333740234375, -0.30194091796875, -0.280548095703125, -0.2591552734375, -0.237762451171875, -0.21636962890625, -0.194976806640625, -0.173583984375, -0.152191162109375, -0.13079833984375, -0.109405517578125, -0.0880126953125, -0.066619873046875, -0.04522705078125, -0.023834228515625, -0.00244140625, 0.018951416015625, 0.04034423828125, 0.061737060546875, 0.0831298828125, 0.104522705078125, 0.12591552734375, 0.147308349609375, 0.168701171875, 0.190093994140625, 0.21148681640625, 0.232879638671875, 0.2542724609375, 0.275665283203125, 0.29705810546875, 0.318450927734375, 0.33984375, 0.361236572265625, 0.38262939453125, 0.404022216796875, 0.4254150390625, 0.446807861328125, 0.46820068359375, 0.489593505859375, 0.510986328125, 0.532379150390625, 0.55377197265625, 0.575164794921875, 0.5965576171875, 0.617950439453125, 0.63934326171875, 0.660736083984375, 0.68212890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 12.0, 14.0, 15.0, 19.0, 17.0, 26.0, 29.0, 28.0, 28.0, 29.0, 38.0, 49.0, 48.0, 39.0, 48.0, 37.0, 1055.0, 30.0, 43.0, 28.0, 32.0, 32.0, 27.0, 31.0, 27.0, 24.0, 24.0, 35.0, 14.0, 16.0, 15.0, 12.0, 13.0, 13.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.45703125, -3.353363037109375, -3.24969482421875, -3.146026611328125, -3.0423583984375, -2.938690185546875, -2.83502197265625, -2.731353759765625, -2.627685546875, -2.524017333984375, -2.42034912109375, -2.316680908203125, -2.2130126953125, -2.109344482421875, -2.00567626953125, -1.902008056640625, -1.79833984375, -1.694671630859375, -1.59100341796875, -1.487335205078125, -1.3836669921875, -1.279998779296875, -1.17633056640625, -1.072662353515625, -0.968994140625, -0.865325927734375, -0.76165771484375, -0.657989501953125, -0.5543212890625, -0.450653076171875, -0.34698486328125, -0.243316650390625, -0.1396484375, -0.035980224609375, 0.06768798828125, 0.171356201171875, 0.2750244140625, 0.378692626953125, 0.48236083984375, 0.586029052734375, 0.689697265625, 0.793365478515625, 0.89703369140625, 1.000701904296875, 1.1043701171875, 1.208038330078125, 1.31170654296875, 1.415374755859375, 1.51904296875, 1.622711181640625, 1.72637939453125, 1.830047607421875, 1.9337158203125, 2.037384033203125, 2.14105224609375, 2.244720458984375, 2.348388671875, 2.452056884765625, 2.55572509765625, 2.659393310546875, 2.7630615234375, 2.866729736328125, 2.97039794921875, 3.074066162109375, 3.177734375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 13.0, 14.0, 23.0, 39.0, 62.0, 94.0, 130.0, 194.0, 260.0, 390.0, 491.0, 707.0, 1014.0, 1453.0, 2035.0, 2900.0, 4345.0, 6385.0, 9559.0, 14029.0, 21573.0, 33255.0, 53647.0, 90944.0, 167073.0, 1289496.0, 161436.0, 88231.0, 51760.0, 32190.0, 20419.0, 13651.0, 9057.0, 6153.0, 4246.0, 2898.0, 2003.0, 1419.0, 1036.0, 712.0, 528.0, 407.0, 248.0, 190.0, 137.0, 101.0, 64.0, 43.0, 26.0, 17.0, 12.0, 10.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59375, -0.5748825073242188, -0.5560150146484375, -0.5371475219726562, -0.518280029296875, -0.49941253662109375, -0.4805450439453125, -0.46167755126953125, -0.44281005859375, -0.42394256591796875, -0.4050750732421875, -0.38620758056640625, -0.367340087890625, -0.34847259521484375, -0.3296051025390625, -0.31073760986328125, -0.2918701171875, -0.27300262451171875, -0.2541351318359375, -0.23526763916015625, -0.216400146484375, -0.19753265380859375, -0.1786651611328125, -0.15979766845703125, -0.14093017578125, -0.12206268310546875, -0.1031951904296875, -0.08432769775390625, -0.065460205078125, -0.04659271240234375, -0.0277252197265625, -0.00885772705078125, 0.010009765625, 0.02887725830078125, 0.0477447509765625, 0.06661224365234375, 0.085479736328125, 0.10434722900390625, 0.1232147216796875, 0.14208221435546875, 0.16094970703125, 0.17981719970703125, 0.1986846923828125, 0.21755218505859375, 0.236419677734375, 0.25528717041015625, 0.2741546630859375, 0.29302215576171875, 0.3118896484375, 0.33075714111328125, 0.3496246337890625, 0.36849212646484375, 0.387359619140625, 0.40622711181640625, 0.4250946044921875, 0.44396209716796875, 0.46282958984375, 0.48169708251953125, 0.5005645751953125, 0.5194320678710938, 0.538299560546875, 0.5571670532226562, 0.5760345458984375, 0.5949020385742188, 0.61376953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 10.0, 12.0, 14.0, 13.0, 30.0, 40.0, 43.0, 57.0, 69.0, 94.0, 88.0, 90.0, 101.0, 73.0, 56.0, 50.0, 31.0, 32.0, 17.0, 19.0, 5.0, 3.0, 11.0, 3.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0026950836181640625, -0.0026199519634246826, -0.0025448203086853027, -0.002469688653945923, -0.002394556999206543, -0.002319425344467163, -0.002244293689727783, -0.0021691620349884033, -0.0020940303802490234, -0.0020188987255096436, -0.0019437670707702637, -0.0018686354160308838, -0.001793503761291504, -0.001718372106552124, -0.0016432404518127441, -0.0015681087970733643, -0.0014929771423339844, -0.0014178454875946045, -0.0013427138328552246, -0.0012675821781158447, -0.0011924505233764648, -0.001117318868637085, -0.001042187213897705, -0.0009670555591583252, -0.0008919239044189453, -0.0008167922496795654, -0.0007416605949401855, -0.0006665289402008057, -0.0005913972854614258, -0.0005162656307220459, -0.000441133975982666, -0.00036600232124328613, -0.00029087066650390625, -0.00021573901176452637, -0.00014060735702514648, -6.54757022857666e-05, 9.655952453613281e-06, 8.478760719299316e-05, 0.00015991926193237305, 0.00023505091667175293, 0.0003101825714111328, 0.0003853142261505127, 0.0004604458808898926, 0.0005355775356292725, 0.0006107091903686523, 0.0006858408451080322, 0.0007609724998474121, 0.000836104154586792, 0.0009112358093261719, 0.0009863674640655518, 0.0010614991188049316, 0.0011366307735443115, 0.0012117624282836914, 0.0012868940830230713, 0.0013620257377624512, 0.001437157392501831, 0.001512289047241211, 0.0015874207019805908, 0.0016625523567199707, 0.0017376840114593506, 0.0018128156661987305, 0.0018879473209381104, 0.0019630789756774902, 0.00203821063041687, 0.00211334228515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 14.0, 9.0, 11.0, 27.0, 32.0, 36.0, 56.0, 67.0, 81.0, 135.0, 199.0, 383.0, 925.0, 136856.0, 906883.0, 1587.0, 453.0, 263.0, 178.0, 93.0, 59.0, 48.0, 31.0, 31.0, 25.0, 13.0, 18.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0426025390625, -0.041234493255615234, -0.03986644744873047, -0.0384984016418457, -0.03713035583496094, -0.03576231002807617, -0.034394264221191406, -0.03302621841430664, -0.031658172607421875, -0.03029012680053711, -0.028922080993652344, -0.027554035186767578, -0.026185989379882812, -0.024817943572998047, -0.02344989776611328, -0.022081851959228516, -0.02071380615234375, -0.019345760345458984, -0.01797771453857422, -0.016609668731689453, -0.015241622924804688, -0.013873577117919922, -0.012505531311035156, -0.01113748550415039, -0.009769439697265625, -0.00840139389038086, -0.007033348083496094, -0.005665302276611328, -0.0042972564697265625, -0.002929210662841797, -0.0015611648559570312, -0.00019311904907226562, 0.0011749267578125, 0.0025429725646972656, 0.003911018371582031, 0.005279064178466797, 0.0066471099853515625, 0.008015155792236328, 0.009383201599121094, 0.01075124740600586, 0.012119293212890625, 0.01348733901977539, 0.014855384826660156, 0.016223430633544922, 0.017591476440429688, 0.018959522247314453, 0.02032756805419922, 0.021695613861083984, 0.02306365966796875, 0.024431705474853516, 0.02579975128173828, 0.027167797088623047, 0.028535842895507812, 0.029903888702392578, 0.031271934509277344, 0.03263998031616211, 0.034008026123046875, 0.03537607192993164, 0.036744117736816406, 0.03811216354370117, 0.03948020935058594, 0.0408482551574707, 0.04221630096435547, 0.043584346771240234, 0.044952392578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 14.0, 31.0, 71.0, 165.0, 281.0, 238.0, 131.0, 45.0, 20.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036393117625266314, -0.0035615754313766956, -0.0034838393330574036, -0.003406103001907468, -0.003328366670757532, -0.0032506303396075964, -0.0031728942412883043, -0.0030951579101383686, -0.003017421578988433, -0.002939685247838497, -0.002861949149519205, -0.0027842128183692694, -0.0027064764872193336, -0.002628740156069398, -0.002551004057750106, -0.00247326772660017, -0.002395531628280878, -0.0023177952971309423, -0.0022400591988116503, -0.0021623228676617146, -0.002084586536511779, -0.002006850205361843, -0.001929114107042551, -0.0018513777758926153, -0.0017736414447426796, -0.0016959052300080657, -0.00161816889885813, -0.001540432684123516, -0.0014626963529735804, -0.0013849601382389665, -0.0013072239235043526, -0.0012294875923544168, -0.0011517511447891593, -0.0010740149300545454, -0.0009962785989046097, -0.0009185423841699958, -0.0008408060530200601, -0.0007630698382854462, -0.0006853335653431714, -0.0006075972924008965, -0.0005298610194586217, -0.00045212474651634693, -0.0003743884735740721, -0.00029665222973562777, -0.00021891595679335296, -0.00014117968385107815, -6.34434400126338e-05, 1.4292832929641008e-05, 9.202910587191582e-05, 0.00016976537881419063, 0.00024750165175646544, 0.0003252378955949098, 0.0004029741685371846, 0.0004807104414794594, 0.0005584466853179038, 0.0006361829582601786, 0.0007139192312024534, 0.0007916555041447282, 0.000869391777087003, 0.0009471280500292778, 0.0010248642647638917, 0.0011026005959138274, 0.0011803368106484413, 0.001258073141798377, 0.001335809356532991]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 16.0, 15.0, 17.0, 18.0, 21.0, 19.0, 21.0, 24.0, 33.0, 38.0, 40.0, 37.0, 41.0, 35.0, 41.0, 47.0, 38.0, 35.0, 36.0, 40.0, 38.0, 54.0, 35.0, 24.0, 24.0, 35.0, 27.0, 21.0, 15.0, 13.0, 15.0, 14.0, 13.0, 12.0, 12.0, 4.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009309649467468262, -0.0008998150005936623, -0.0008686650544404984, -0.0008375151082873344, -0.0008063651621341705, -0.0007752152159810066, -0.0007440652698278427, -0.0007129153236746788, -0.0006817653775215149, -0.000650615431368351, -0.0006194654852151871, -0.0005883155390620232, -0.0005571655929088593, -0.0005260156467556953, -0.0004948657006025314, -0.0004637157544493675, -0.0004325658082962036, -0.0004014158621430397, -0.0003702659159898758, -0.0003391159698367119, -0.000307966023683548, -0.00027681607753038406, -0.00024566613137722015, -0.00021451618522405624, -0.00018336623907089233, -0.00015221629291772842, -0.00012106634676456451, -8.99164006114006e-05, -5.8766454458236694e-05, -2.7616508305072784e-05, 3.5334378480911255e-06, 3.4683384001255035e-05, 6.583333015441895e-05, 9.698327630758286e-05, 0.00012813322246074677, 0.00015928316861391068, 0.00019043311476707458, 0.0002215830609202385, 0.0002527330070734024, 0.0002838829532265663, 0.0003150328993797302, 0.00034618284553289413, 0.00037733279168605804, 0.00040848273783922195, 0.00043963268399238586, 0.0004707826301455498, 0.0005019325762987137, 0.0005330825224518776, 0.0005642324686050415, 0.0005953824147582054, 0.0006265323609113693, 0.0006576823070645332, 0.0006888322532176971, 0.000719982199370861, 0.000751132145524025, 0.0007822820916771889, 0.0008134320378303528, 0.0008445819839835167, 0.0008757319301366806, 0.0009068818762898445, 0.0009380318224430084, 0.0009691817685961723, 0.0010003317147493362, 0.0010314816609025002, 0.001062631607055664]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 13.0, 11.0, 23.0, 27.0, 33.0, 39.0, 46.0, 35.0, 46.0, 45.0, 50.0, 46.0, 54.0, 48.0, 52.0, 58.0, 42.0, 39.0, 40.0, 40.0, 29.0, 35.0, 28.0, 21.0, 15.0, 10.0, 20.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.72491455078125, -5.5201416015625, -5.31536865234375, -5.110595703125, -4.90582275390625, -4.7010498046875, -4.49627685546875, -4.29150390625, -4.08673095703125, -3.8819580078125, -3.67718505859375, -3.472412109375, -3.26763916015625, -3.0628662109375, -2.85809326171875, -2.6533203125, -2.44854736328125, -2.2437744140625, -2.03900146484375, -1.834228515625, -1.62945556640625, -1.4246826171875, -1.21990966796875, -1.01513671875, -0.81036376953125, -0.6055908203125, -0.40081787109375, -0.196044921875, 0.00872802734375, 0.2135009765625, 0.41827392578125, 0.623046875, 0.82781982421875, 1.0325927734375, 1.23736572265625, 1.442138671875, 1.64691162109375, 1.8516845703125, 2.05645751953125, 2.26123046875, 2.46600341796875, 2.6707763671875, 2.87554931640625, 3.080322265625, 3.28509521484375, 3.4898681640625, 3.69464111328125, 3.8994140625, 4.10418701171875, 4.3089599609375, 4.51373291015625, 4.718505859375, 4.92327880859375, 5.1280517578125, 5.33282470703125, 5.53759765625, 5.74237060546875, 5.9471435546875, 6.15191650390625, 6.356689453125, 6.56146240234375, 6.7662353515625, 6.97100830078125, 7.17578125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 19.0, 15.0, 36.0, 56.0, 80.0, 124.0, 213.0, 282.0, 531.0, 918.0, 1491.0, 2644.0, 5021.0, 10163.0, 24080.0, 70052.0, 284377.0, 463154.0, 120588.0, 35597.0, 14349.0, 6693.0, 3498.0, 1820.0, 1060.0, 618.0, 401.0, 251.0, 170.0, 92.0, 77.0, 40.0, 19.0, 9.0, 9.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.734375, -3.60650634765625, -3.4786376953125, -3.35076904296875, -3.222900390625, -3.09503173828125, -2.9671630859375, -2.83929443359375, -2.71142578125, -2.58355712890625, -2.4556884765625, -2.32781982421875, -2.199951171875, -2.07208251953125, -1.9442138671875, -1.81634521484375, -1.6884765625, -1.56060791015625, -1.4327392578125, -1.30487060546875, -1.177001953125, -1.04913330078125, -0.9212646484375, -0.79339599609375, -0.66552734375, -0.53765869140625, -0.4097900390625, -0.28192138671875, -0.154052734375, -0.02618408203125, 0.1016845703125, 0.22955322265625, 0.357421875, 0.48529052734375, 0.6131591796875, 0.74102783203125, 0.868896484375, 0.99676513671875, 1.1246337890625, 1.25250244140625, 1.38037109375, 1.50823974609375, 1.6361083984375, 1.76397705078125, 1.891845703125, 2.01971435546875, 2.1475830078125, 2.27545166015625, 2.4033203125, 2.53118896484375, 2.6590576171875, 2.78692626953125, 2.914794921875, 3.04266357421875, 3.1705322265625, 3.29840087890625, 3.42626953125, 3.55413818359375, 3.6820068359375, 3.80987548828125, 3.937744140625, 4.06561279296875, 4.1934814453125, 4.32135009765625, 4.44921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 9.0, 8.0, 13.0, 13.0, 7.0, 18.0, 22.0, 19.0, 29.0, 25.0, 31.0, 29.0, 38.0, 48.0, 33.0, 39.0, 70.0, 505.0, 1562.0, 83.0, 64.0, 40.0, 46.0, 39.0, 33.0, 22.0, 28.0, 26.0, 28.0, 13.0, 12.0, 18.0, 14.0, 13.0, 11.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0], "bins": [-18.5625, -17.9638671875, -17.365234375, -16.7666015625, -16.16796875, -15.5693359375, -14.970703125, -14.3720703125, -13.7734375, -13.1748046875, -12.576171875, -11.9775390625, -11.37890625, -10.7802734375, -10.181640625, -9.5830078125, -8.984375, -8.3857421875, -7.787109375, -7.1884765625, -6.58984375, -5.9912109375, -5.392578125, -4.7939453125, -4.1953125, -3.5966796875, -2.998046875, -2.3994140625, -1.80078125, -1.2021484375, -0.603515625, -0.0048828125, 0.59375, 1.1923828125, 1.791015625, 2.3896484375, 2.98828125, 3.5869140625, 4.185546875, 4.7841796875, 5.3828125, 5.9814453125, 6.580078125, 7.1787109375, 7.77734375, 8.3759765625, 8.974609375, 9.5732421875, 10.171875, 10.7705078125, 11.369140625, 11.9677734375, 12.56640625, 13.1650390625, 13.763671875, 14.3623046875, 14.9609375, 15.5595703125, 16.158203125, 16.7568359375, 17.35546875, 17.9541015625, 18.552734375, 19.1513671875, 19.75]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 15.0, 13.0, 12.0, 17.0, 16.0, 16.0, 27.0, 37.0, 31.0, 51.0, 73.0, 111.0, 158.0, 216.0, 480.0, 1277.0, 28245.0, 3097438.0, 15189.0, 1079.0, 415.0, 238.0, 152.0, 94.0, 51.0, 45.0, 40.0, 23.0, 23.0, 19.0, 16.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.03125, -32.04345703125, -31.0556640625, -30.06787109375, -29.080078125, -28.09228515625, -27.1044921875, -26.11669921875, -25.12890625, -24.14111328125, -23.1533203125, -22.16552734375, -21.177734375, -20.18994140625, -19.2021484375, -18.21435546875, -17.2265625, -16.23876953125, -15.2509765625, -14.26318359375, -13.275390625, -12.28759765625, -11.2998046875, -10.31201171875, -9.32421875, -8.33642578125, -7.3486328125, -6.36083984375, -5.373046875, -4.38525390625, -3.3974609375, -2.40966796875, -1.421875, -0.43408203125, 0.5537109375, 1.54150390625, 2.529296875, 3.51708984375, 4.5048828125, 5.49267578125, 6.48046875, 7.46826171875, 8.4560546875, 9.44384765625, 10.431640625, 11.41943359375, 12.4072265625, 13.39501953125, 14.3828125, 15.37060546875, 16.3583984375, 17.34619140625, 18.333984375, 19.32177734375, 20.3095703125, 21.29736328125, 22.28515625, 23.27294921875, 24.2607421875, 25.24853515625, 26.236328125, 27.22412109375, 28.2119140625, 29.19970703125, 30.1875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [7.0, 24.0, 137.0, 260.0, 310.0, 176.0, 73.0, 19.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9876203536987305, -3.842341899871826, -2.6970632076263428, -1.5517845153808594, -0.4065060615539551, 0.7387723922729492, 1.8840513229370117, 3.029329299926758, 4.17460823059082, 5.319886684417725, 6.465165138244629, 7.610444068908691, 8.755722045898438, 9.9010009765625, 11.046279907226562, 12.191557884216309, 13.336836814880371, 14.482115745544434, 15.62739372253418, 16.772672653198242, 17.917951583862305, 19.063228607177734, 20.208507537841797, 21.35378646850586, 22.499065399169922, 23.644344329833984, 24.789623260498047, 25.93490219116211, 27.08017921447754, 28.2254581451416, 29.370737075805664, 30.516014099121094, 31.661296844482422, 32.806575775146484, 33.95185470581055, 35.09713363647461, 36.24241256713867, 37.38768768310547, 38.53296661376953, 39.678245544433594, 40.823524475097656, 41.96880340576172, 43.11408233642578, 44.259361267089844, 45.404640197753906, 46.54991912841797, 47.69519805908203, 48.84047317504883, 49.985755920410156, 51.13103485107422, 52.27631378173828, 53.421592712402344, 54.566871643066406, 55.71215057373047, 56.85742950439453, 58.00270462036133, 59.14798355102539, 60.29326248168945, 61.438541412353516, 62.58382034301758, 63.72909927368164, 64.87437438964844, 66.0196533203125, 67.16493225097656, 68.31021118164062]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 5.0, 10.0, 6.0, 13.0, 22.0, 22.0, 18.0, 18.0, 20.0, 15.0, 26.0, 30.0, 30.0, 24.0, 35.0, 40.0, 33.0, 37.0, 33.0, 34.0, 34.0, 33.0, 37.0, 37.0, 38.0, 32.0, 41.0, 23.0, 35.0, 31.0, 21.0, 16.0, 28.0, 18.0, 15.0, 17.0, 10.0, 10.0, 9.0, 8.0, 8.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-55.81963348388672, -54.091609954833984, -52.363582611083984, -50.63555908203125, -48.907535552978516, -47.17951202392578, -45.45148468017578, -43.72346115112305, -41.99543762207031, -40.26741409301758, -38.53938674926758, -36.811363220214844, -35.08333969116211, -33.355316162109375, -31.627288818359375, -29.89926528930664, -28.17123794555664, -26.443212509155273, -24.71518898010254, -22.987163543701172, -21.259140014648438, -19.53111457824707, -17.803089141845703, -16.07506561279297, -14.347040176391602, -12.61901569366455, -10.8909912109375, -9.162965774536133, -7.434941291809082, -5.706916809082031, -3.978891372680664, -2.2508668899536133, -0.5228424072265625, 1.2051823139190674, 2.9332070350646973, 4.661231994628906, 6.389256477355957, 8.117280960083008, 9.845306396484375, 11.573330879211426, 13.301355361938477, 15.029379844665527, 16.757404327392578, 18.485429763793945, 20.213455200195312, 21.941478729248047, 23.669504165649414, 25.39752960205078, 27.125553131103516, 28.853578567504883, 30.581602096557617, 32.309627532958984, 34.03765106201172, 35.76567840576172, 37.49370193481445, 39.22172546386719, 40.94975280761719, 42.67777633666992, 44.40580368041992, 46.133827209472656, 47.86185073852539, 49.589874267578125, 51.317901611328125, 53.04592514038086, 54.773948669433594]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 12.0, 10.0, 15.0, 25.0, 19.0, 30.0, 42.0, 46.0, 38.0, 44.0, 54.0, 42.0, 46.0, 60.0, 43.0, 62.0, 48.0, 49.0, 42.0, 39.0, 37.0, 28.0, 40.0, 26.0, 21.0, 20.0, 6.0, 15.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.8870849609375, -5.676513671875, -5.4659423828125, -5.25537109375, -5.0447998046875, -4.834228515625, -4.6236572265625, -4.4130859375, -4.2025146484375, -3.991943359375, -3.7813720703125, -3.57080078125, -3.3602294921875, -3.149658203125, -2.9390869140625, -2.728515625, -2.5179443359375, -2.307373046875, -2.0968017578125, -1.88623046875, -1.6756591796875, -1.465087890625, -1.2545166015625, -1.0439453125, -0.8333740234375, -0.622802734375, -0.4122314453125, -0.20166015625, 0.0089111328125, 0.219482421875, 0.4300537109375, 0.640625, 0.8511962890625, 1.061767578125, 1.2723388671875, 1.48291015625, 1.6934814453125, 1.904052734375, 2.1146240234375, 2.3251953125, 2.5357666015625, 2.746337890625, 2.9569091796875, 3.16748046875, 3.3780517578125, 3.588623046875, 3.7991943359375, 4.009765625, 4.2203369140625, 4.430908203125, 4.6414794921875, 4.85205078125, 5.0626220703125, 5.273193359375, 5.4837646484375, 5.6943359375, 5.9049072265625, 6.115478515625, 6.3260498046875, 6.53662109375, 6.7471923828125, 6.957763671875, 7.1683349609375, 7.37890625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 9.0, 4.0, 15.0, 11.0, 19.0, 24.0, 26.0, 49.0, 72.0, 130.0, 184.0, 525.0, 2148.0, 10982.0, 111447.0, 2549466.0, 1451115.0, 58119.0, 7352.0, 1605.0, 459.0, 174.0, 107.0, 66.0, 53.0, 24.0, 23.0, 22.0, 6.0, 16.0, 9.0, 11.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.587890625, -16.95703125, -16.326171875, -15.6953125, -15.064453125, -14.43359375, -13.802734375, -13.171875, -12.541015625, -11.91015625, -11.279296875, -10.6484375, -10.017578125, -9.38671875, -8.755859375, -8.125, -7.494140625, -6.86328125, -6.232421875, -5.6015625, -4.970703125, -4.33984375, -3.708984375, -3.078125, -2.447265625, -1.81640625, -1.185546875, -0.5546875, 0.076171875, 0.70703125, 1.337890625, 1.96875, 2.599609375, 3.23046875, 3.861328125, 4.4921875, 5.123046875, 5.75390625, 6.384765625, 7.015625, 7.646484375, 8.27734375, 8.908203125, 9.5390625, 10.169921875, 10.80078125, 11.431640625, 12.0625, 12.693359375, 13.32421875, 13.955078125, 14.5859375, 15.216796875, 15.84765625, 16.478515625, 17.109375, 17.740234375, 18.37109375, 19.001953125, 19.6328125, 20.263671875, 20.89453125, 21.525390625, 22.15625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 6.0, 24.0, 17.0, 35.0, 30.0, 58.0, 67.0, 90.0, 121.0, 149.0, 179.0, 245.0, 317.0, 393.0, 406.0, 367.0, 368.0, 290.0, 207.0, 173.0, 118.0, 108.0, 75.0, 52.0, 45.0, 26.0, 24.0, 11.0, 13.0, 9.0, 7.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -15.0655517578125, -14.654541015625, -14.2435302734375, -13.83251953125, -13.4215087890625, -13.010498046875, -12.5994873046875, -12.1884765625, -11.7774658203125, -11.366455078125, -10.9554443359375, -10.54443359375, -10.1334228515625, -9.722412109375, -9.3114013671875, -8.900390625, -8.4893798828125, -8.078369140625, -7.6673583984375, -7.25634765625, -6.8453369140625, -6.434326171875, -6.0233154296875, -5.6123046875, -5.2012939453125, -4.790283203125, -4.3792724609375, -3.96826171875, -3.5572509765625, -3.146240234375, -2.7352294921875, -2.32421875, -1.9132080078125, -1.502197265625, -1.0911865234375, -0.68017578125, -0.2691650390625, 0.141845703125, 0.5528564453125, 0.9638671875, 1.3748779296875, 1.785888671875, 2.1968994140625, 2.60791015625, 3.0189208984375, 3.429931640625, 3.8409423828125, 4.251953125, 4.6629638671875, 5.073974609375, 5.4849853515625, 5.89599609375, 6.3070068359375, 6.718017578125, 7.1290283203125, 7.5400390625, 7.9510498046875, 8.362060546875, 8.7730712890625, 9.18408203125, 9.5950927734375, 10.006103515625, 10.4171142578125, 10.828125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 14.0, 10.0, 26.0, 37.0, 31.0, 64.0, 94.0, 119.0, 192.0, 312.0, 620.0, 4304.0, 154037.0, 3918815.0, 110646.0, 3549.0, 539.0, 290.0, 165.0, 129.0, 75.0, 54.0, 45.0, 24.0, 24.0, 21.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -38.724609375, -37.07421875, -35.423828125, -33.7734375, -32.123046875, -30.47265625, -28.822265625, -27.171875, -25.521484375, -23.87109375, -22.220703125, -20.5703125, -18.919921875, -17.26953125, -15.619140625, -13.96875, -12.318359375, -10.66796875, -9.017578125, -7.3671875, -5.716796875, -4.06640625, -2.416015625, -0.765625, 0.884765625, 2.53515625, 4.185546875, 5.8359375, 7.486328125, 9.13671875, 10.787109375, 12.4375, 14.087890625, 15.73828125, 17.388671875, 19.0390625, 20.689453125, 22.33984375, 23.990234375, 25.640625, 27.291015625, 28.94140625, 30.591796875, 32.2421875, 33.892578125, 35.54296875, 37.193359375, 38.84375, 40.494140625, 42.14453125, 43.794921875, 45.4453125, 47.095703125, 48.74609375, 50.396484375, 52.046875, 53.697265625, 55.34765625, 56.998046875, 58.6484375, 60.298828125, 61.94921875, 63.599609375, 65.25]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 32.0, 44.0, 75.0, 112.0, 126.0, 143.0, 124.0, 119.0, 78.0, 52.0, 28.0, 21.0, 17.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.53249740600586, -59.126258850097656, -56.72001647949219, -54.313777923583984, -51.907535552978516, -49.50129699707031, -47.095054626464844, -44.68881607055664, -42.28257751464844, -39.876338958740234, -37.470096588134766, -35.06385803222656, -32.657615661621094, -30.25137710571289, -27.845136642456055, -25.43889617919922, -23.03265380859375, -20.626413345336914, -18.220172882080078, -15.813933372497559, -13.407692909240723, -11.001452445983887, -8.595212936401367, -6.188972473144531, -3.7827320098876953, -1.3764917850494385, 1.0297484397888184, 3.435988426208496, 5.842228889465332, 8.248469352722168, 10.654708862304688, 13.060949325561523, 15.467193603515625, 17.87343406677246, 20.279674530029297, 22.6859130859375, 25.09215545654297, 27.498394012451172, 29.904634475708008, 32.310874938964844, 34.71711730957031, 37.123355865478516, 39.529598236083984, 41.93583679199219, 44.342079162597656, 46.74831771850586, 49.15455627441406, 51.56079864501953, 53.967037200927734, 56.37327575683594, 58.779518127441406, 61.18575668334961, 63.59199905395508, 65.99823760986328, 68.40447998046875, 70.81071472167969, 73.21695709228516, 75.62319946289062, 78.02943420410156, 80.43567657470703, 82.8419189453125, 85.24816131591797, 87.6543960571289, 90.06063842773438, 92.46688079833984]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 9.0, 11.0, 17.0, 13.0, 18.0, 18.0, 29.0, 29.0, 33.0, 25.0, 39.0, 34.0, 25.0, 42.0, 34.0, 40.0, 29.0, 45.0, 43.0, 43.0, 44.0, 33.0, 33.0, 37.0, 37.0, 36.0, 22.0, 21.0, 16.0, 15.0, 29.0, 13.0, 11.0, 17.0, 8.0, 7.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-50.12028503417969, -48.74879837036133, -47.37731170654297, -46.00582504272461, -44.63433837890625, -43.262855529785156, -41.89136505126953, -40.51988220214844, -39.14839553833008, -37.77690887451172, -36.40542221069336, -35.033935546875, -33.66244888305664, -32.29096221923828, -30.919477462768555, -29.547992706298828, -28.176504135131836, -26.805017471313477, -25.433530807495117, -24.06204605102539, -22.69055938720703, -21.319072723388672, -19.947586059570312, -18.576099395751953, -17.204612731933594, -15.833126068115234, -14.461640357971191, -13.090153694152832, -11.718667984008789, -10.34718132019043, -8.97569465637207, -7.604208946228027, -6.232723236083984, -4.861237049102783, -3.489750623703003, -2.1182641983032227, -0.7467780113220215, 0.6247081756591797, 1.996194839477539, 3.367680549621582, 4.739167213439941, 6.110653400421143, 7.482139587402344, 8.853626251220703, 10.225112915039062, 11.596598625183105, 12.968085289001465, 14.339570999145508, 15.711057662963867, 17.082544326782227, 18.454030990600586, 19.825515747070312, 21.197002410888672, 22.56848907470703, 23.93997573852539, 25.31146240234375, 26.68294906616211, 28.05443572998047, 29.425922393798828, 30.797409057617188, 32.16889572143555, 33.540382385253906, 34.911865234375, 36.28335189819336, 37.65483856201172]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 25.0, 30.0, 20.0, 33.0, 30.0, 31.0, 46.0, 52.0, 61.0, 46.0, 39.0, 53.0, 51.0, 57.0, 37.0, 39.0, 44.0, 46.0, 33.0, 35.0, 25.0, 28.0, 20.0, 9.0, 14.0, 12.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1868896484375, -4.983154296875, -4.7794189453125, -4.57568359375, -4.3719482421875, -4.168212890625, -3.9644775390625, -3.7607421875, -3.5570068359375, -3.353271484375, -3.1495361328125, -2.94580078125, -2.7420654296875, -2.538330078125, -2.3345947265625, -2.130859375, -1.9271240234375, -1.723388671875, -1.5196533203125, -1.31591796875, -1.1121826171875, -0.908447265625, -0.7047119140625, -0.5009765625, -0.2972412109375, -0.093505859375, 0.1102294921875, 0.31396484375, 0.5177001953125, 0.721435546875, 0.9251708984375, 1.12890625, 1.3326416015625, 1.536376953125, 1.7401123046875, 1.94384765625, 2.1475830078125, 2.351318359375, 2.5550537109375, 2.7587890625, 2.9625244140625, 3.166259765625, 3.3699951171875, 3.57373046875, 3.7774658203125, 3.981201171875, 4.1849365234375, 4.388671875, 4.5924072265625, 4.796142578125, 4.9998779296875, 5.20361328125, 5.4073486328125, 5.611083984375, 5.8148193359375, 6.0185546875, 6.2222900390625, 6.426025390625, 6.6297607421875, 6.83349609375, 7.0372314453125, 7.240966796875, 7.4447021484375, 7.6484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 10.0, 22.0, 38.0, 55.0, 57.0, 102.0, 171.0, 227.0, 340.0, 520.0, 696.0, 1056.0, 1542.0, 2117.0, 3025.0, 4508.0, 6407.0, 9323.0, 13994.0, 20706.0, 31572.0, 50004.0, 83999.0, 154173.0, 235353.0, 173503.0, 94529.0, 55294.0, 34678.0, 22737.0, 15150.0, 10143.0, 6924.0, 4762.0, 3319.0, 2223.0, 1695.0, 1102.0, 778.0, 559.0, 340.0, 287.0, 160.0, 114.0, 66.0, 59.0, 44.0, 22.0, 17.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6964797973632812, -0.6737213134765625, -0.6509628295898438, -0.628204345703125, -0.6054458618164062, -0.5826873779296875, -0.5599288940429688, -0.53717041015625, -0.5144119262695312, -0.4916534423828125, -0.46889495849609375, -0.446136474609375, -0.42337799072265625, -0.4006195068359375, -0.37786102294921875, -0.3551025390625, -0.33234405517578125, -0.3095855712890625, -0.28682708740234375, -0.264068603515625, -0.24131011962890625, -0.2185516357421875, -0.19579315185546875, -0.17303466796875, -0.15027618408203125, -0.1275177001953125, -0.10475921630859375, -0.082000732421875, -0.05924224853515625, -0.0364837646484375, -0.01372528076171875, 0.009033203125, 0.03179168701171875, 0.0545501708984375, 0.07730865478515625, 0.100067138671875, 0.12282562255859375, 0.1455841064453125, 0.16834259033203125, 0.19110107421875, 0.21385955810546875, 0.2366180419921875, 0.25937652587890625, 0.282135009765625, 0.30489349365234375, 0.3276519775390625, 0.35041046142578125, 0.3731689453125, 0.39592742919921875, 0.4186859130859375, 0.44144439697265625, 0.464202880859375, 0.48696136474609375, 0.5097198486328125, 0.5324783325195312, 0.55523681640625, 0.5779953002929688, 0.6007537841796875, 0.6235122680664062, 0.646270751953125, 0.6690292358398438, 0.6917877197265625, 0.7145462036132812, 0.7373046875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 7.0, 15.0, 17.0, 14.0, 24.0, 22.0, 19.0, 27.0, 24.0, 27.0, 35.0, 24.0, 27.0, 52.0, 40.0, 56.0, 1057.0, 40.0, 39.0, 49.0, 43.0, 38.0, 29.0, 31.0, 36.0, 29.0, 19.0, 23.0, 21.0, 23.0, 18.0, 14.0, 9.0, 16.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.1611328125, -3.05859375, -2.9560546875, -2.853515625, -2.7509765625, -2.6484375, -2.5458984375, -2.443359375, -2.3408203125, -2.23828125, -2.1357421875, -2.033203125, -1.9306640625, -1.828125, -1.7255859375, -1.623046875, -1.5205078125, -1.41796875, -1.3154296875, -1.212890625, -1.1103515625, -1.0078125, -0.9052734375, -0.802734375, -0.7001953125, -0.59765625, -0.4951171875, -0.392578125, -0.2900390625, -0.1875, -0.0849609375, 0.017578125, 0.1201171875, 0.22265625, 0.3251953125, 0.427734375, 0.5302734375, 0.6328125, 0.7353515625, 0.837890625, 0.9404296875, 1.04296875, 1.1455078125, 1.248046875, 1.3505859375, 1.453125, 1.5556640625, 1.658203125, 1.7607421875, 1.86328125, 1.9658203125, 2.068359375, 2.1708984375, 2.2734375, 2.3759765625, 2.478515625, 2.5810546875, 2.68359375, 2.7861328125, 2.888671875, 2.9912109375, 3.09375, 3.1962890625, 3.298828125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 17.0, 15.0, 25.0, 45.0, 62.0, 108.0, 142.0, 217.0, 326.0, 472.0, 728.0, 957.0, 1379.0, 1976.0, 3061.0, 4634.0, 7005.0, 10844.0, 16866.0, 26753.0, 44179.0, 77416.0, 144004.0, 1291967.0, 199938.0, 107361.0, 59594.0, 35117.0, 21533.0, 13903.0, 8950.0, 5636.0, 3829.0, 2586.0, 1745.0, 1196.0, 835.0, 552.0, 381.0, 264.0, 166.0, 117.0, 71.0, 54.0, 36.0, 24.0, 11.0, 10.0, 11.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6298828125, -0.6094131469726562, -0.5889434814453125, -0.5684738159179688, -0.548004150390625, -0.5275344848632812, -0.5070648193359375, -0.48659515380859375, -0.46612548828125, -0.44565582275390625, -0.4251861572265625, -0.40471649169921875, -0.384246826171875, -0.36377716064453125, -0.3433074951171875, -0.32283782958984375, -0.3023681640625, -0.28189849853515625, -0.2614288330078125, -0.24095916748046875, -0.220489501953125, -0.20001983642578125, -0.1795501708984375, -0.15908050537109375, -0.13861083984375, -0.11814117431640625, -0.0976715087890625, -0.07720184326171875, -0.056732177734375, -0.03626251220703125, -0.0157928466796875, 0.00467681884765625, 0.025146484375, 0.04561614990234375, 0.0660858154296875, 0.08655548095703125, 0.107025146484375, 0.12749481201171875, 0.1479644775390625, 0.16843414306640625, 0.18890380859375, 0.20937347412109375, 0.2298431396484375, 0.25031280517578125, 0.270782470703125, 0.29125213623046875, 0.3117218017578125, 0.33219146728515625, 0.3526611328125, 0.37313079833984375, 0.3936004638671875, 0.41407012939453125, 0.434539794921875, 0.45500946044921875, 0.4754791259765625, 0.49594879150390625, 0.51641845703125, 0.5368881225585938, 0.5573577880859375, 0.5778274536132812, 0.598297119140625, 0.6187667846679688, 0.6392364501953125, 0.6597061157226562, 0.68017578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 14.0, 12.0, 24.0, 27.0, 24.0, 18.0, 49.0, 42.0, 53.0, 58.0, 68.0, 51.0, 60.0, 70.0, 62.0, 57.0, 42.0, 45.0, 30.0, 32.0, 20.0, 19.0, 17.0, 15.0, 10.0, 11.0, 6.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00194549560546875, -0.0018904954195022583, -0.0018354952335357666, -0.001780495047569275, -0.0017254948616027832, -0.0016704946756362915, -0.0016154944896697998, -0.001560494303703308, -0.0015054941177368164, -0.0014504939317703247, -0.001395493745803833, -0.0013404935598373413, -0.0012854933738708496, -0.001230493187904358, -0.0011754930019378662, -0.0011204928159713745, -0.0010654926300048828, -0.0010104924440383911, -0.0009554922580718994, -0.0009004920721054077, -0.000845491886138916, -0.0007904917001724243, -0.0007354915142059326, -0.0006804913282394409, -0.0006254911422729492, -0.0005704909563064575, -0.0005154907703399658, -0.0004604905843734741, -0.0004054903984069824, -0.0003504902124404907, -0.000295490026473999, -0.00024048984050750732, -0.00018548965454101562, -0.00013048946857452393, -7.548928260803223e-05, -2.0489096641540527e-05, 3.451108932495117e-05, 8.951127529144287e-05, 0.00014451146125793457, 0.00019951164722442627, 0.00025451183319091797, 0.00030951201915740967, 0.00036451220512390137, 0.00041951239109039307, 0.00047451257705688477, 0.0005295127630233765, 0.0005845129489898682, 0.0006395131349563599, 0.0006945133209228516, 0.0007495135068893433, 0.000804513692855835, 0.0008595138788223267, 0.0009145140647888184, 0.0009695142507553101, 0.0010245144367218018, 0.0010795146226882935, 0.0011345148086547852, 0.0011895149946212769, 0.0012445151805877686, 0.0012995153665542603, 0.001354515552520752, 0.0014095157384872437, 0.0014645159244537354, 0.001519516110420227, 0.0015745162963867188]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 4.0, 8.0, 7.0, 6.0, 13.0, 15.0, 25.0, 39.0, 57.0, 86.0, 133.0, 221.0, 436.0, 1627.0, 1007507.0, 36870.0, 691.0, 294.0, 187.0, 99.0, 62.0, 44.0, 29.0, 23.0, 17.0, 11.0, 17.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04339599609375, -0.041886329650878906, -0.04037666320800781, -0.03886699676513672, -0.037357330322265625, -0.03584766387939453, -0.03433799743652344, -0.032828330993652344, -0.03131866455078125, -0.029808998107910156, -0.028299331665039062, -0.02678966522216797, -0.025279998779296875, -0.02377033233642578, -0.022260665893554688, -0.020750999450683594, -0.0192413330078125, -0.017731666564941406, -0.016222000122070312, -0.014712333679199219, -0.013202667236328125, -0.011693000793457031, -0.010183334350585938, -0.008673667907714844, -0.00716400146484375, -0.005654335021972656, -0.0041446685791015625, -0.0026350021362304688, -0.001125335693359375, 0.00038433074951171875, 0.0018939971923828125, 0.0034036636352539062, 0.004913330078125, 0.006422996520996094, 0.007932662963867188, 0.009442329406738281, 0.010951995849609375, 0.012461662292480469, 0.013971328735351562, 0.015480995178222656, 0.01699066162109375, 0.018500328063964844, 0.020009994506835938, 0.02151966094970703, 0.023029327392578125, 0.02453899383544922, 0.026048660278320312, 0.027558326721191406, 0.0290679931640625, 0.030577659606933594, 0.03208732604980469, 0.03359699249267578, 0.035106658935546875, 0.03661632537841797, 0.03812599182128906, 0.039635658264160156, 0.04114532470703125, 0.042654991149902344, 0.04416465759277344, 0.04567432403564453, 0.047183990478515625, 0.04869365692138672, 0.05020332336425781, 0.051712989807128906, 0.05322265625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 761.0, 248.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00523178419098258, -0.004789181984961033, -0.0043465797789394855, -0.0039039775729179382, -0.003461375366896391, -0.0030187733937054873, -0.00257617118768394, -0.0021335689816623926, -0.0016909667756408453, -0.001248364569619298, -0.0008057624218054116, -0.0003631602739915252, 7.944193203002214e-05, 0.0005220440216362476, 0.000964646227657795, 0.0014072484336793423, 0.0018498506397008896, 0.002292452845722437, 0.0027350550517439842, 0.0031776572577655315, 0.003620259463787079, 0.004062861204147339, 0.0045054638758301735, 0.0049480656161904335, 0.005390668287873268, 0.0058332704938948154, 0.006275872699916363, 0.00671847490593791, 0.007161077111959457, 0.007603678852319717, 0.008046281524002552, 0.008488883264362812, 0.008931485004723072, 0.009374086745083332, 0.009816689416766167, 0.010259291157126427, 0.010701893828809261, 0.011144495569169521, 0.011587098240852356, 0.012029699981212616, 0.01247230265289545, 0.01291490439325571, 0.013357507064938545, 0.013800108805298805, 0.01424271147698164, 0.0146853132173419, 0.015127915889024734, 0.015570517629384995, 0.016013119369745255, 0.016455721110105515, 0.016898322850465775, 0.017340926453471184, 0.017783528193831444, 0.018226129934191704, 0.018668731674551964, 0.019111335277557373, 0.019553937017917633, 0.019996538758277893, 0.020439140498638153, 0.020881744101643562, 0.021324345842003822, 0.021766947582364082, 0.022209549322724342, 0.02265215292572975, 0.02309475466609001]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 10.0, 9.0, 8.0, 11.0, 13.0, 10.0, 17.0, 14.0, 17.0, 26.0, 30.0, 36.0, 38.0, 21.0, 33.0, 36.0, 39.0, 41.0, 48.0, 46.0, 41.0, 52.0, 38.0, 35.0, 45.0, 29.0, 34.0, 34.0, 40.0, 19.0, 24.0, 13.0, 18.0, 16.0, 10.0, 9.0, 8.0, 7.0, 5.0, 3.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009239912033081055, -0.0008953018113970757, -0.0008666124194860458, -0.000837923027575016, -0.0008092336356639862, -0.0007805442437529564, -0.0007518548518419266, -0.0007231654599308968, -0.0006944760680198669, -0.0006657866761088371, -0.0006370972841978073, -0.0006084078922867775, -0.0005797185003757477, -0.0005510291084647179, -0.000522339716553688, -0.0004936503246426582, -0.0004649609327316284, -0.0004362715408205986, -0.0004075821489095688, -0.00037889275699853897, -0.00035020336508750916, -0.00032151397317647934, -0.0002928245812654495, -0.0002641351893544197, -0.0002354457974433899, -0.00020675640553236008, -0.00017806701362133026, -0.00014937762171030045, -0.00012068822979927063, -9.199883788824081e-05, -6.3309445977211e-05, -3.462005406618118e-05, -5.930662155151367e-06, 2.275872975587845e-05, 5.1448121666908264e-05, 8.013751357793808e-05, 0.0001088269054889679, 0.0001375162973999977, 0.00016620568931102753, 0.00019489508122205734, 0.00022358447313308716, 0.000252273865044117, 0.0002809632569551468, 0.0003096526488661766, 0.0003383420407772064, 0.00036703143268823624, 0.00039572082459926605, 0.00042441021651029587, 0.0004530996084213257, 0.0004817890003323555, 0.0005104783922433853, 0.0005391677841544151, 0.000567857176065445, 0.0005965465679764748, 0.0006252359598875046, 0.0006539253517985344, 0.0006826147437095642, 0.000711304135620594, 0.0007399935275316238, 0.0007686829194426537, 0.0007973723113536835, 0.0008260617032647133, 0.0008547510951757431, 0.0008834404870867729, 0.0009121298789978027]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 25.0, 30.0, 20.0, 33.0, 30.0, 31.0, 46.0, 52.0, 61.0, 46.0, 39.0, 53.0, 51.0, 57.0, 37.0, 39.0, 44.0, 46.0, 33.0, 35.0, 25.0, 28.0, 20.0, 9.0, 14.0, 12.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1868896484375, -4.983154296875, -4.7794189453125, -4.57568359375, -4.3719482421875, -4.168212890625, -3.9644775390625, -3.7607421875, -3.5570068359375, -3.353271484375, -3.1495361328125, -2.94580078125, -2.7420654296875, -2.538330078125, -2.3345947265625, -2.130859375, -1.9271240234375, -1.723388671875, -1.5196533203125, -1.31591796875, -1.1121826171875, -0.908447265625, -0.7047119140625, -0.5009765625, -0.2972412109375, -0.093505859375, 0.1102294921875, 0.31396484375, 0.5177001953125, 0.721435546875, 0.9251708984375, 1.12890625, 1.3326416015625, 1.536376953125, 1.7401123046875, 1.94384765625, 2.1475830078125, 2.351318359375, 2.5550537109375, 2.7587890625, 2.9625244140625, 3.166259765625, 3.3699951171875, 3.57373046875, 3.7774658203125, 3.981201171875, 4.1849365234375, 4.388671875, 4.5924072265625, 4.796142578125, 4.9998779296875, 5.20361328125, 5.4073486328125, 5.611083984375, 5.8148193359375, 6.0185546875, 6.2222900390625, 6.426025390625, 6.6297607421875, 6.83349609375, 7.0372314453125, 7.240966796875, 7.4447021484375, 7.6484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 15.0, 11.0, 25.0, 25.0, 49.0, 62.0, 89.0, 121.0, 157.0, 247.0, 356.0, 486.0, 676.0, 885.0, 1278.0, 1827.0, 2414.0, 3466.0, 5094.0, 7593.0, 12631.0, 25019.0, 63656.0, 211232.0, 459942.0, 148983.0, 48347.0, 20613.0, 10943.0, 6728.0, 4458.0, 3190.0, 2286.0, 1612.0, 1120.0, 810.0, 607.0, 429.0, 302.0, 211.0, 164.0, 105.0, 71.0, 65.0, 40.0, 42.0, 18.0, 10.0, 16.0, 11.0, 11.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.96875, -3.84613037109375, -3.7235107421875, -3.60089111328125, -3.478271484375, -3.35565185546875, -3.2330322265625, -3.11041259765625, -2.98779296875, -2.86517333984375, -2.7425537109375, -2.61993408203125, -2.497314453125, -2.37469482421875, -2.2520751953125, -2.12945556640625, -2.0068359375, -1.88421630859375, -1.7615966796875, -1.63897705078125, -1.516357421875, -1.39373779296875, -1.2711181640625, -1.14849853515625, -1.02587890625, -0.90325927734375, -0.7806396484375, -0.65802001953125, -0.535400390625, -0.41278076171875, -0.2901611328125, -0.16754150390625, -0.044921875, 0.07769775390625, 0.2003173828125, 0.32293701171875, 0.445556640625, 0.56817626953125, 0.6907958984375, 0.81341552734375, 0.93603515625, 1.05865478515625, 1.1812744140625, 1.30389404296875, 1.426513671875, 1.54913330078125, 1.6717529296875, 1.79437255859375, 1.9169921875, 2.03961181640625, 2.1622314453125, 2.28485107421875, 2.407470703125, 2.53009033203125, 2.6527099609375, 2.77532958984375, 2.89794921875, 3.02056884765625, 3.1431884765625, 3.26580810546875, 3.388427734375, 3.51104736328125, 3.6336669921875, 3.75628662109375, 3.87890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 13.0, 10.0, 14.0, 15.0, 19.0, 22.0, 22.0, 33.0, 28.0, 26.0, 40.0, 50.0, 37.0, 63.0, 102.0, 403.0, 1609.0, 102.0, 57.0, 56.0, 34.0, 34.0, 28.0, 29.0, 30.0, 37.0, 25.0, 22.0, 17.0, 18.0, 10.0, 9.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.34375, -20.69873046875, -20.0537109375, -19.40869140625, -18.763671875, -18.11865234375, -17.4736328125, -16.82861328125, -16.18359375, -15.53857421875, -14.8935546875, -14.24853515625, -13.603515625, -12.95849609375, -12.3134765625, -11.66845703125, -11.0234375, -10.37841796875, -9.7333984375, -9.08837890625, -8.443359375, -7.79833984375, -7.1533203125, -6.50830078125, -5.86328125, -5.21826171875, -4.5732421875, -3.92822265625, -3.283203125, -2.63818359375, -1.9931640625, -1.34814453125, -0.703125, -0.05810546875, 0.5869140625, 1.23193359375, 1.876953125, 2.52197265625, 3.1669921875, 3.81201171875, 4.45703125, 5.10205078125, 5.7470703125, 6.39208984375, 7.037109375, 7.68212890625, 8.3271484375, 8.97216796875, 9.6171875, 10.26220703125, 10.9072265625, 11.55224609375, 12.197265625, 12.84228515625, 13.4873046875, 14.13232421875, 14.77734375, 15.42236328125, 16.0673828125, 16.71240234375, 17.357421875, 18.00244140625, 18.6474609375, 19.29248046875, 19.9375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 2.0, 5.0, 10.0, 12.0, 26.0, 30.0, 26.0, 28.0, 37.0, 46.0, 70.0, 108.0, 182.0, 239.0, 392.0, 1544.0, 21743.0, 3062024.0, 54996.0, 2719.0, 512.0, 272.0, 180.0, 127.0, 86.0, 51.0, 38.0, 38.0, 29.0, 17.0, 25.0, 17.0, 10.0, 14.0, 8.0, 2.0, 6.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.2802734375, -33.123046875, -31.9658203125, -30.80859375, -29.6513671875, -28.494140625, -27.3369140625, -26.1796875, -25.0224609375, -23.865234375, -22.7080078125, -21.55078125, -20.3935546875, -19.236328125, -18.0791015625, -16.921875, -15.7646484375, -14.607421875, -13.4501953125, -12.29296875, -11.1357421875, -9.978515625, -8.8212890625, -7.6640625, -6.5068359375, -5.349609375, -4.1923828125, -3.03515625, -1.8779296875, -0.720703125, 0.4365234375, 1.59375, 2.7509765625, 3.908203125, 5.0654296875, 6.22265625, 7.3798828125, 8.537109375, 9.6943359375, 10.8515625, 12.0087890625, 13.166015625, 14.3232421875, 15.48046875, 16.6376953125, 17.794921875, 18.9521484375, 20.109375, 21.2666015625, 22.423828125, 23.5810546875, 24.73828125, 25.8955078125, 27.052734375, 28.2099609375, 29.3671875, 30.5244140625, 31.681640625, 32.8388671875, 33.99609375, 35.1533203125, 36.310546875, 37.4677734375, 38.625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 41.0, 148.0, 333.0, 307.0, 140.0, 32.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.50423049926758, -55.807281494140625, -54.11033248901367, -52.41338348388672, -50.716434478759766, -49.01948547363281, -47.322540283203125, -45.62559127807617, -43.92864227294922, -42.231693267822266, -40.53474426269531, -38.83779525756836, -37.140846252441406, -35.44390106201172, -33.7469482421875, -32.05000305175781, -30.353052139282227, -28.656103134155273, -26.95915412902832, -25.26220703125, -23.565258026123047, -21.868309020996094, -20.17136001586914, -18.474411010742188, -16.777462005615234, -15.080513000488281, -13.383564949035645, -11.686615943908691, -9.989667892456055, -8.292718887329102, -6.595769882202148, -4.898821830749512, -3.201873779296875, -1.5049251317977905, 0.19202351570129395, 1.888972282409668, 3.585920810699463, 5.282869338989258, 6.979818344116211, 8.676766395568848, 10.3737154006958, 12.070664405822754, 13.76761245727539, 15.464561462402344, 17.161510467529297, 18.85845947265625, 20.555408477783203, 22.252355575561523, 23.949304580688477, 25.64625358581543, 27.343202590942383, 29.040149688720703, 30.737098693847656, 32.43404769897461, 34.13099670410156, 35.827945709228516, 37.52489471435547, 39.22184371948242, 40.918792724609375, 42.61574172973633, 44.31269073486328, 46.00963592529297, 47.70658874511719, 49.403533935546875, 51.10048294067383]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 9.0, 13.0, 18.0, 12.0, 25.0, 24.0, 16.0, 18.0, 24.0, 23.0, 30.0, 35.0, 38.0, 43.0, 34.0, 45.0, 64.0, 42.0, 39.0, 38.0, 47.0, 43.0, 43.0, 29.0, 29.0, 29.0, 24.0, 25.0, 21.0, 22.0, 12.0, 13.0, 12.0, 7.0, 10.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.369537353515625, -55.53218078613281, -53.694828033447266, -51.85747146606445, -50.02011489868164, -48.182762145996094, -46.34540557861328, -44.50804901123047, -42.670692443847656, -40.833335876464844, -38.9959831237793, -37.158626556396484, -35.32126998901367, -33.483917236328125, -31.646560668945312, -29.8092041015625, -27.971851348876953, -26.134496688842773, -24.29714012145996, -22.45978546142578, -20.62242889404297, -18.78507423400879, -16.94771957397461, -15.110363960266113, -13.273008346557617, -11.435652732849121, -9.598297119140625, -7.760942459106445, -5.923586845397949, -4.086231231689453, -2.2488765716552734, -0.41152095794677734, 1.4258346557617188, 3.2631900310516357, 5.100545406341553, 6.937900543212891, 8.775256156921387, 10.612611770629883, 12.449966430664062, 14.287322044372559, 16.124677658081055, 17.962032318115234, 19.799388885498047, 21.636743545532227, 23.474098205566406, 25.31145477294922, 27.1488094329834, 28.986164093017578, 30.82352066040039, 32.6608772277832, 34.49822998046875, 36.33558654785156, 38.172943115234375, 40.01029968261719, 41.847652435302734, 43.68500900268555, 45.522361755371094, 47.359718322753906, 49.19707107543945, 51.034427642822266, 52.87178421020508, 54.709136962890625, 56.54649353027344, 58.38385009765625, 60.22120666503906]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 13.0, 17.0, 24.0, 31.0, 23.0, 24.0, 34.0, 30.0, 46.0, 61.0, 55.0, 49.0, 39.0, 55.0, 48.0, 51.0, 44.0, 44.0, 44.0, 47.0, 26.0, 40.0, 28.0, 25.0, 14.0, 16.0, 14.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.55206298828125, -5.3424072265625, -5.13275146484375, -4.923095703125, -4.71343994140625, -4.5037841796875, -4.29412841796875, -4.08447265625, -3.87481689453125, -3.6651611328125, -3.45550537109375, -3.245849609375, -3.03619384765625, -2.8265380859375, -2.61688232421875, -2.4072265625, -2.19757080078125, -1.9879150390625, -1.77825927734375, -1.568603515625, -1.35894775390625, -1.1492919921875, -0.93963623046875, -0.72998046875, -0.52032470703125, -0.3106689453125, -0.10101318359375, 0.108642578125, 0.31829833984375, 0.5279541015625, 0.73760986328125, 0.947265625, 1.15692138671875, 1.3665771484375, 1.57623291015625, 1.785888671875, 1.99554443359375, 2.2052001953125, 2.41485595703125, 2.62451171875, 2.83416748046875, 3.0438232421875, 3.25347900390625, 3.463134765625, 3.67279052734375, 3.8824462890625, 4.09210205078125, 4.3017578125, 4.51141357421875, 4.7210693359375, 4.93072509765625, 5.140380859375, 5.35003662109375, 5.5596923828125, 5.76934814453125, 5.97900390625, 6.18865966796875, 6.3983154296875, 6.60797119140625, 6.817626953125, 7.02728271484375, 7.2369384765625, 7.44659423828125, 7.65625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 16.0, 22.0, 36.0, 53.0, 87.0, 126.0, 197.0, 290.0, 472.0, 694.0, 1200.0, 2200.0, 3932.0, 7713.0, 16000.0, 36441.0, 93699.0, 284273.0, 828644.0, 1414331.0, 969557.0, 345877.0, 109338.0, 41589.0, 18324.0, 8833.0, 4384.0, 2376.0, 1355.0, 829.0, 471.0, 307.0, 199.0, 122.0, 96.0, 64.0, 44.0, 26.0, 18.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.928466796875, -4.73583984375, -4.543212890625, -4.3505859375, -4.157958984375, -3.96533203125, -3.772705078125, -3.580078125, -3.387451171875, -3.19482421875, -3.002197265625, -2.8095703125, -2.616943359375, -2.42431640625, -2.231689453125, -2.0390625, -1.846435546875, -1.65380859375, -1.461181640625, -1.2685546875, -1.075927734375, -0.88330078125, -0.690673828125, -0.498046875, -0.305419921875, -0.11279296875, 0.079833984375, 0.2724609375, 0.465087890625, 0.65771484375, 0.850341796875, 1.04296875, 1.235595703125, 1.42822265625, 1.620849609375, 1.8134765625, 2.006103515625, 2.19873046875, 2.391357421875, 2.583984375, 2.776611328125, 2.96923828125, 3.161865234375, 3.3544921875, 3.547119140625, 3.73974609375, 3.932373046875, 4.125, 4.317626953125, 4.51025390625, 4.702880859375, 4.8955078125, 5.088134765625, 5.28076171875, 5.473388671875, 5.666015625, 5.858642578125, 6.05126953125, 6.243896484375, 6.4365234375, 6.629150390625, 6.82177734375, 7.014404296875, 7.20703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 11.0, 7.0, 18.0, 19.0, 24.0, 27.0, 39.0, 55.0, 71.0, 99.0, 97.0, 137.0, 158.0, 202.0, 284.0, 291.0, 327.0, 387.0, 305.0, 304.0, 264.0, 176.0, 173.0, 123.0, 105.0, 89.0, 64.0, 49.0, 23.0, 40.0, 28.0, 16.0, 17.0, 8.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6796875, -12.3214111328125, -11.963134765625, -11.6048583984375, -11.24658203125, -10.8883056640625, -10.530029296875, -10.1717529296875, -9.8134765625, -9.4552001953125, -9.096923828125, -8.7386474609375, -8.38037109375, -8.0220947265625, -7.663818359375, -7.3055419921875, -6.947265625, -6.5889892578125, -6.230712890625, -5.8724365234375, -5.51416015625, -5.1558837890625, -4.797607421875, -4.4393310546875, -4.0810546875, -3.7227783203125, -3.364501953125, -3.0062255859375, -2.64794921875, -2.2896728515625, -1.931396484375, -1.5731201171875, -1.21484375, -0.8565673828125, -0.498291015625, -0.1400146484375, 0.21826171875, 0.5765380859375, 0.934814453125, 1.2930908203125, 1.6513671875, 2.0096435546875, 2.367919921875, 2.7261962890625, 3.08447265625, 3.4427490234375, 3.801025390625, 4.1593017578125, 4.517578125, 4.8758544921875, 5.234130859375, 5.5924072265625, 5.95068359375, 6.3089599609375, 6.667236328125, 7.0255126953125, 7.3837890625, 7.7420654296875, 8.100341796875, 8.4586181640625, 8.81689453125, 9.1751708984375, 9.533447265625, 9.8917236328125, 10.25]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 3.0, 12.0, 14.0, 16.0, 16.0, 34.0, 44.0, 50.0, 86.0, 97.0, 163.0, 238.0, 517.0, 2441.0, 46765.0, 3386842.0, 741697.0, 13120.0, 1142.0, 359.0, 162.0, 128.0, 82.0, 63.0, 49.0, 33.0, 24.0, 16.0, 13.0, 12.0, 11.0, 5.0, 6.0, 1.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.09375, -40.6328125, -39.171875, -37.7109375, -36.25, -34.7890625, -33.328125, -31.8671875, -30.40625, -28.9453125, -27.484375, -26.0234375, -24.5625, -23.1015625, -21.640625, -20.1796875, -18.71875, -17.2578125, -15.796875, -14.3359375, -12.875, -11.4140625, -9.953125, -8.4921875, -7.03125, -5.5703125, -4.109375, -2.6484375, -1.1875, 0.2734375, 1.734375, 3.1953125, 4.65625, 6.1171875, 7.578125, 9.0390625, 10.5, 11.9609375, 13.421875, 14.8828125, 16.34375, 17.8046875, 19.265625, 20.7265625, 22.1875, 23.6484375, 25.109375, 26.5703125, 28.03125, 29.4921875, 30.953125, 32.4140625, 33.875, 35.3359375, 36.796875, 38.2578125, 39.71875, 41.1796875, 42.640625, 44.1015625, 45.5625, 47.0234375, 48.484375, 49.9453125, 51.40625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 30.0, 99.0, 270.0, 333.0, 184.0, 73.0, 17.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.2979736328125, -201.4225616455078, -195.54714965820312, -189.67173767089844, -183.79632568359375, -177.92091369628906, -172.04550170898438, -166.1700897216797, -160.294677734375, -154.4192657470703, -148.54385375976562, -142.66844177246094, -136.79302978515625, -130.91761779785156, -125.04220581054688, -119.16679382324219, -113.2913818359375, -107.41596984863281, -101.54055786132812, -95.66514587402344, -89.78973388671875, -83.91432189941406, -78.03890991210938, -72.16349792480469, -66.2880859375, -60.41267395019531, -54.537261962890625, -48.66184997558594, -42.78643798828125, -36.91102600097656, -31.035614013671875, -25.160202026367188, -19.284805297851562, -13.409393310546875, -7.5339813232421875, -1.6585693359375, 4.2168426513671875, 10.092254638671875, 15.967666625976562, 21.84307861328125, 27.718490600585938, 33.593902587890625, 39.46931457519531, 45.3447265625, 51.22013854980469, 57.095550537109375, 62.97096252441406, 68.84637451171875, 74.72178649902344, 80.59719848632812, 86.47261047363281, 92.3480224609375, 98.22343444824219, 104.09884643554688, 109.97425842285156, 115.84967041015625, 121.72508239746094, 127.60049438476562, 133.4759063720703, 139.351318359375, 145.2267303466797, 151.10214233398438, 156.97755432128906, 162.85296630859375, 168.72837829589844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 7.0, 13.0, 10.0, 11.0, 15.0, 18.0, 19.0, 19.0, 23.0, 28.0, 28.0, 31.0, 28.0, 43.0, 32.0, 35.0, 31.0, 41.0, 34.0, 39.0, 38.0, 43.0, 38.0, 36.0, 34.0, 32.0, 36.0, 34.0, 24.0, 24.0, 26.0, 22.0, 20.0, 15.0, 10.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.34063720703125, -42.91967010498047, -41.49869918823242, -40.077728271484375, -38.656761169433594, -37.23579406738281, -35.814823150634766, -34.39385223388672, -32.97288513183594, -31.551916122436523, -30.13094711303711, -28.709978103637695, -27.28900909423828, -25.868040084838867, -24.447071075439453, -23.02610206604004, -21.605133056640625, -20.18416404724121, -18.763195037841797, -17.342226028442383, -15.921257019042969, -14.500288009643555, -13.07931900024414, -11.658349990844727, -10.237380981445312, -8.816411972045898, -7.395442962646484, -5.97447395324707, -4.553504943847656, -3.132535934448242, -1.7115669250488281, -0.29059791564941406, 1.13037109375, 2.551340103149414, 3.972309112548828, 5.393278121948242, 6.814247131347656, 8.23521614074707, 9.656185150146484, 11.077154159545898, 12.498123168945312, 13.919092178344727, 15.34006118774414, 16.761030197143555, 18.18199920654297, 19.602968215942383, 21.023937225341797, 22.44490623474121, 23.865875244140625, 25.28684425354004, 26.707813262939453, 28.128782272338867, 29.54975128173828, 30.970720291137695, 32.39168930053711, 33.812660217285156, 35.23362731933594, 36.65459442138672, 38.075565338134766, 39.49653625488281, 40.917503356933594, 42.338470458984375, 43.75944137573242, 45.18041229248047, 46.60137939453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 7.0, 7.0, 18.0, 23.0, 25.0, 15.0, 20.0, 34.0, 41.0, 34.0, 47.0, 52.0, 52.0, 59.0, 39.0, 55.0, 53.0, 37.0, 49.0, 47.0, 35.0, 37.0, 45.0, 31.0, 27.0, 30.0, 19.0, 10.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23828125, -6.01953125, -5.80078125, -5.58203125, -5.36328125, -5.14453125, -4.92578125, -4.70703125, -4.48828125, -4.26953125, -4.05078125, -3.83203125, -3.61328125, -3.39453125, -3.17578125, -2.95703125, -2.73828125, -2.51953125, -2.30078125, -2.08203125, -1.86328125, -1.64453125, -1.42578125, -1.20703125, -0.98828125, -0.76953125, -0.55078125, -0.33203125, -0.11328125, 0.10546875, 0.32421875, 0.54296875, 0.76171875, 0.98046875, 1.19921875, 1.41796875, 1.63671875, 1.85546875, 2.07421875, 2.29296875, 2.51171875, 2.73046875, 2.94921875, 3.16796875, 3.38671875, 3.60546875, 3.82421875, 4.04296875, 4.26171875, 4.48046875, 4.69921875, 4.91796875, 5.13671875, 5.35546875, 5.57421875, 5.79296875, 6.01171875, 6.23046875, 6.44921875, 6.66796875, 6.88671875, 7.10546875, 7.32421875, 7.54296875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 16.0, 27.0, 39.0, 67.0, 69.0, 121.0, 135.0, 233.0, 336.0, 454.0, 639.0, 856.0, 1183.0, 1756.0, 2471.0, 3448.0, 4969.0, 6921.0, 10159.0, 14659.0, 22016.0, 33908.0, 53457.0, 89479.0, 160320.0, 233091.0, 159710.0, 89811.0, 53536.0, 33909.0, 22361.0, 14715.0, 10039.0, 7081.0, 4800.0, 3481.0, 2366.0, 1631.0, 1209.0, 866.0, 676.0, 450.0, 343.0, 209.0, 138.0, 115.0, 77.0, 64.0, 41.0, 33.0, 17.0, 18.0, 6.0, 2.0, 3.0, 4.0, 1.0], "bins": [-0.7626953125, -0.739227294921875, -0.71575927734375, -0.692291259765625, -0.6688232421875, -0.645355224609375, -0.62188720703125, -0.598419189453125, -0.574951171875, -0.551483154296875, -0.52801513671875, -0.504547119140625, -0.4810791015625, -0.457611083984375, -0.43414306640625, -0.410675048828125, -0.38720703125, -0.363739013671875, -0.34027099609375, -0.316802978515625, -0.2933349609375, -0.269866943359375, -0.24639892578125, -0.222930908203125, -0.199462890625, -0.175994873046875, -0.15252685546875, -0.129058837890625, -0.1055908203125, -0.082122802734375, -0.05865478515625, -0.035186767578125, -0.01171875, 0.011749267578125, 0.03521728515625, 0.058685302734375, 0.0821533203125, 0.105621337890625, 0.12908935546875, 0.152557373046875, 0.176025390625, 0.199493408203125, 0.22296142578125, 0.246429443359375, 0.2698974609375, 0.293365478515625, 0.31683349609375, 0.340301513671875, 0.36376953125, 0.387237548828125, 0.41070556640625, 0.434173583984375, 0.4576416015625, 0.481109619140625, 0.50457763671875, 0.528045654296875, 0.551513671875, 0.574981689453125, 0.59844970703125, 0.621917724609375, 0.6453857421875, 0.668853759765625, 0.69232177734375, 0.715789794921875, 0.7392578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 5.0, 6.0, 8.0, 16.0, 12.0, 16.0, 18.0, 16.0, 20.0, 25.0, 27.0, 28.0, 40.0, 27.0, 32.0, 41.0, 41.0, 44.0, 37.0, 1058.0, 24.0, 38.0, 47.0, 38.0, 36.0, 31.0, 37.0, 37.0, 32.0, 18.0, 30.0, 17.0, 22.0, 9.0, 9.0, 14.0, 15.0, 8.0, 10.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.162109375, -3.055755615234375, -2.94940185546875, -2.843048095703125, -2.7366943359375, -2.630340576171875, -2.52398681640625, -2.417633056640625, -2.311279296875, -2.204925537109375, -2.09857177734375, -1.992218017578125, -1.8858642578125, -1.779510498046875, -1.67315673828125, -1.566802978515625, -1.46044921875, -1.354095458984375, -1.24774169921875, -1.141387939453125, -1.0350341796875, -0.928680419921875, -0.82232666015625, -0.715972900390625, -0.609619140625, -0.503265380859375, -0.39691162109375, -0.290557861328125, -0.1842041015625, -0.077850341796875, 0.02850341796875, 0.134857177734375, 0.2412109375, 0.347564697265625, 0.45391845703125, 0.560272216796875, 0.6666259765625, 0.772979736328125, 0.87933349609375, 0.985687255859375, 1.092041015625, 1.198394775390625, 1.30474853515625, 1.411102294921875, 1.5174560546875, 1.623809814453125, 1.73016357421875, 1.836517333984375, 1.94287109375, 2.049224853515625, 2.15557861328125, 2.261932373046875, 2.3682861328125, 2.474639892578125, 2.58099365234375, 2.687347412109375, 2.793701171875, 2.900054931640625, 3.00640869140625, 3.112762451171875, 3.2191162109375, 3.325469970703125, 3.43182373046875, 3.538177490234375, 3.64453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 8.0, 10.0, 12.0, 9.0, 21.0, 33.0, 43.0, 53.0, 93.0, 146.0, 232.0, 324.0, 545.0, 757.0, 1165.0, 1815.0, 2754.0, 4287.0, 6828.0, 10789.0, 17749.0, 29527.0, 50447.0, 90542.0, 173755.0, 1309468.0, 175843.0, 90518.0, 50918.0, 30005.0, 18304.0, 11083.0, 6843.0, 4251.0, 2718.0, 1790.0, 1164.0, 772.0, 498.0, 329.0, 230.0, 132.0, 110.0, 71.0, 35.0, 30.0, 23.0, 16.0, 14.0, 11.0, 2.0, 5.0, 1.0, 5.0, 5.0, 1.0], "bins": [-0.77490234375, -0.7517776489257812, -0.7286529541015625, -0.7055282592773438, -0.682403564453125, -0.6592788696289062, -0.6361541748046875, -0.6130294799804688, -0.58990478515625, -0.5667800903320312, -0.5436553955078125, -0.5205307006835938, -0.497406005859375, -0.47428131103515625, -0.4511566162109375, -0.42803192138671875, -0.4049072265625, -0.38178253173828125, -0.3586578369140625, -0.33553314208984375, -0.312408447265625, -0.28928375244140625, -0.2661590576171875, -0.24303436279296875, -0.21990966796875, -0.19678497314453125, -0.1736602783203125, -0.15053558349609375, -0.127410888671875, -0.10428619384765625, -0.0811614990234375, -0.05803680419921875, -0.034912109375, -0.01178741455078125, 0.0113372802734375, 0.03446197509765625, 0.057586669921875, 0.08071136474609375, 0.1038360595703125, 0.12696075439453125, 0.15008544921875, 0.17321014404296875, 0.1963348388671875, 0.21945953369140625, 0.242584228515625, 0.26570892333984375, 0.2888336181640625, 0.31195831298828125, 0.3350830078125, 0.35820770263671875, 0.3813323974609375, 0.40445709228515625, 0.427581787109375, 0.45070648193359375, 0.4738311767578125, 0.49695587158203125, 0.52008056640625, 0.5432052612304688, 0.5663299560546875, 0.5894546508789062, 0.612579345703125, 0.6357040405273438, 0.6588287353515625, 0.6819534301757812, 0.705078125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 12.0, 15.0, 17.0, 22.0, 45.0, 70.0, 85.0, 106.0, 128.0, 108.0, 101.0, 83.0, 62.0, 40.0, 23.0, 20.0, 18.0, 6.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002655029296875, -0.0025481581687927246, -0.0024412870407104492, -0.002334415912628174, -0.0022275447845458984, -0.002120673656463623, -0.0020138025283813477, -0.0019069314002990723, -0.0018000602722167969, -0.0016931891441345215, -0.001586318016052246, -0.0014794468879699707, -0.0013725757598876953, -0.00126570463180542, -0.0011588335037231445, -0.0010519623756408691, -0.0009450912475585938, -0.0008382201194763184, -0.000731348991394043, -0.0006244778633117676, -0.0005176067352294922, -0.0004107356071472168, -0.0003038644790649414, -0.00019699335098266602, -9.012222290039062e-05, 1.6748905181884766e-05, 0.00012362003326416016, 0.00023049116134643555, 0.00033736228942871094, 0.00044423341751098633, 0.0005511045455932617, 0.0006579756736755371, 0.0007648468017578125, 0.0008717179298400879, 0.0009785890579223633, 0.0010854601860046387, 0.001192331314086914, 0.0012992024421691895, 0.0014060735702514648, 0.0015129446983337402, 0.0016198158264160156, 0.001726686954498291, 0.0018335580825805664, 0.0019404292106628418, 0.002047300338745117, 0.0021541714668273926, 0.002261042594909668, 0.0023679137229919434, 0.0024747848510742188, 0.002581655979156494, 0.0026885271072387695, 0.002795398235321045, 0.0029022693634033203, 0.0030091404914855957, 0.003116011619567871, 0.0032228827476501465, 0.003329753875732422, 0.0034366250038146973, 0.0035434961318969727, 0.003650367259979248, 0.0037572383880615234, 0.003864109516143799, 0.003970980644226074, 0.00407785177230835, 0.004184722900390625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 18.0, 22.0, 35.0, 39.0, 63.0, 100.0, 178.0, 405.0, 1878.0, 1036122.0, 8540.0, 578.0, 230.0, 112.0, 65.0, 47.0, 27.0, 22.0, 12.0, 11.0, 6.0, 6.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.08642578125, -0.08424615859985352, -0.08206653594970703, -0.07988691329956055, -0.07770729064941406, -0.07552766799926758, -0.0733480453491211, -0.07116842269897461, -0.06898880004882812, -0.06680917739868164, -0.06462955474853516, -0.06244993209838867, -0.06027030944824219, -0.0580906867980957, -0.05591106414794922, -0.053731441497802734, -0.05155181884765625, -0.049372196197509766, -0.04719257354736328, -0.0450129508972168, -0.04283332824707031, -0.04065370559692383, -0.038474082946777344, -0.03629446029663086, -0.034114837646484375, -0.03193521499633789, -0.029755592346191406, -0.027575969696044922, -0.025396347045898438, -0.023216724395751953, -0.02103710174560547, -0.018857479095458984, -0.0166778564453125, -0.014498233795166016, -0.012318611145019531, -0.010138988494873047, -0.007959365844726562, -0.005779743194580078, -0.0036001205444335938, -0.0014204978942871094, 0.000759124755859375, 0.0029387474060058594, 0.005118370056152344, 0.007297992706298828, 0.009477615356445312, 0.011657238006591797, 0.013836860656738281, 0.016016483306884766, 0.01819610595703125, 0.020375728607177734, 0.02255535125732422, 0.024734973907470703, 0.026914596557617188, 0.029094219207763672, 0.031273841857910156, 0.03345346450805664, 0.035633087158203125, 0.03781270980834961, 0.039992332458496094, 0.04217195510864258, 0.04435157775878906, 0.04653120040893555, 0.04871082305908203, 0.050890445709228516, 0.053070068359375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 64.0, 593.0, 333.0, 21.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011174412444233894, -0.010907172225415707, -0.010639931075274944, -0.010372690856456757, -0.010105449706315994, -0.009838209487497807, -0.009570968337357044, -0.009303728118538857, -0.009036486968398094, -0.008769246749579906, -0.008502005599439144, -0.008234765380620956, -0.007967524230480194, -0.007700284011662006, -0.007433043327182531, -0.007165802642703056, -0.006898562423884869, -0.006631321739405394, -0.006364081054925919, -0.0060968403704464436, -0.0058295996859669685, -0.005562359467148781, -0.005295118782669306, -0.005027878098189831, -0.004760637413710356, -0.004493396729230881, -0.004226156044751406, -0.003958915360271931, -0.0036916749086230993, -0.0034244342241436243, -0.003157193772494793, -0.002889953088015318, -0.002622712403535843, -0.002355471719056368, -0.002088231034576893, -0.0018209905829280615, -0.0015537498984485865, -0.0012865092139691114, -0.0010192686459049582, -0.000752028077840805, -0.00048478739336133003, -0.00021754676708951592, 4.9693859182298183e-05, 0.0003169344854541123, 0.0005841751117259264, 0.0008514157962054014, 0.0011186563642695546, 0.0013858969323337078, 0.0016531376168131828, 0.0019203783012926579, 0.002187618985772133, 0.0024548594374209642, 0.0027221001219004393, 0.0029893408063799143, 0.0032565812580287457, 0.0035238219425082207, 0.0037910626269876957, 0.004058303311467171, 0.004325543995946646, 0.004592784680426121, 0.0048600248992443085, 0.005127266049385071, 0.0053945062682032585, 0.0056617469526827335, 0.0059289876371622086]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 15.0, 12.0, 23.0, 23.0, 35.0, 22.0, 30.0, 27.0, 42.0, 37.0, 39.0, 49.0, 39.0, 51.0, 44.0, 47.0, 39.0, 49.0, 34.0, 37.0, 35.0, 38.0, 28.0, 24.0, 29.0, 17.0, 14.0, 17.0, 12.0, 12.0, 6.0, 13.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013179183006286621, -0.0012793773785233498, -0.0012408364564180374, -0.001202295534312725, -0.0011637546122074127, -0.0011252136901021004, -0.001086672767996788, -0.0010481318458914757, -0.0010095909237861633, -0.000971050001680851, -0.0009325090795755386, -0.0008939681574702263, -0.0008554272353649139, -0.0008168863132596016, -0.0007783453911542892, -0.0007398044690489769, -0.0007012635469436646, -0.0006627226248383522, -0.0006241817027330399, -0.0005856407806277275, -0.0005470998585224152, -0.0005085589364171028, -0.00047001801431179047, -0.0004314770922064781, -0.00039293617010116577, -0.0003543952479958534, -0.0003158543258905411, -0.00027731340378522873, -0.00023877248167991638, -0.00020023155957460403, -0.0001616906374692917, -0.00012314971536397934, -8.460879325866699e-05, -4.6067871153354645e-05, -7.526949048042297e-06, 3.101397305727005e-05, 6.95548951625824e-05, 0.00010809581726789474, 0.0001466367393732071, 0.00018517766147851944, 0.0002237185835838318, 0.00026225950568914413, 0.0003008004277944565, 0.00033934134989976883, 0.0003778822720050812, 0.0004164231941103935, 0.00045496411621570587, 0.0004935050383210182, 0.0005320459604263306, 0.0005705868825316429, 0.0006091278046369553, 0.0006476687267422676, 0.00068620964884758, 0.0007247505709528923, 0.0007632914930582047, 0.000801832415163517, 0.0008403733372688293, 0.0008789142593741417, 0.000917455181479454, 0.0009559961035847664, 0.0009945370256900787, 0.001033077947795391, 0.0010716188699007034, 0.0011101597920060158, 0.0011487007141113281]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 7.0, 7.0, 18.0, 23.0, 25.0, 15.0, 20.0, 34.0, 41.0, 34.0, 47.0, 52.0, 52.0, 59.0, 39.0, 55.0, 53.0, 37.0, 49.0, 47.0, 35.0, 37.0, 45.0, 31.0, 27.0, 30.0, 19.0, 10.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23828125, -6.01953125, -5.80078125, -5.58203125, -5.36328125, -5.14453125, -4.92578125, -4.70703125, -4.48828125, -4.26953125, -4.05078125, -3.83203125, -3.61328125, -3.39453125, -3.17578125, -2.95703125, -2.73828125, -2.51953125, -2.30078125, -2.08203125, -1.86328125, -1.64453125, -1.42578125, -1.20703125, -0.98828125, -0.76953125, -0.55078125, -0.33203125, -0.11328125, 0.10546875, 0.32421875, 0.54296875, 0.76171875, 0.98046875, 1.19921875, 1.41796875, 1.63671875, 1.85546875, 2.07421875, 2.29296875, 2.51171875, 2.73046875, 2.94921875, 3.16796875, 3.38671875, 3.60546875, 3.82421875, 4.04296875, 4.26171875, 4.48046875, 4.69921875, 4.91796875, 5.13671875, 5.35546875, 5.57421875, 5.79296875, 6.01171875, 6.23046875, 6.44921875, 6.66796875, 6.88671875, 7.10546875, 7.32421875, 7.54296875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 6.0, 14.0, 21.0, 42.0, 44.0, 65.0, 107.0, 169.0, 342.0, 520.0, 849.0, 1391.0, 2405.0, 4223.0, 8492.0, 17510.0, 41938.0, 124829.0, 436218.0, 275946.0, 77416.0, 28696.0, 12733.0, 6349.0, 3389.0, 1938.0, 1153.0, 668.0, 368.0, 243.0, 173.0, 102.0, 61.0, 38.0, 35.0, 23.0, 3.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.04962158203125, -3.9039306640625, -3.75823974609375, -3.612548828125, -3.46685791015625, -3.3211669921875, -3.17547607421875, -3.02978515625, -2.88409423828125, -2.7384033203125, -2.59271240234375, -2.447021484375, -2.30133056640625, -2.1556396484375, -2.00994873046875, -1.8642578125, -1.71856689453125, -1.5728759765625, -1.42718505859375, -1.281494140625, -1.13580322265625, -0.9901123046875, -0.84442138671875, -0.69873046875, -0.55303955078125, -0.4073486328125, -0.26165771484375, -0.115966796875, 0.02972412109375, 0.1754150390625, 0.32110595703125, 0.466796875, 0.61248779296875, 0.7581787109375, 0.90386962890625, 1.049560546875, 1.19525146484375, 1.3409423828125, 1.48663330078125, 1.63232421875, 1.77801513671875, 1.9237060546875, 2.06939697265625, 2.215087890625, 2.36077880859375, 2.5064697265625, 2.65216064453125, 2.7978515625, 2.94354248046875, 3.0892333984375, 3.23492431640625, 3.380615234375, 3.52630615234375, 3.6719970703125, 3.81768798828125, 3.96337890625, 4.10906982421875, 4.2547607421875, 4.40045166015625, 4.546142578125, 4.69183349609375, 4.8375244140625, 4.98321533203125, 5.12890625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 6.0, 1.0, 4.0, 4.0, 12.0, 11.0, 10.0, 14.0, 11.0, 14.0, 16.0, 24.0, 29.0, 26.0, 22.0, 40.0, 36.0, 47.0, 46.0, 40.0, 84.0, 249.0, 1683.0, 143.0, 77.0, 50.0, 30.0, 41.0, 29.0, 35.0, 21.0, 27.0, 33.0, 27.0, 20.0, 20.0, 21.0, 7.0, 7.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.140625, -20.524169921875, -19.90771484375, -19.291259765625, -18.6748046875, -18.058349609375, -17.44189453125, -16.825439453125, -16.208984375, -15.592529296875, -14.97607421875, -14.359619140625, -13.7431640625, -13.126708984375, -12.51025390625, -11.893798828125, -11.27734375, -10.660888671875, -10.04443359375, -9.427978515625, -8.8115234375, -8.195068359375, -7.57861328125, -6.962158203125, -6.345703125, -5.729248046875, -5.11279296875, -4.496337890625, -3.8798828125, -3.263427734375, -2.64697265625, -2.030517578125, -1.4140625, -0.797607421875, -0.18115234375, 0.435302734375, 1.0517578125, 1.668212890625, 2.28466796875, 2.901123046875, 3.517578125, 4.134033203125, 4.75048828125, 5.366943359375, 5.9833984375, 6.599853515625, 7.21630859375, 7.832763671875, 8.44921875, 9.065673828125, 9.68212890625, 10.298583984375, 10.9150390625, 11.531494140625, 12.14794921875, 12.764404296875, 13.380859375, 13.997314453125, 14.61376953125, 15.230224609375, 15.8466796875, 16.463134765625, 17.07958984375, 17.696044921875, 18.3125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 3.0, 5.0, 7.0, 12.0, 11.0, 24.0, 33.0, 35.0, 57.0, 71.0, 88.0, 151.0, 247.0, 333.0, 1362.0, 48549.0, 3087763.0, 5404.0, 663.0, 262.0, 206.0, 116.0, 77.0, 59.0, 37.0, 33.0, 23.0, 24.0, 18.0, 7.0, 6.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.96875, -55.2041015625, -53.439453125, -51.6748046875, -49.91015625, -48.1455078125, -46.380859375, -44.6162109375, -42.8515625, -41.0869140625, -39.322265625, -37.5576171875, -35.79296875, -34.0283203125, -32.263671875, -30.4990234375, -28.734375, -26.9697265625, -25.205078125, -23.4404296875, -21.67578125, -19.9111328125, -18.146484375, -16.3818359375, -14.6171875, -12.8525390625, -11.087890625, -9.3232421875, -7.55859375, -5.7939453125, -4.029296875, -2.2646484375, -0.5, 1.2646484375, 3.029296875, 4.7939453125, 6.55859375, 8.3232421875, 10.087890625, 11.8525390625, 13.6171875, 15.3818359375, 17.146484375, 18.9111328125, 20.67578125, 22.4404296875, 24.205078125, 25.9697265625, 27.734375, 29.4990234375, 31.263671875, 33.0283203125, 34.79296875, 36.5576171875, 38.322265625, 40.0869140625, 41.8515625, 43.6162109375, 45.380859375, 47.1455078125, 48.91015625, 50.6748046875, 52.439453125, 54.2041015625, 55.96875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 879.0, 129.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.23406219482422, -55.09247970581055, -47.950897216796875, -40.8093147277832, -33.66773223876953, -26.52614974975586, -19.384567260742188, -12.242984771728516, -5.101402282714844, 2.040180206298828, 9.1817626953125, 16.323345184326172, 23.464927673339844, 30.606510162353516, 37.74809265136719, 44.88967514038086, 52.03125762939453, 59.1728401184082, 66.31442260742188, 73.45600891113281, 80.59758758544922, 87.73916625976562, 94.88075256347656, 102.0223388671875, 109.1639175415039, 116.30549621582031, 123.44708251953125, 130.5886688232422, 137.73025512695312, 144.871826171875, 152.01341247558594, 159.15499877929688, 166.29656982421875, 173.4381561279297, 180.57974243164062, 187.7213134765625, 194.86289978027344, 202.00448608398438, 209.14605712890625, 216.2876434326172, 223.42922973632812, 230.57081604003906, 237.71240234375, 244.85397338867188, 251.9955596923828, 259.13714599609375, 266.2787170410156, 273.4203186035156, 280.5618896484375, 287.7034606933594, 294.8450622558594, 301.98663330078125, 309.12823486328125, 316.2698059082031, 323.411376953125, 330.552978515625, 337.6945495605469, 344.83612060546875, 351.97772216796875, 359.1192932128906, 366.2608642578125, 373.4024658203125, 380.5440368652344, 387.6856384277344, 394.82720947265625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 12.0, 9.0, 15.0, 13.0, 17.0, 22.0, 20.0, 34.0, 40.0, 25.0, 40.0, 38.0, 43.0, 42.0, 39.0, 28.0, 47.0, 44.0, 48.0, 37.0, 43.0, 35.0, 36.0, 38.0, 23.0, 36.0, 25.0, 32.0, 17.0, 16.0, 13.0, 7.0, 8.0, 9.0, 5.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.165687561035156, -48.547115325927734, -46.92854309082031, -45.309967041015625, -43.6913948059082, -42.07282257080078, -40.45425033569336, -38.83567810058594, -37.21710205078125, -35.59852981567383, -33.979957580566406, -32.36138153076172, -30.742809295654297, -29.124237060546875, -27.505664825439453, -25.88709259033203, -24.26852035522461, -22.649948120117188, -21.031373977661133, -19.41280174255371, -17.794227600097656, -16.175655364990234, -14.557083129882812, -12.938509941101074, -11.319936752319336, -9.701363563537598, -8.08279037475586, -6.4642181396484375, -4.845644950866699, -3.227071762084961, -1.608499526977539, 0.010073661804199219, 1.6286430358886719, 3.247215986251831, 4.86578893661499, 6.48436164855957, 8.102934837341309, 9.721508026123047, 11.340080261230469, 12.958653450012207, 14.577226638793945, 16.195798873901367, 17.814373016357422, 19.432945251464844, 21.051517486572266, 22.67009162902832, 24.288663864135742, 25.907238006591797, 27.52581024169922, 29.14438247680664, 30.762956619262695, 32.38153076171875, 34.00010299682617, 35.618675231933594, 37.237247467041016, 38.85581970214844, 40.474395751953125, 42.09296798706055, 43.71154022216797, 45.330116271972656, 46.94868850708008, 48.5672607421875, 50.18583297729492, 51.804405212402344, 53.422977447509766]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 9.0, 18.0, 16.0, 22.0, 20.0, 22.0, 33.0, 33.0, 24.0, 55.0, 50.0, 51.0, 55.0, 43.0, 51.0, 52.0, 47.0, 37.0, 39.0, 40.0, 45.0, 34.0, 33.0, 28.0, 34.0, 25.0, 12.0, 12.0, 12.0, 13.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.35888671875, -6.1396484375, -5.92041015625, -5.701171875, -5.48193359375, -5.2626953125, -5.04345703125, -4.82421875, -4.60498046875, -4.3857421875, -4.16650390625, -3.947265625, -3.72802734375, -3.5087890625, -3.28955078125, -3.0703125, -2.85107421875, -2.6318359375, -2.41259765625, -2.193359375, -1.97412109375, -1.7548828125, -1.53564453125, -1.31640625, -1.09716796875, -0.8779296875, -0.65869140625, -0.439453125, -0.22021484375, -0.0009765625, 0.21826171875, 0.4375, 0.65673828125, 0.8759765625, 1.09521484375, 1.314453125, 1.53369140625, 1.7529296875, 1.97216796875, 2.19140625, 2.41064453125, 2.6298828125, 2.84912109375, 3.068359375, 3.28759765625, 3.5068359375, 3.72607421875, 3.9453125, 4.16455078125, 4.3837890625, 4.60302734375, 4.822265625, 5.04150390625, 5.2607421875, 5.47998046875, 5.69921875, 5.91845703125, 6.1376953125, 6.35693359375, 6.576171875, 6.79541015625, 7.0146484375, 7.23388671875, 7.453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 12.0, 18.0, 14.0, 16.0, 35.0, 35.0, 55.0, 66.0, 111.0, 160.0, 452.0, 4413.0, 408952.0, 3743609.0, 34200.0, 1382.0, 275.0, 117.0, 77.0, 56.0, 42.0, 40.0, 27.0, 24.0, 22.0, 11.0, 10.0, 1.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.53125, -35.32470703125, -34.1181640625, -32.91162109375, -31.705078125, -30.49853515625, -29.2919921875, -28.08544921875, -26.87890625, -25.67236328125, -24.4658203125, -23.25927734375, -22.052734375, -20.84619140625, -19.6396484375, -18.43310546875, -17.2265625, -16.02001953125, -14.8134765625, -13.60693359375, -12.400390625, -11.19384765625, -9.9873046875, -8.78076171875, -7.57421875, -6.36767578125, -5.1611328125, -3.95458984375, -2.748046875, -1.54150390625, -0.3349609375, 0.87158203125, 2.078125, 3.28466796875, 4.4912109375, 5.69775390625, 6.904296875, 8.11083984375, 9.3173828125, 10.52392578125, 11.73046875, 12.93701171875, 14.1435546875, 15.35009765625, 16.556640625, 17.76318359375, 18.9697265625, 20.17626953125, 21.3828125, 22.58935546875, 23.7958984375, 25.00244140625, 26.208984375, 27.41552734375, 28.6220703125, 29.82861328125, 31.03515625, 32.24169921875, 33.4482421875, 34.65478515625, 35.861328125, 37.06787109375, 38.2744140625, 39.48095703125, 40.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 22.0, 21.0, 35.0, 53.0, 85.0, 122.0, 146.0, 216.0, 290.0, 400.0, 479.0, 495.0, 466.0, 343.0, 250.0, 179.0, 123.0, 89.0, 63.0, 50.0, 29.0, 26.0, 21.0, 14.0, 8.0, 5.0, 0.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.069580078125, -12.59228515625, -12.114990234375, -11.6376953125, -11.160400390625, -10.68310546875, -10.205810546875, -9.728515625, -9.251220703125, -8.77392578125, -8.296630859375, -7.8193359375, -7.342041015625, -6.86474609375, -6.387451171875, -5.91015625, -5.432861328125, -4.95556640625, -4.478271484375, -4.0009765625, -3.523681640625, -3.04638671875, -2.569091796875, -2.091796875, -1.614501953125, -1.13720703125, -0.659912109375, -0.1826171875, 0.294677734375, 0.77197265625, 1.249267578125, 1.7265625, 2.203857421875, 2.68115234375, 3.158447265625, 3.6357421875, 4.113037109375, 4.59033203125, 5.067626953125, 5.544921875, 6.022216796875, 6.49951171875, 6.976806640625, 7.4541015625, 7.931396484375, 8.40869140625, 8.885986328125, 9.36328125, 9.840576171875, 10.31787109375, 10.795166015625, 11.2724609375, 11.749755859375, 12.22705078125, 12.704345703125, 13.181640625, 13.658935546875, 14.13623046875, 14.613525390625, 15.0908203125, 15.568115234375, 16.04541015625, 16.522705078125, 17.0]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 14.0, 10.0, 12.0, 18.0, 12.0, 27.0, 49.0, 65.0, 85.0, 124.0, 138.0, 230.0, 324.0, 729.0, 4067.0, 154566.0, 3930726.0, 97904.0, 3359.0, 689.0, 329.0, 231.0, 165.0, 106.0, 77.0, 58.0, 40.0, 31.0, 31.0, 20.0, 16.0, 9.0, 6.0, 3.0, 9.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.75, -59.1279296875, -57.505859375, -55.8837890625, -54.26171875, -52.6396484375, -51.017578125, -49.3955078125, -47.7734375, -46.1513671875, -44.529296875, -42.9072265625, -41.28515625, -39.6630859375, -38.041015625, -36.4189453125, -34.796875, -33.1748046875, -31.552734375, -29.9306640625, -28.30859375, -26.6865234375, -25.064453125, -23.4423828125, -21.8203125, -20.1982421875, -18.576171875, -16.9541015625, -15.33203125, -13.7099609375, -12.087890625, -10.4658203125, -8.84375, -7.2216796875, -5.599609375, -3.9775390625, -2.35546875, -0.7333984375, 0.888671875, 2.5107421875, 4.1328125, 5.7548828125, 7.376953125, 8.9990234375, 10.62109375, 12.2431640625, 13.865234375, 15.4873046875, 17.109375, 18.7314453125, 20.353515625, 21.9755859375, 23.59765625, 25.2197265625, 26.841796875, 28.4638671875, 30.0859375, 31.7080078125, 33.330078125, 34.9521484375, 36.57421875, 38.1962890625, 39.818359375, 41.4404296875, 43.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 111.0, 376.0, 374.0, 114.0, 17.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.62362670898438, -147.85243225097656, -140.0812225341797, -132.31002807617188, -124.53882598876953, -116.76762390136719, -108.99642181396484, -101.2252197265625, -93.45402526855469, -85.68282318115234, -77.91162109375, -70.14042663574219, -62.369224548339844, -54.5980224609375, -46.826820373535156, -39.05562210083008, -31.28441619873047, -23.513216018676758, -15.74201488494873, -7.970813751220703, -0.1996135711669922, 7.571586608886719, 15.342788696289062, 23.11398696899414, 30.885189056396484, 38.65639114379883, 46.427589416503906, 54.19879150390625, 61.969993591308594, 69.74119567871094, 77.51239013671875, 85.2835922241211, 93.05479431152344, 100.82599639892578, 108.59719848632812, 116.36839294433594, 124.13959503173828, 131.91079711914062, 139.6820068359375, 147.4532012939453, 155.22439575195312, 162.99559020996094, 170.7667999267578, 178.53799438476562, 186.3092041015625, 194.0803985595703, 201.85159301757812, 209.622802734375, 217.39401245117188, 225.1652069091797, 232.93641662597656, 240.70761108398438, 248.47882080078125, 256.25, 264.0212097167969, 271.79241943359375, 279.5635986328125, 287.3348083496094, 295.1059875488281, 302.877197265625, 310.6484069824219, 318.41961669921875, 326.1907958984375, 333.9620056152344, 341.73321533203125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 10.0, 7.0, 5.0, 8.0, 7.0, 8.0, 15.0, 24.0, 20.0, 25.0, 39.0, 26.0, 44.0, 50.0, 37.0, 57.0, 55.0, 55.0, 50.0, 46.0, 37.0, 52.0, 48.0, 40.0, 43.0, 33.0, 28.0, 18.0, 24.0, 18.0, 14.0, 21.0, 10.0, 10.0, 6.0, 5.0, 3.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-57.649566650390625, -55.94164276123047, -54.23371505737305, -52.525787353515625, -50.81786346435547, -49.10993957519531, -47.40201187133789, -45.69408416748047, -43.98616027832031, -42.278236389160156, -40.570308685302734, -38.86238098144531, -37.154457092285156, -35.446533203125, -33.73860549926758, -32.030677795410156, -30.32275390625, -28.61482810974121, -26.906902313232422, -25.198976516723633, -23.491050720214844, -21.783124923706055, -20.075199127197266, -18.367273330688477, -16.659347534179688, -14.951421737670898, -13.24349594116211, -11.53557014465332, -9.827644348144531, -8.119718551635742, -6.411792755126953, -4.703866958618164, -2.995941162109375, -1.288015365600586, 0.4199104309082031, 2.127836227416992, 3.8357620239257812, 5.54368782043457, 7.251613616943359, 8.959539413452148, 10.667465209960938, 12.375391006469727, 14.083316802978516, 15.791242599487305, 17.499168395996094, 19.207094192504883, 20.915019989013672, 22.62294578552246, 24.33087158203125, 26.03879737854004, 27.746723175048828, 29.454648971557617, 31.162574768066406, 32.87049865722656, 34.578426361083984, 36.286354064941406, 37.99427795410156, 39.70220184326172, 41.41012954711914, 43.11805725097656, 44.82598114013672, 46.533905029296875, 48.2418327331543, 49.94976043701172, 51.657684326171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 14.0, 14.0, 9.0, 13.0, 26.0, 23.0, 39.0, 37.0, 29.0, 33.0, 52.0, 34.0, 58.0, 50.0, 52.0, 49.0, 52.0, 48.0, 50.0, 43.0, 32.0, 37.0, 35.0, 36.0, 15.0, 25.0, 18.0, 15.0, 15.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.37213134765625, -6.1466064453125, -5.92108154296875, -5.695556640625, -5.47003173828125, -5.2445068359375, -5.01898193359375, -4.79345703125, -4.56793212890625, -4.3424072265625, -4.11688232421875, -3.891357421875, -3.66583251953125, -3.4403076171875, -3.21478271484375, -2.9892578125, -2.76373291015625, -2.5382080078125, -2.31268310546875, -2.087158203125, -1.86163330078125, -1.6361083984375, -1.41058349609375, -1.18505859375, -0.95953369140625, -0.7340087890625, -0.50848388671875, -0.282958984375, -0.05743408203125, 0.1680908203125, 0.39361572265625, 0.619140625, 0.84466552734375, 1.0701904296875, 1.29571533203125, 1.521240234375, 1.74676513671875, 1.9722900390625, 2.19781494140625, 2.42333984375, 2.64886474609375, 2.8743896484375, 3.09991455078125, 3.325439453125, 3.55096435546875, 3.7764892578125, 4.00201416015625, 4.2275390625, 4.45306396484375, 4.6785888671875, 4.90411376953125, 5.129638671875, 5.35516357421875, 5.5806884765625, 5.80621337890625, 6.03173828125, 6.25726318359375, 6.4827880859375, 6.70831298828125, 6.933837890625, 7.15936279296875, 7.3848876953125, 7.61041259765625, 7.8359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 5.0, 17.0, 27.0, 39.0, 57.0, 79.0, 131.0, 176.0, 288.0, 448.0, 741.0, 975.0, 1601.0, 2513.0, 3833.0, 6117.0, 9422.0, 14631.0, 23940.0, 39216.0, 68221.0, 130909.0, 250006.0, 225964.0, 113897.0, 60266.0, 35451.0, 21885.0, 13361.0, 8610.0, 5582.0, 3610.0, 2277.0, 1462.0, 962.0, 615.0, 424.0, 254.0, 201.0, 102.0, 80.0, 54.0, 30.0, 28.0, 14.0, 15.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94482421875, -0.9152069091796875, -0.885589599609375, -0.8559722900390625, -0.82635498046875, -0.7967376708984375, -0.767120361328125, -0.7375030517578125, -0.7078857421875, -0.6782684326171875, -0.648651123046875, -0.6190338134765625, -0.58941650390625, -0.5597991943359375, -0.530181884765625, -0.5005645751953125, -0.470947265625, -0.4413299560546875, -0.411712646484375, -0.3820953369140625, -0.35247802734375, -0.3228607177734375, -0.293243408203125, -0.2636260986328125, -0.2340087890625, -0.2043914794921875, -0.174774169921875, -0.1451568603515625, -0.11553955078125, -0.0859222412109375, -0.056304931640625, -0.0266876220703125, 0.0029296875, 0.0325469970703125, 0.062164306640625, 0.0917816162109375, 0.12139892578125, 0.1510162353515625, 0.180633544921875, 0.2102508544921875, 0.2398681640625, 0.2694854736328125, 0.299102783203125, 0.3287200927734375, 0.35833740234375, 0.3879547119140625, 0.417572021484375, 0.4471893310546875, 0.476806640625, 0.5064239501953125, 0.536041259765625, 0.5656585693359375, 0.59527587890625, 0.6248931884765625, 0.654510498046875, 0.6841278076171875, 0.7137451171875, 0.7433624267578125, 0.772979736328125, 0.8025970458984375, 0.83221435546875, 0.8618316650390625, 0.891448974609375, 0.9210662841796875, 0.95068359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 3.0, 6.0, 12.0, 11.0, 19.0, 13.0, 14.0, 18.0, 18.0, 22.0, 27.0, 36.0, 28.0, 36.0, 40.0, 29.0, 34.0, 34.0, 43.0, 41.0, 1065.0, 37.0, 34.0, 30.0, 52.0, 40.0, 42.0, 36.0, 22.0, 14.0, 23.0, 34.0, 14.0, 12.0, 14.0, 14.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.712890625, -3.598358154296875, -3.48382568359375, -3.369293212890625, -3.2547607421875, -3.140228271484375, -3.02569580078125, -2.911163330078125, -2.796630859375, -2.682098388671875, -2.56756591796875, -2.453033447265625, -2.3385009765625, -2.223968505859375, -2.10943603515625, -1.994903564453125, -1.88037109375, -1.765838623046875, -1.65130615234375, -1.536773681640625, -1.4222412109375, -1.307708740234375, -1.19317626953125, -1.078643798828125, -0.964111328125, -0.849578857421875, -0.73504638671875, -0.620513916015625, -0.5059814453125, -0.391448974609375, -0.27691650390625, -0.162384033203125, -0.0478515625, 0.066680908203125, 0.18121337890625, 0.295745849609375, 0.4102783203125, 0.524810791015625, 0.63934326171875, 0.753875732421875, 0.868408203125, 0.982940673828125, 1.09747314453125, 1.212005615234375, 1.3265380859375, 1.441070556640625, 1.55560302734375, 1.670135498046875, 1.78466796875, 1.899200439453125, 2.01373291015625, 2.128265380859375, 2.2427978515625, 2.357330322265625, 2.47186279296875, 2.586395263671875, 2.700927734375, 2.815460205078125, 2.92999267578125, 3.044525146484375, 3.1590576171875, 3.273590087890625, 3.38812255859375, 3.502655029296875, 3.6171875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 21.0, 25.0, 27.0, 49.0, 82.0, 119.0, 130.0, 213.0, 272.0, 358.0, 485.0, 669.0, 901.0, 1276.0, 1807.0, 2561.0, 3769.0, 5194.0, 7437.0, 10993.0, 16256.0, 24786.0, 37790.0, 60623.0, 102934.0, 178690.0, 1266940.0, 143266.0, 81989.0, 49412.0, 31986.0, 20983.0, 13904.0, 9283.0, 6504.0, 4427.0, 3241.0, 2141.0, 1554.0, 1110.0, 775.0, 587.0, 430.0, 315.0, 241.0, 167.0, 127.0, 93.0, 62.0, 37.0, 33.0, 21.0, 10.0, 9.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.6201171875, -0.6009140014648438, -0.5817108154296875, -0.5625076293945312, -0.543304443359375, -0.5241012573242188, -0.5048980712890625, -0.48569488525390625, -0.46649169921875, -0.44728851318359375, -0.4280853271484375, -0.40888214111328125, -0.389678955078125, -0.37047576904296875, -0.3512725830078125, -0.33206939697265625, -0.3128662109375, -0.29366302490234375, -0.2744598388671875, -0.25525665283203125, -0.236053466796875, -0.21685028076171875, -0.1976470947265625, -0.17844390869140625, -0.15924072265625, -0.14003753662109375, -0.1208343505859375, -0.10163116455078125, -0.082427978515625, -0.06322479248046875, -0.0440216064453125, -0.02481842041015625, -0.005615234375, 0.01358795166015625, 0.0327911376953125, 0.05199432373046875, 0.071197509765625, 0.09040069580078125, 0.1096038818359375, 0.12880706787109375, 0.14801025390625, 0.16721343994140625, 0.1864166259765625, 0.20561981201171875, 0.224822998046875, 0.24402618408203125, 0.2632293701171875, 0.28243255615234375, 0.3016357421875, 0.32083892822265625, 0.3400421142578125, 0.35924530029296875, 0.378448486328125, 0.39765167236328125, 0.4168548583984375, 0.43605804443359375, 0.45526123046875, 0.47446441650390625, 0.4936676025390625, 0.5128707885742188, 0.532073974609375, 0.5512771606445312, 0.5704803466796875, 0.5896835327148438, 0.60888671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 7.0, 12.0, 11.0, 19.0, 18.0, 26.0, 27.0, 23.0, 31.0, 39.0, 63.0, 57.0, 60.0, 61.0, 54.0, 61.0, 61.0, 50.0, 53.0, 43.0, 40.0, 36.0, 21.0, 21.0, 12.0, 20.0, 11.0, 9.0, 11.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020503997802734375, -0.001985311508178711, -0.0019202232360839844, -0.0018551349639892578, -0.0017900466918945312, -0.0017249584197998047, -0.0016598701477050781, -0.0015947818756103516, -0.001529693603515625, -0.0014646053314208984, -0.0013995170593261719, -0.0013344287872314453, -0.0012693405151367188, -0.0012042522430419922, -0.0011391639709472656, -0.001074075698852539, -0.0010089874267578125, -0.0009438991546630859, -0.0008788108825683594, -0.0008137226104736328, -0.0007486343383789062, -0.0006835460662841797, -0.0006184577941894531, -0.0005533695220947266, -0.00048828125, -0.00042319297790527344, -0.0003581047058105469, -0.0002930164337158203, -0.00022792816162109375, -0.0001628398895263672, -9.775161743164062e-05, -3.266334533691406e-05, 3.24249267578125e-05, 9.751319885253906e-05, 0.00016260147094726562, 0.0002276897430419922, 0.00029277801513671875, 0.0003578662872314453, 0.0004229545593261719, 0.00048804283142089844, 0.000553131103515625, 0.0006182193756103516, 0.0006833076477050781, 0.0007483959197998047, 0.0008134841918945312, 0.0008785724639892578, 0.0009436607360839844, 0.001008749008178711, 0.0010738372802734375, 0.001138925552368164, 0.0012040138244628906, 0.0012691020965576172, 0.0013341903686523438, 0.0013992786407470703, 0.0014643669128417969, 0.0015294551849365234, 0.00159454345703125, 0.0016596317291259766, 0.0017247200012207031, 0.0017898082733154297, 0.0018548965454101562, 0.0019199848175048828, 0.0019850730895996094, 0.002050161361694336, 0.0021152496337890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 9.0, 8.0, 14.0, 8.0, 20.0, 15.0, 23.0, 37.0, 38.0, 60.0, 84.0, 121.0, 188.0, 288.0, 711.0, 5853.0, 992997.0, 45896.0, 1051.0, 412.0, 200.0, 144.0, 90.0, 58.0, 39.0, 32.0, 27.0, 26.0, 24.0, 11.0, 15.0, 9.0, 5.0, 5.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.044281005859375, -0.04296588897705078, -0.04165077209472656, -0.040335655212402344, -0.039020538330078125, -0.037705421447753906, -0.03639030456542969, -0.03507518768310547, -0.03376007080078125, -0.03244495391845703, -0.031129837036132812, -0.029814720153808594, -0.028499603271484375, -0.027184486389160156, -0.025869369506835938, -0.02455425262451172, -0.0232391357421875, -0.02192401885986328, -0.020608901977539062, -0.019293785095214844, -0.017978668212890625, -0.016663551330566406, -0.015348434448242188, -0.014033317565917969, -0.01271820068359375, -0.011403083801269531, -0.010087966918945312, -0.008772850036621094, -0.007457733154296875, -0.006142616271972656, -0.0048274993896484375, -0.0035123825073242188, -0.002197265625, -0.0008821487426757812, 0.0004329681396484375, 0.0017480850219726562, 0.003063201904296875, 0.004378318786621094, 0.0056934356689453125, 0.007008552551269531, 0.00832366943359375, 0.009638786315917969, 0.010953903198242188, 0.012269020080566406, 0.013584136962890625, 0.014899253845214844, 0.016214370727539062, 0.01752948760986328, 0.0188446044921875, 0.02015972137451172, 0.021474838256835938, 0.022789955139160156, 0.024105072021484375, 0.025420188903808594, 0.026735305786132812, 0.02805042266845703, 0.02936553955078125, 0.03068065643310547, 0.03199577331542969, 0.033310890197753906, 0.034626007080078125, 0.035941123962402344, 0.03725624084472656, 0.03857135772705078, 0.039886474609375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 75.0, 501.0, 393.0, 39.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01471426896750927, -0.014460316859185696, -0.014206363819539547, -0.013952411711215973, -0.013698458671569824, -0.01344450656324625, -0.013190554454922676, -0.012936601415276527, -0.012682649306952953, -0.01242869719862938, -0.01217474415898323, -0.011920792050659657, -0.011666839011013508, -0.011412886902689934, -0.011158933863043785, -0.010904981754720211, -0.010651029646396637, -0.010397077538073063, -0.010143124498426914, -0.00988917239010334, -0.009635219350457191, -0.009381267242133617, -0.009127315133810043, -0.008873362094163895, -0.008619409054517746, -0.008365456946194172, -0.008111503906548023, -0.00785755179822445, -0.007603599224239588, -0.007349646650254726, -0.007095694076269865, -0.006841741502285004, -0.00658778939396143, -0.006333836819976568, -0.006079884245991707, -0.005825932137668133, -0.005571979563683271, -0.00531802698969841, -0.005064074415713549, -0.004810121841728687, -0.004556169267743826, -0.0043022166937589645, -0.004048264119774103, -0.0037943117786198854, -0.0035403594374656677, -0.0032864068634808064, -0.003032454289495945, -0.0027785017155110836, -0.002524549374356866, -0.0022705968003720045, -0.002016644459217787, -0.0017626918852329254, -0.0015087394276633859, -0.0012547869700938463, -0.001000834396108985, -0.0007468819385394454, -0.0004929294809699059, -0.00023897699429653585, 1.4975492376834154e-05, 0.0002689280081540346, 0.0005228804657235742, 0.0007768329232931137, 0.001030785497277975, 0.0012847379548475146, 0.0015386904124170542]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 9.0, 6.0, 3.0, 9.0, 4.0, 16.0, 11.0, 17.0, 30.0, 20.0, 27.0, 23.0, 29.0, 43.0, 37.0, 33.0, 57.0, 29.0, 42.0, 43.0, 43.0, 41.0, 37.0, 45.0, 43.0, 33.0, 28.0, 34.0, 28.0, 22.0, 28.0, 13.0, 21.0, 18.0, 21.0, 13.0, 10.0, 6.0, 6.0, 7.0, 9.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010458827018737793, -0.001012478955090046, -0.0009790752083063126, -0.0009456714615225792, -0.0009122677147388458, -0.0008788639679551125, -0.0008454602211713791, -0.0008120564743876457, -0.0007786527276039124, -0.000745248980820179, -0.0007118452340364456, -0.0006784414872527122, -0.0006450377404689789, -0.0006116339936852455, -0.0005782302469015121, -0.0005448265001177788, -0.0005114227533340454, -0.00047801900655031204, -0.0004446152597665787, -0.0004112115129828453, -0.00037780776619911194, -0.00034440401941537857, -0.0003110002726316452, -0.00027759652584791183, -0.00024419277906417847, -0.0002107890322804451, -0.00017738528549671173, -0.00014398153871297836, -0.000110577791929245, -7.717404514551163e-05, -4.377029836177826e-05, -1.0366551578044891e-05, 2.3037195205688477e-05, 5.6440941989421844e-05, 8.984468877315521e-05, 0.00012324843555688858, 0.00015665218234062195, 0.00019005592912435532, 0.00022345967590808868, 0.00025686342269182205, 0.0002902671694755554, 0.0003236709162592888, 0.00035707466304302216, 0.0003904784098267555, 0.0004238821566104889, 0.00045728590339422226, 0.0004906896501779556, 0.000524093396961689, 0.0005574971437454224, 0.0005909008905291557, 0.0006243046373128891, 0.0006577083840966225, 0.0006911121308803558, 0.0007245158776640892, 0.0007579196244478226, 0.0007913233712315559, 0.0008247271180152893, 0.0008581308647990227, 0.000891534611582756, 0.0009249383583664894, 0.0009583421051502228, 0.0009917458519339561, 0.0010251495987176895, 0.0010585533455014229, 0.0010919570922851562]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 14.0, 14.0, 9.0, 13.0, 26.0, 23.0, 39.0, 37.0, 29.0, 33.0, 52.0, 34.0, 58.0, 50.0, 52.0, 49.0, 52.0, 48.0, 50.0, 43.0, 32.0, 37.0, 35.0, 36.0, 15.0, 25.0, 18.0, 15.0, 15.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.37213134765625, -6.1466064453125, -5.92108154296875, -5.695556640625, -5.47003173828125, -5.2445068359375, -5.01898193359375, -4.79345703125, -4.56793212890625, -4.3424072265625, -4.11688232421875, -3.891357421875, -3.66583251953125, -3.4403076171875, -3.21478271484375, -2.9892578125, -2.76373291015625, -2.5382080078125, -2.31268310546875, -2.087158203125, -1.86163330078125, -1.6361083984375, -1.41058349609375, -1.18505859375, -0.95953369140625, -0.7340087890625, -0.50848388671875, -0.282958984375, -0.05743408203125, 0.1680908203125, 0.39361572265625, 0.619140625, 0.84466552734375, 1.0701904296875, 1.29571533203125, 1.521240234375, 1.74676513671875, 1.9722900390625, 2.19781494140625, 2.42333984375, 2.64886474609375, 2.8743896484375, 3.09991455078125, 3.325439453125, 3.55096435546875, 3.7764892578125, 4.00201416015625, 4.2275390625, 4.45306396484375, 4.6785888671875, 4.90411376953125, 5.129638671875, 5.35516357421875, 5.5806884765625, 5.80621337890625, 6.03173828125, 6.25726318359375, 6.4827880859375, 6.70831298828125, 6.933837890625, 7.15936279296875, 7.3848876953125, 7.61041259765625, 7.8359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 4.0, 2.0, 6.0, 12.0, 18.0, 15.0, 31.0, 38.0, 53.0, 75.0, 114.0, 172.0, 252.0, 403.0, 594.0, 897.0, 1377.0, 2147.0, 3382.0, 5434.0, 8461.0, 14366.0, 26787.0, 59989.0, 166177.0, 423137.0, 195597.0, 68331.0, 29928.0, 15674.0, 9200.0, 5609.0, 3611.0, 2355.0, 1420.0, 1001.0, 609.0, 454.0, 249.0, 178.0, 128.0, 76.0, 58.0, 43.0, 29.0, 25.0, 14.0, 10.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.173828125, -3.062744140625, -2.95166015625, -2.840576171875, -2.7294921875, -2.618408203125, -2.50732421875, -2.396240234375, -2.28515625, -2.174072265625, -2.06298828125, -1.951904296875, -1.8408203125, -1.729736328125, -1.61865234375, -1.507568359375, -1.396484375, -1.285400390625, -1.17431640625, -1.063232421875, -0.9521484375, -0.841064453125, -0.72998046875, -0.618896484375, -0.5078125, -0.396728515625, -0.28564453125, -0.174560546875, -0.0634765625, 0.047607421875, 0.15869140625, 0.269775390625, 0.380859375, 0.491943359375, 0.60302734375, 0.714111328125, 0.8251953125, 0.936279296875, 1.04736328125, 1.158447265625, 1.26953125, 1.380615234375, 1.49169921875, 1.602783203125, 1.7138671875, 1.824951171875, 1.93603515625, 2.047119140625, 2.158203125, 2.269287109375, 2.38037109375, 2.491455078125, 2.6025390625, 2.713623046875, 2.82470703125, 2.935791015625, 3.046875, 3.157958984375, 3.26904296875, 3.380126953125, 3.4912109375, 3.602294921875, 3.71337890625, 3.824462890625, 3.935546875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 7.0, 9.0, 14.0, 17.0, 18.0, 16.0, 27.0, 16.0, 35.0, 25.0, 32.0, 38.0, 44.0, 48.0, 63.0, 81.0, 121.0, 1548.0, 308.0, 92.0, 77.0, 47.0, 49.0, 42.0, 40.0, 38.0, 20.0, 18.0, 21.0, 25.0, 16.0, 11.0, 14.0, 11.0, 10.0, 9.0, 4.0, 8.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0], "bins": [-23.65625, -22.97802734375, -22.2998046875, -21.62158203125, -20.943359375, -20.26513671875, -19.5869140625, -18.90869140625, -18.23046875, -17.55224609375, -16.8740234375, -16.19580078125, -15.517578125, -14.83935546875, -14.1611328125, -13.48291015625, -12.8046875, -12.12646484375, -11.4482421875, -10.77001953125, -10.091796875, -9.41357421875, -8.7353515625, -8.05712890625, -7.37890625, -6.70068359375, -6.0224609375, -5.34423828125, -4.666015625, -3.98779296875, -3.3095703125, -2.63134765625, -1.953125, -1.27490234375, -0.5966796875, 0.08154296875, 0.759765625, 1.43798828125, 2.1162109375, 2.79443359375, 3.47265625, 4.15087890625, 4.8291015625, 5.50732421875, 6.185546875, 6.86376953125, 7.5419921875, 8.22021484375, 8.8984375, 9.57666015625, 10.2548828125, 10.93310546875, 11.611328125, 12.28955078125, 12.9677734375, 13.64599609375, 14.32421875, 15.00244140625, 15.6806640625, 16.35888671875, 17.037109375, 17.71533203125, 18.3935546875, 19.07177734375, 19.75]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 13.0, 10.0, 10.0, 13.0, 28.0, 25.0, 32.0, 55.0, 90.0, 127.0, 202.0, 444.0, 1220.0, 18333.0, 3112990.0, 10108.0, 1051.0, 360.0, 210.0, 119.0, 77.0, 54.0, 34.0, 30.0, 12.0, 10.0, 9.0, 11.0, 8.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-69.5625, -67.1162109375, -64.669921875, -62.2236328125, -59.77734375, -57.3310546875, -54.884765625, -52.4384765625, -49.9921875, -47.5458984375, -45.099609375, -42.6533203125, -40.20703125, -37.7607421875, -35.314453125, -32.8681640625, -30.421875, -27.9755859375, -25.529296875, -23.0830078125, -20.63671875, -18.1904296875, -15.744140625, -13.2978515625, -10.8515625, -8.4052734375, -5.958984375, -3.5126953125, -1.06640625, 1.3798828125, 3.826171875, 6.2724609375, 8.71875, 11.1650390625, 13.611328125, 16.0576171875, 18.50390625, 20.9501953125, 23.396484375, 25.8427734375, 28.2890625, 30.7353515625, 33.181640625, 35.6279296875, 38.07421875, 40.5205078125, 42.966796875, 45.4130859375, 47.859375, 50.3056640625, 52.751953125, 55.1982421875, 57.64453125, 60.0908203125, 62.537109375, 64.9833984375, 67.4296875, 69.8759765625, 72.322265625, 74.7685546875, 77.21484375, 79.6611328125, 82.107421875, 84.5537109375, 87.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 801.0, 193.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.54315948486328, -65.83824920654297, -56.133338928222656, -46.42842483520508, -36.723514556884766, -27.018604278564453, -17.313690185546875, -7.6087799072265625, 2.09613037109375, 11.801041603088379, 21.505952835083008, 31.210865020751953, 40.915775299072266, 50.62068557739258, 60.325599670410156, 70.03050994873047, 79.73542022705078, 89.4403305053711, 99.1452407836914, 108.85015869140625, 118.55506896972656, 128.25997924804688, 137.9648895263672, 147.6697998046875, 157.3747100830078, 167.07962036132812, 176.78453063964844, 186.48944091796875, 196.19435119628906, 205.89926147460938, 215.60418701171875, 225.30908203125, 235.01400756835938, 244.7189178466797, 254.423828125, 264.1287536621094, 273.8336486816406, 283.53857421875, 293.24346923828125, 302.9483947753906, 312.6532897949219, 322.35821533203125, 332.0631103515625, 341.7680358886719, 351.4729309082031, 361.1778564453125, 370.88275146484375, 380.5876770019531, 390.2926025390625, 399.9975280761719, 409.7024230957031, 419.4073486328125, 429.11224365234375, 438.8171691894531, 448.5220642089844, 458.22698974609375, 467.931884765625, 477.6368103027344, 487.3417053222656, 497.046630859375, 506.75152587890625, 516.4564208984375, 526.161376953125, 535.8662719726562, 545.5711669921875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 10.0, 10.0, 16.0, 20.0, 26.0, 19.0, 23.0, 26.0, 17.0, 36.0, 44.0, 37.0, 39.0, 32.0, 30.0, 36.0, 44.0, 40.0, 39.0, 40.0, 36.0, 36.0, 43.0, 38.0, 21.0, 25.0, 22.0, 34.0, 29.0, 16.0, 15.0, 13.0, 11.0, 11.0, 11.0, 9.0, 7.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-67.44723510742188, -65.40769958496094, -63.368160247802734, -61.32862091064453, -59.289085388183594, -57.24954605102539, -55.21000671386719, -53.17047119140625, -51.13093566894531, -49.09139633178711, -47.05186080932617, -45.01232147216797, -42.97278594970703, -40.93324661254883, -38.893707275390625, -36.85417175292969, -34.814632415771484, -32.77509307861328, -30.735557556152344, -28.69601821899414, -26.656482696533203, -24.616943359375, -22.57740592956543, -20.53786849975586, -18.49833106994629, -16.45879364013672, -14.419256210327148, -12.379717826843262, -10.340180397033691, -8.300642967224121, -6.261104583740234, -4.221567153930664, -2.1820297241210938, -0.14249205589294434, 1.897045612335205, 3.9365835189819336, 5.976120948791504, 8.015658378601074, 10.055196762084961, 12.094734191894531, 14.134271621704102, 16.173809051513672, 18.213346481323242, 20.252883911132812, 22.292423248291016, 24.331958770751953, 26.371498107910156, 28.411035537719727, 30.450572967529297, 32.4901123046875, 34.52964782714844, 36.56918716430664, 38.60872268676758, 40.64826202392578, 42.68779754638672, 44.72733688354492, 46.766876220703125, 48.80641555786133, 50.845951080322266, 52.88549041748047, 54.925025939941406, 56.96456527709961, 59.00410461425781, 61.04364013671875, 63.08317565917969]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 18.0, 16.0, 17.0, 18.0, 27.0, 31.0, 37.0, 39.0, 40.0, 41.0, 50.0, 48.0, 46.0, 60.0, 60.0, 53.0, 46.0, 38.0, 53.0, 32.0, 31.0, 36.0, 24.0, 24.0, 22.0, 15.0, 13.0, 10.0, 16.0, 9.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6015625, -7.3544921875, -7.107421875, -6.8603515625, -6.61328125, -6.3662109375, -6.119140625, -5.8720703125, -5.625, -5.3779296875, -5.130859375, -4.8837890625, -4.63671875, -4.3896484375, -4.142578125, -3.8955078125, -3.6484375, -3.4013671875, -3.154296875, -2.9072265625, -2.66015625, -2.4130859375, -2.166015625, -1.9189453125, -1.671875, -1.4248046875, -1.177734375, -0.9306640625, -0.68359375, -0.4365234375, -0.189453125, 0.0576171875, 0.3046875, 0.5517578125, 0.798828125, 1.0458984375, 1.29296875, 1.5400390625, 1.787109375, 2.0341796875, 2.28125, 2.5283203125, 2.775390625, 3.0224609375, 3.26953125, 3.5166015625, 3.763671875, 4.0107421875, 4.2578125, 4.5048828125, 4.751953125, 4.9990234375, 5.24609375, 5.4931640625, 5.740234375, 5.9873046875, 6.234375, 6.4814453125, 6.728515625, 6.9755859375, 7.22265625, 7.4697265625, 7.716796875, 7.9638671875, 8.2109375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 11.0, 17.0, 25.0, 20.0, 38.0, 59.0, 66.0, 140.0, 159.0, 281.0, 453.0, 864.0, 1805.0, 4162.0, 11735.0, 40589.0, 207808.0, 1081902.0, 1950527.0, 725578.0, 124954.0, 27900.0, 8606.0, 3237.0, 1463.0, 708.0, 419.0, 245.0, 163.0, 97.0, 66.0, 55.0, 33.0, 25.0, 29.0, 13.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-11.5, -11.1837158203125, -10.867431640625, -10.5511474609375, -10.23486328125, -9.9185791015625, -9.602294921875, -9.2860107421875, -8.9697265625, -8.6534423828125, -8.337158203125, -8.0208740234375, -7.70458984375, -7.3883056640625, -7.072021484375, -6.7557373046875, -6.439453125, -6.1231689453125, -5.806884765625, -5.4906005859375, -5.17431640625, -4.8580322265625, -4.541748046875, -4.2254638671875, -3.9091796875, -3.5928955078125, -3.276611328125, -2.9603271484375, -2.64404296875, -2.3277587890625, -2.011474609375, -1.6951904296875, -1.37890625, -1.0626220703125, -0.746337890625, -0.4300537109375, -0.11376953125, 0.2025146484375, 0.518798828125, 0.8350830078125, 1.1513671875, 1.4676513671875, 1.783935546875, 2.1002197265625, 2.41650390625, 2.7327880859375, 3.049072265625, 3.3653564453125, 3.681640625, 3.9979248046875, 4.314208984375, 4.6304931640625, 4.94677734375, 5.2630615234375, 5.579345703125, 5.8956298828125, 6.2119140625, 6.5281982421875, 6.844482421875, 7.1607666015625, 7.47705078125, 7.7933349609375, 8.109619140625, 8.4259033203125, 8.7421875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 12.0, 14.0, 16.0, 19.0, 18.0, 27.0, 49.0, 64.0, 84.0, 108.0, 124.0, 176.0, 220.0, 290.0, 336.0, 374.0, 362.0, 363.0, 275.0, 258.0, 197.0, 145.0, 103.0, 93.0, 84.0, 50.0, 41.0, 39.0, 23.0, 17.0, 13.0, 12.0, 21.0, 13.0, 4.0, 10.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.6134033203125, -8.242431640625, -7.8714599609375, -7.50048828125, -7.1295166015625, -6.758544921875, -6.3875732421875, -6.0166015625, -5.6456298828125, -5.274658203125, -4.9036865234375, -4.53271484375, -4.1617431640625, -3.790771484375, -3.4197998046875, -3.048828125, -2.6778564453125, -2.306884765625, -1.9359130859375, -1.56494140625, -1.1939697265625, -0.822998046875, -0.4520263671875, -0.0810546875, 0.2899169921875, 0.660888671875, 1.0318603515625, 1.40283203125, 1.7738037109375, 2.144775390625, 2.5157470703125, 2.88671875, 3.2576904296875, 3.628662109375, 3.9996337890625, 4.37060546875, 4.7415771484375, 5.112548828125, 5.4835205078125, 5.8544921875, 6.2254638671875, 6.596435546875, 6.9674072265625, 7.33837890625, 7.7093505859375, 8.080322265625, 8.4512939453125, 8.822265625, 9.1932373046875, 9.564208984375, 9.9351806640625, 10.30615234375, 10.6771240234375, 11.048095703125, 11.4190673828125, 11.7900390625, 12.1610107421875, 12.531982421875, 12.9029541015625, 13.27392578125, 13.6448974609375, 14.015869140625, 14.3868408203125, 14.7578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 12.0, 6.0, 5.0, 14.0, 14.0, 28.0, 27.0, 25.0, 33.0, 45.0, 69.0, 83.0, 105.0, 142.0, 188.0, 292.0, 498.0, 1342.0, 10460.0, 332588.0, 3699503.0, 140435.0, 5998.0, 984.0, 454.0, 248.0, 169.0, 113.0, 85.0, 67.0, 54.0, 45.0, 27.0, 22.0, 28.0, 17.0, 15.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.96875, -36.75927734375, -35.5498046875, -34.34033203125, -33.130859375, -31.92138671875, -30.7119140625, -29.50244140625, -28.29296875, -27.08349609375, -25.8740234375, -24.66455078125, -23.455078125, -22.24560546875, -21.0361328125, -19.82666015625, -18.6171875, -17.40771484375, -16.1982421875, -14.98876953125, -13.779296875, -12.56982421875, -11.3603515625, -10.15087890625, -8.94140625, -7.73193359375, -6.5224609375, -5.31298828125, -4.103515625, -2.89404296875, -1.6845703125, -0.47509765625, 0.734375, 1.94384765625, 3.1533203125, 4.36279296875, 5.572265625, 6.78173828125, 7.9912109375, 9.20068359375, 10.41015625, 11.61962890625, 12.8291015625, 14.03857421875, 15.248046875, 16.45751953125, 17.6669921875, 18.87646484375, 20.0859375, 21.29541015625, 22.5048828125, 23.71435546875, 24.923828125, 26.13330078125, 27.3427734375, 28.55224609375, 29.76171875, 30.97119140625, 32.1806640625, 33.39013671875, 34.599609375, 35.80908203125, 37.0185546875, 38.22802734375, 39.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 17.0, 24.0, 49.0, 58.0, 108.0, 117.0, 112.0, 149.0, 133.0, 102.0, 57.0, 37.0, 22.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56111145019531, -62.14396286010742, -59.726810455322266, -57.309661865234375, -54.89250946044922, -52.47536087036133, -50.05821228027344, -47.64105987548828, -45.223907470703125, -42.806758880615234, -40.38960647583008, -37.97245788574219, -35.55530548095703, -33.13815689086914, -30.721006393432617, -28.303855895996094, -25.886707305908203, -23.46955680847168, -21.052406311035156, -18.635257720947266, -16.21810531616211, -13.800955772399902, -11.383806228637695, -8.966655731201172, -6.549505233764648, -4.132354736328125, -1.7152047157287598, 0.7019453048706055, 3.119095802307129, 5.536246299743652, 7.953395843505859, 10.370546340942383, 12.787696838378906, 15.20484733581543, 17.621997833251953, 20.039146423339844, 22.456298828125, 24.87344741821289, 27.290597915649414, 29.707748413085938, 32.124900817871094, 34.542049407958984, 36.95920181274414, 39.37635040283203, 41.79350280761719, 44.21065139770508, 46.62779998779297, 49.044952392578125, 51.462100982666016, 53.879249572753906, 56.29640197753906, 58.71355056762695, 61.13070297241211, 63.5478515625, 65.96500396728516, 68.38215637207031, 70.79930114746094, 73.2164535522461, 75.63359832763672, 78.05075073242188, 80.46790313720703, 82.88505554199219, 85.30220031738281, 87.71935272216797, 90.13650512695312]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 7.0, 13.0, 7.0, 19.0, 19.0, 10.0, 21.0, 28.0, 41.0, 30.0, 36.0, 30.0, 52.0, 59.0, 45.0, 59.0, 50.0, 43.0, 46.0, 47.0, 41.0, 44.0, 37.0, 32.0, 30.0, 24.0, 23.0, 17.0, 23.0, 14.0, 16.0, 8.0, 6.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.367523193359375, -60.69341278076172, -59.01930618286133, -57.34519958496094, -55.67108917236328, -53.996978759765625, -52.322872161865234, -50.648765563964844, -48.97465515136719, -47.30054473876953, -45.62643814086914, -43.95233154296875, -42.278221130371094, -40.60411071777344, -38.93000411987305, -37.255897521972656, -35.581787109375, -33.907676696777344, -32.23357009887695, -30.55946159362793, -28.885353088378906, -27.211244583129883, -25.53713607788086, -23.863027572631836, -22.188919067382812, -20.51481056213379, -18.840702056884766, -17.166593551635742, -15.492485046386719, -13.818376541137695, -12.144268035888672, -10.470159530639648, -8.796051025390625, -7.121942520141602, -5.447834014892578, -3.7737255096435547, -2.0996170043945312, -0.4255084991455078, 1.2486000061035156, 2.922708511352539, 4.5968170166015625, 6.270925521850586, 7.945034027099609, 9.619142532348633, 11.293251037597656, 12.96735954284668, 14.641468048095703, 16.315576553344727, 17.98968505859375, 19.663793563842773, 21.337902069091797, 23.01201057434082, 24.686119079589844, 26.360227584838867, 28.03433609008789, 29.708444595336914, 31.382553100585938, 33.056663513183594, 34.730770111083984, 36.404876708984375, 38.07898712158203, 39.75309753417969, 41.42720413208008, 43.10131072998047, 44.775421142578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 4.0, 14.0, 14.0, 15.0, 16.0, 29.0, 26.0, 33.0, 32.0, 37.0, 47.0, 39.0, 42.0, 58.0, 49.0, 41.0, 47.0, 51.0, 51.0, 45.0, 43.0, 48.0, 32.0, 33.0, 21.0, 18.0, 17.0, 18.0, 21.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.56231689453125, -7.3238525390625, -7.08538818359375, -6.846923828125, -6.60845947265625, -6.3699951171875, -6.13153076171875, -5.89306640625, -5.65460205078125, -5.4161376953125, -5.17767333984375, -4.939208984375, -4.70074462890625, -4.4622802734375, -4.22381591796875, -3.9853515625, -3.74688720703125, -3.5084228515625, -3.26995849609375, -3.031494140625, -2.79302978515625, -2.5545654296875, -2.31610107421875, -2.07763671875, -1.83917236328125, -1.6007080078125, -1.36224365234375, -1.123779296875, -0.88531494140625, -0.6468505859375, -0.40838623046875, -0.169921875, 0.06854248046875, 0.3070068359375, 0.54547119140625, 0.783935546875, 1.02239990234375, 1.2608642578125, 1.49932861328125, 1.73779296875, 1.97625732421875, 2.2147216796875, 2.45318603515625, 2.691650390625, 2.93011474609375, 3.1685791015625, 3.40704345703125, 3.6455078125, 3.88397216796875, 4.1224365234375, 4.36090087890625, 4.599365234375, 4.83782958984375, 5.0762939453125, 5.31475830078125, 5.55322265625, 5.79168701171875, 6.0301513671875, 6.26861572265625, 6.507080078125, 6.74554443359375, 6.9840087890625, 7.22247314453125, 7.4609375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 6.0, 5.0, 10.0, 17.0, 27.0, 55.0, 62.0, 90.0, 124.0, 177.0, 298.0, 434.0, 630.0, 893.0, 1334.0, 1969.0, 3034.0, 4536.0, 6834.0, 10409.0, 15655.0, 24235.0, 37756.0, 62096.0, 108489.0, 199731.0, 233191.0, 134985.0, 74504.0, 44765.0, 27971.0, 17923.0, 12201.0, 7996.0, 5275.0, 3560.0, 2337.0, 1580.0, 1096.0, 748.0, 470.0, 332.0, 236.0, 150.0, 99.0, 74.0, 48.0, 44.0, 24.0, 11.0, 10.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.9287109375, -0.8998489379882812, -0.8709869384765625, -0.8421249389648438, -0.813262939453125, -0.7844009399414062, -0.7555389404296875, -0.7266769409179688, -0.69781494140625, -0.6689529418945312, -0.6400909423828125, -0.6112289428710938, -0.582366943359375, -0.5535049438476562, -0.5246429443359375, -0.49578094482421875, -0.4669189453125, -0.43805694580078125, -0.4091949462890625, -0.38033294677734375, -0.351470947265625, -0.32260894775390625, -0.2937469482421875, -0.26488494873046875, -0.23602294921875, -0.20716094970703125, -0.1782989501953125, -0.14943695068359375, -0.120574951171875, -0.09171295166015625, -0.0628509521484375, -0.03398895263671875, -0.005126953125, 0.02373504638671875, 0.0525970458984375, 0.08145904541015625, 0.110321044921875, 0.13918304443359375, 0.1680450439453125, 0.19690704345703125, 0.22576904296875, 0.25463104248046875, 0.2834930419921875, 0.31235504150390625, 0.341217041015625, 0.37007904052734375, 0.3989410400390625, 0.42780303955078125, 0.4566650390625, 0.48552703857421875, 0.5143890380859375, 0.5432510375976562, 0.572113037109375, 0.6009750366210938, 0.6298370361328125, 0.6586990356445312, 0.68756103515625, 0.7164230346679688, 0.7452850341796875, 0.7741470336914062, 0.803009033203125, 0.8318710327148438, 0.8607330322265625, 0.8895950317382812, 0.91845703125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 11.0, 7.0, 12.0, 16.0, 11.0, 19.0, 16.0, 21.0, 25.0, 25.0, 16.0, 39.0, 27.0, 29.0, 29.0, 39.0, 49.0, 35.0, 43.0, 1066.0, 45.0, 51.0, 49.0, 29.0, 33.0, 31.0, 38.0, 27.0, 29.0, 22.0, 22.0, 16.0, 19.0, 13.0, 8.0, 6.0, 15.0, 8.0, 4.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.828125, -3.70123291015625, -3.5743408203125, -3.44744873046875, -3.320556640625, -3.19366455078125, -3.0667724609375, -2.93988037109375, -2.81298828125, -2.68609619140625, -2.5592041015625, -2.43231201171875, -2.305419921875, -2.17852783203125, -2.0516357421875, -1.92474365234375, -1.7978515625, -1.67095947265625, -1.5440673828125, -1.41717529296875, -1.290283203125, -1.16339111328125, -1.0364990234375, -0.90960693359375, -0.78271484375, -0.65582275390625, -0.5289306640625, -0.40203857421875, -0.275146484375, -0.14825439453125, -0.0213623046875, 0.10552978515625, 0.232421875, 0.35931396484375, 0.4862060546875, 0.61309814453125, 0.739990234375, 0.86688232421875, 0.9937744140625, 1.12066650390625, 1.24755859375, 1.37445068359375, 1.5013427734375, 1.62823486328125, 1.755126953125, 1.88201904296875, 2.0089111328125, 2.13580322265625, 2.2626953125, 2.38958740234375, 2.5164794921875, 2.64337158203125, 2.770263671875, 2.89715576171875, 3.0240478515625, 3.15093994140625, 3.27783203125, 3.40472412109375, 3.5316162109375, 3.65850830078125, 3.785400390625, 3.91229248046875, 4.0391845703125, 4.16607666015625, 4.29296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 16.0, 23.0, 33.0, 40.0, 74.0, 89.0, 130.0, 189.0, 280.0, 399.0, 563.0, 846.0, 1205.0, 1705.0, 2571.0, 3736.0, 5726.0, 8623.0, 13416.0, 21115.0, 33769.0, 55751.0, 97472.0, 182993.0, 1298360.0, 152959.0, 83045.0, 48220.0, 29488.0, 18680.0, 11960.0, 7736.0, 5126.0, 3408.0, 2262.0, 1532.0, 1127.0, 795.0, 510.0, 372.0, 238.0, 178.0, 122.0, 81.0, 47.0, 37.0, 25.0, 22.0, 10.0, 9.0, 2.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.806640625, -0.7824630737304688, -0.7582855224609375, -0.7341079711914062, -0.709930419921875, -0.6857528686523438, -0.6615753173828125, -0.6373977661132812, -0.61322021484375, -0.5890426635742188, -0.5648651123046875, -0.5406875610351562, -0.516510009765625, -0.49233245849609375, -0.4681549072265625, -0.44397735595703125, -0.4197998046875, -0.39562225341796875, -0.3714447021484375, -0.34726715087890625, -0.323089599609375, -0.29891204833984375, -0.2747344970703125, -0.25055694580078125, -0.22637939453125, -0.20220184326171875, -0.1780242919921875, -0.15384674072265625, -0.129669189453125, -0.10549163818359375, -0.0813140869140625, -0.05713653564453125, -0.032958984375, -0.00878143310546875, 0.0153961181640625, 0.03957366943359375, 0.063751220703125, 0.08792877197265625, 0.1121063232421875, 0.13628387451171875, 0.16046142578125, 0.18463897705078125, 0.2088165283203125, 0.23299407958984375, 0.257171630859375, 0.28134918212890625, 0.3055267333984375, 0.32970428466796875, 0.3538818359375, 0.37805938720703125, 0.4022369384765625, 0.42641448974609375, 0.450592041015625, 0.47476959228515625, 0.4989471435546875, 0.5231246948242188, 0.54730224609375, 0.5714797973632812, 0.5956573486328125, 0.6198348999023438, 0.644012451171875, 0.6681900024414062, 0.6923675537109375, 0.7165451049804688, 0.74072265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 2.0, 6.0, 8.0, 13.0, 6.0, 14.0, 14.0, 10.0, 16.0, 19.0, 36.0, 22.0, 41.0, 49.0, 42.0, 48.0, 63.0, 55.0, 57.0, 62.0, 47.0, 45.0, 45.0, 45.0, 30.0, 41.0, 31.0, 14.0, 21.0, 13.0, 10.0, 13.0, 5.0, 8.0, 8.0, 5.0, 9.0, 5.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0018130689859390259, -0.001754075288772583, -0.0016950815916061401, -0.0016360878944396973, -0.0015770941972732544, -0.0015181005001068115, -0.0014591068029403687, -0.0014001131057739258, -0.001341119408607483, -0.00128212571144104, -0.0012231320142745972, -0.0011641383171081543, -0.0011051446199417114, -0.0010461509227752686, -0.0009871572256088257, -0.0009281635284423828, -0.0008691698312759399, -0.0008101761341094971, -0.0007511824369430542, -0.0006921887397766113, -0.0006331950426101685, -0.0005742013454437256, -0.0005152076482772827, -0.00045621395111083984, -0.00039722025394439697, -0.0003382265567779541, -0.00027923285961151123, -0.00022023916244506836, -0.0001612454652786255, -0.00010225176811218262, -4.3258070945739746e-05, 1.5735626220703125e-05, 7.4729323387146e-05, 0.00013372302055358887, 0.00019271671772003174, 0.0002517104148864746, 0.0003107041120529175, 0.00036969780921936035, 0.0004286915063858032, 0.0004876852035522461, 0.000546678900718689, 0.0006056725978851318, 0.0006646662950515747, 0.0007236599922180176, 0.0007826536893844604, 0.0008416473865509033, 0.0009006410837173462, 0.0009596347808837891, 0.001018628478050232, 0.0010776221752166748, 0.0011366158723831177, 0.0011956095695495605, 0.0012546032667160034, 0.0013135969638824463, 0.0013725906610488892, 0.001431584358215332, 0.001490578055381775, 0.0015495717525482178, 0.0016085654497146606, 0.0016675591468811035, 0.0017265528440475464, 0.0017855465412139893, 0.0018445402383804321, 0.001903533935546875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 7.0, 10.0, 10.0, 9.0, 22.0, 19.0, 28.0, 34.0, 49.0, 73.0, 99.0, 137.0, 263.0, 664.0, 3650.0, 988800.0, 52579.0, 989.0, 416.0, 209.0, 125.0, 78.0, 58.0, 37.0, 28.0, 22.0, 19.0, 18.0, 14.0, 14.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.044406890869140625, -0.04300689697265625, -0.041606903076171875, -0.0402069091796875, -0.038806915283203125, -0.03740692138671875, -0.036006927490234375, -0.03460693359375, -0.033206939697265625, -0.03180694580078125, -0.030406951904296875, -0.0290069580078125, -0.027606964111328125, -0.02620697021484375, -0.024806976318359375, -0.023406982421875, -0.022006988525390625, -0.02060699462890625, -0.019207000732421875, -0.0178070068359375, -0.016407012939453125, -0.01500701904296875, -0.013607025146484375, -0.01220703125, -0.010807037353515625, -0.00940704345703125, -0.008007049560546875, -0.0066070556640625, -0.005207061767578125, -0.00380706787109375, -0.002407073974609375, -0.001007080078125, 0.000392913818359375, 0.00179290771484375, 0.003192901611328125, 0.0045928955078125, 0.005992889404296875, 0.00739288330078125, 0.008792877197265625, 0.01019287109375, 0.011592864990234375, 0.01299285888671875, 0.014392852783203125, 0.0157928466796875, 0.017192840576171875, 0.01859283447265625, 0.019992828369140625, 0.021392822265625, 0.022792816162109375, 0.02419281005859375, 0.025592803955078125, 0.0269927978515625, 0.028392791748046875, 0.02979278564453125, 0.031192779541015625, 0.0325927734375, 0.033992767333984375, 0.03539276123046875, 0.036792755126953125, 0.0381927490234375, 0.039592742919921875, 0.04099273681640625, 0.042392730712890625, 0.043792724609375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 42.0, 148.0, 349.0, 305.0, 128.0, 27.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0068414597772061825, -0.006709668319672346, -0.00657787686213851, -0.006446085404604673, -0.006314293947070837, -0.006182502489537001, -0.006050711032003164, -0.005918919108808041, -0.005787127651274204, -0.005655336193740368, -0.0055235447362065315, -0.005391753278672695, -0.005259961821138859, -0.005128170363605022, -0.004996378906071186, -0.00486458744853735, -0.004732795991003513, -0.004601004533469677, -0.004469213075935841, -0.004337421618402004, -0.004205630160868168, -0.0040738387033343315, -0.003942047245800495, -0.003810255555436015, -0.0036784640979021788, -0.0035466726403683424, -0.003414881182834506, -0.0032830897253006697, -0.0031512980349361897, -0.0030195065774023533, -0.002887715119868517, -0.0027559236623346806, -0.0026241319719702005, -0.002492340514436364, -0.002360549056902528, -0.0022287575993686914, -0.0020969659090042114, -0.001965174451470375, -0.0018333829939365387, -0.0017015915364027023, -0.001569800078868866, -0.0014380086213350296, -0.0013062171638011932, -0.001174425589852035, -0.0010426341323181987, -0.0009108426747843623, -0.000779051159042865, -0.0006472596433013678, -0.0005154681857675314, -0.0003836766991298646, -0.00025188521249219775, -0.00012009372585453093, 1.1697760783135891e-05, 0.00014348921831697226, 0.00027528073405846953, 0.0004070722497999668, 0.0005388637073338032, 0.0006706551648676395, 0.0008024466806091368, 0.0009342381963506341, 0.0010660296538844705, 0.0011978211114183068, 0.001329612685367465, 0.0014614041429013014, 0.0015931956004351377]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 21.0, 12.0, 19.0, 16.0, 28.0, 27.0, 30.0, 40.0, 40.0, 40.0, 41.0, 37.0, 53.0, 37.0, 50.0, 36.0, 35.0, 36.0, 43.0, 37.0, 34.0, 29.0, 29.0, 30.0, 26.0, 23.0, 19.0, 12.0, 12.0, 16.0, 12.0, 12.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011265277862548828, -0.0010912679135799408, -0.0010560080409049988, -0.0010207481682300568, -0.0009854882955551147, -0.0009502284228801727, -0.0009149685502052307, -0.0008797086775302887, -0.0008444488048553467, -0.0008091889321804047, -0.0007739290595054626, -0.0007386691868305206, -0.0007034093141555786, -0.0006681494414806366, -0.0006328895688056946, -0.0005976296961307526, -0.0005623698234558105, -0.0005271099507808685, -0.0004918500781059265, -0.0004565902054309845, -0.0004213303327560425, -0.00038607046008110046, -0.00035081058740615845, -0.00031555071473121643, -0.0002802908420562744, -0.0002450309693813324, -0.00020977109670639038, -0.00017451122403144836, -0.00013925135135650635, -0.00010399147868156433, -6.873160600662231e-05, -3.34717333316803e-05, 1.7881393432617188e-06, 3.7048012018203735e-05, 7.230788469314575e-05, 0.00010756775736808777, 0.00014282763004302979, 0.0001780875027179718, 0.00021334737539291382, 0.00024860724806785583, 0.00028386712074279785, 0.00031912699341773987, 0.0003543868660926819, 0.0003896467387676239, 0.0004249066114425659, 0.00046016648411750793, 0.00049542635679245, 0.000530686229467392, 0.000565946102142334, 0.000601205974817276, 0.000636465847492218, 0.00067172572016716, 0.000706985592842102, 0.0007422454655170441, 0.0007775053381919861, 0.0008127652108669281, 0.0008480250835418701, 0.0008832849562168121, 0.0009185448288917542, 0.0009538047015666962, 0.0009890645742416382, 0.0010243244469165802, 0.0010595843195915222, 0.0010948441922664642, 0.0011301040649414062]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 4.0, 14.0, 14.0, 15.0, 16.0, 29.0, 26.0, 33.0, 32.0, 37.0, 47.0, 40.0, 41.0, 58.0, 49.0, 41.0, 47.0, 51.0, 51.0, 45.0, 43.0, 48.0, 32.0, 33.0, 21.0, 18.0, 17.0, 18.0, 21.0, 16.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.56231689453125, -7.3238525390625, -7.08538818359375, -6.846923828125, -6.60845947265625, -6.3699951171875, -6.13153076171875, -5.89306640625, -5.65460205078125, -5.4161376953125, -5.17767333984375, -4.939208984375, -4.70074462890625, -4.4622802734375, -4.22381591796875, -3.9853515625, -3.74688720703125, -3.5084228515625, -3.26995849609375, -3.031494140625, -2.79302978515625, -2.5545654296875, -2.31610107421875, -2.07763671875, -1.83917236328125, -1.6007080078125, -1.36224365234375, -1.123779296875, -0.88531494140625, -0.6468505859375, -0.40838623046875, -0.169921875, 0.06854248046875, 0.3070068359375, 0.54547119140625, 0.783935546875, 1.02239990234375, 1.2608642578125, 1.49932861328125, 1.73779296875, 1.97625732421875, 2.2147216796875, 2.45318603515625, 2.691650390625, 2.93011474609375, 3.1685791015625, 3.40704345703125, 3.6455078125, 3.88397216796875, 4.1224365234375, 4.36090087890625, 4.599365234375, 4.83782958984375, 5.0762939453125, 5.31475830078125, 5.55322265625, 5.79168701171875, 6.0301513671875, 6.26861572265625, 6.507080078125, 6.74554443359375, 6.9840087890625, 7.22247314453125, 7.4609375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 8.0, 3.0, 15.0, 25.0, 31.0, 34.0, 72.0, 83.0, 108.0, 165.0, 281.0, 524.0, 865.0, 1713.0, 3558.0, 8291.0, 20671.0, 55035.0, 156677.0, 396829.0, 258621.0, 89125.0, 32602.0, 12663.0, 5306.0, 2377.0, 1202.0, 605.0, 330.0, 235.0, 164.0, 105.0, 61.0, 53.0, 39.0, 21.0, 17.0, 12.0, 10.0, 11.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.5284423828125, -4.381103515625, -4.2337646484375, -4.08642578125, -3.9390869140625, -3.791748046875, -3.6444091796875, -3.4970703125, -3.3497314453125, -3.202392578125, -3.0550537109375, -2.90771484375, -2.7603759765625, -2.613037109375, -2.4656982421875, -2.318359375, -2.1710205078125, -2.023681640625, -1.8763427734375, -1.72900390625, -1.5816650390625, -1.434326171875, -1.2869873046875, -1.1396484375, -0.9923095703125, -0.844970703125, -0.6976318359375, -0.55029296875, -0.4029541015625, -0.255615234375, -0.1082763671875, 0.0390625, 0.1864013671875, 0.333740234375, 0.4810791015625, 0.62841796875, 0.7757568359375, 0.923095703125, 1.0704345703125, 1.2177734375, 1.3651123046875, 1.512451171875, 1.6597900390625, 1.80712890625, 1.9544677734375, 2.101806640625, 2.2491455078125, 2.396484375, 2.5438232421875, 2.691162109375, 2.8385009765625, 2.98583984375, 3.1331787109375, 3.280517578125, 3.4278564453125, 3.5751953125, 3.7225341796875, 3.869873046875, 4.0172119140625, 4.16455078125, 4.3118896484375, 4.459228515625, 4.6065673828125, 4.75390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 7.0, 6.0, 2.0, 9.0, 3.0, 15.0, 14.0, 25.0, 19.0, 35.0, 26.0, 42.0, 51.0, 50.0, 61.0, 87.0, 349.0, 1702.0, 136.0, 71.0, 46.0, 47.0, 41.0, 37.0, 29.0, 31.0, 18.0, 23.0, 12.0, 11.0, 14.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.84375, -31.853759765625, -30.86376953125, -29.873779296875, -28.8837890625, -27.893798828125, -26.90380859375, -25.913818359375, -24.923828125, -23.933837890625, -22.94384765625, -21.953857421875, -20.9638671875, -19.973876953125, -18.98388671875, -17.993896484375, -17.00390625, -16.013916015625, -15.02392578125, -14.033935546875, -13.0439453125, -12.053955078125, -11.06396484375, -10.073974609375, -9.083984375, -8.093994140625, -7.10400390625, -6.114013671875, -5.1240234375, -4.134033203125, -3.14404296875, -2.154052734375, -1.1640625, -0.174072265625, 0.81591796875, 1.805908203125, 2.7958984375, 3.785888671875, 4.77587890625, 5.765869140625, 6.755859375, 7.745849609375, 8.73583984375, 9.725830078125, 10.7158203125, 11.705810546875, 12.69580078125, 13.685791015625, 14.67578125, 15.665771484375, 16.65576171875, 17.645751953125, 18.6357421875, 19.625732421875, 20.61572265625, 21.605712890625, 22.595703125, 23.585693359375, 24.57568359375, 25.565673828125, 26.5556640625, 27.545654296875, 28.53564453125, 29.525634765625, 30.515625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 14.0, 18.0, 16.0, 19.0, 30.0, 33.0, 62.0, 84.0, 101.0, 158.0, 199.0, 324.0, 728.0, 6989.0, 3126438.0, 8651.0, 764.0, 336.0, 198.0, 145.0, 105.0, 63.0, 57.0, 33.0, 37.0, 21.0, 15.0, 5.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-67.0, -64.8046875, -62.609375, -60.4140625, -58.21875, -56.0234375, -53.828125, -51.6328125, -49.4375, -47.2421875, -45.046875, -42.8515625, -40.65625, -38.4609375, -36.265625, -34.0703125, -31.875, -29.6796875, -27.484375, -25.2890625, -23.09375, -20.8984375, -18.703125, -16.5078125, -14.3125, -12.1171875, -9.921875, -7.7265625, -5.53125, -3.3359375, -1.140625, 1.0546875, 3.25, 5.4453125, 7.640625, 9.8359375, 12.03125, 14.2265625, 16.421875, 18.6171875, 20.8125, 23.0078125, 25.203125, 27.3984375, 29.59375, 31.7890625, 33.984375, 36.1796875, 38.375, 40.5703125, 42.765625, 44.9609375, 47.15625, 49.3515625, 51.546875, 53.7421875, 55.9375, 58.1328125, 60.328125, 62.5234375, 64.71875, 66.9140625, 69.109375, 71.3046875, 73.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 446.0, 563.0], "bins": [-427.08331298828125, -420.3058776855469, -413.5284118652344, -406.7509765625, -399.9735107421875, -393.1960754394531, -386.41864013671875, -379.64117431640625, -372.8637390136719, -366.0863037109375, -359.308837890625, -352.5314025878906, -345.7539367675781, -338.97650146484375, -332.19903564453125, -325.4216003417969, -318.6441345214844, -311.86669921875, -305.0892333984375, -298.3117980957031, -291.5343322753906, -284.75689697265625, -277.97943115234375, -271.2019958496094, -264.424560546875, -257.6471252441406, -250.86965942382812, -244.09222412109375, -237.3147735595703, -230.53732299804688, -223.75987243652344, -216.982421875, -210.20497131347656, -203.42752075195312, -196.6500701904297, -189.87261962890625, -183.09518432617188, -176.31773376464844, -169.540283203125, -162.76283264160156, -155.98538208007812, -149.2079315185547, -142.43048095703125, -135.65304565429688, -128.87559509277344, -122.09814453125, -115.32069396972656, -108.54324340820312, -101.76580047607422, -94.98834991455078, -88.21090698242188, -81.43345642089844, -74.656005859375, -67.87855529785156, -61.101112365722656, -54.32366180419922, -47.54621887207031, -40.76877212524414, -33.9913215637207, -27.21387481689453, -20.436426162719727, -13.658977508544922, -6.88153076171875, -0.1040802001953125, 6.673367500305176]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 2.0, 6.0, 14.0, 14.0, 17.0, 16.0, 17.0, 25.0, 16.0, 15.0, 23.0, 24.0, 17.0, 24.0, 29.0, 35.0, 29.0, 36.0, 40.0, 39.0, 32.0, 35.0, 40.0, 29.0, 31.0, 25.0, 30.0, 40.0, 26.0, 24.0, 23.0, 18.0, 26.0, 20.0, 21.0, 15.0, 11.0, 12.0, 15.0, 16.0, 15.0, 13.0, 6.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0], "bins": [-51.062828063964844, -49.474693298339844, -47.88655471801758, -46.29841995239258, -44.71028518676758, -43.12215042114258, -41.53401184082031, -39.94587707519531, -38.35774230957031, -36.76960754394531, -35.18146896362305, -33.59333419799805, -32.00519943237305, -30.417062759399414, -28.82892608642578, -27.24079132080078, -25.65265464782715, -24.064517974853516, -22.476383209228516, -20.888246536254883, -19.300111770629883, -17.71197509765625, -16.12384033203125, -14.535703659057617, -12.9475679397583, -11.359432220458984, -9.771296501159668, -8.183160781860352, -6.595024585723877, -5.0068888664245605, -3.418752670288086, -1.8306169509887695, -0.24248123168945312, 1.3456546068191528, 2.933790445327759, 4.521926403045654, 6.110062122344971, 7.698197841644287, 9.286334037780762, 10.874469757080078, 12.462605476379395, 14.050741195678711, 15.638876914978027, 17.227012634277344, 18.815149307250977, 20.403284072875977, 21.99142074584961, 23.57955551147461, 25.167692184448242, 26.755828857421875, 28.343963623046875, 29.932100296020508, 31.520235061645508, 33.10837173461914, 34.69650650024414, 36.284645080566406, 37.872779846191406, 39.460914611816406, 41.04905319213867, 42.63718795776367, 44.22532272338867, 45.81345748901367, 47.40159606933594, 48.98973083496094, 50.57786560058594]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 7.0, 13.0, 7.0, 17.0, 13.0, 18.0, 20.0, 27.0, 30.0, 39.0, 35.0, 34.0, 47.0, 46.0, 47.0, 55.0, 39.0, 49.0, 44.0, 45.0, 42.0, 47.0, 45.0, 40.0, 24.0, 30.0, 15.0, 19.0, 17.0, 16.0, 18.0, 15.0, 9.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.84033203125, -7.6025390625, -7.36474609375, -7.126953125, -6.88916015625, -6.6513671875, -6.41357421875, -6.17578125, -5.93798828125, -5.7001953125, -5.46240234375, -5.224609375, -4.98681640625, -4.7490234375, -4.51123046875, -4.2734375, -4.03564453125, -3.7978515625, -3.56005859375, -3.322265625, -3.08447265625, -2.8466796875, -2.60888671875, -2.37109375, -2.13330078125, -1.8955078125, -1.65771484375, -1.419921875, -1.18212890625, -0.9443359375, -0.70654296875, -0.46875, -0.23095703125, 0.0068359375, 0.24462890625, 0.482421875, 0.72021484375, 0.9580078125, 1.19580078125, 1.43359375, 1.67138671875, 1.9091796875, 2.14697265625, 2.384765625, 2.62255859375, 2.8603515625, 3.09814453125, 3.3359375, 3.57373046875, 3.8115234375, 4.04931640625, 4.287109375, 4.52490234375, 4.7626953125, 5.00048828125, 5.23828125, 5.47607421875, 5.7138671875, 5.95166015625, 6.189453125, 6.42724609375, 6.6650390625, 6.90283203125, 7.140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 9.0, 4.0, 8.0, 8.0, 9.0, 18.0, 10.0, 21.0, 15.0, 27.0, 31.0, 37.0, 49.0, 60.0, 130.0, 349.0, 1465.0, 11696.0, 654399.0, 3435826.0, 84788.0, 4066.0, 662.0, 233.0, 86.0, 55.0, 44.0, 26.0, 25.0, 24.0, 18.0, 14.0, 14.0, 16.0, 12.0, 10.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-31.828125, -30.89990234375, -29.9716796875, -29.04345703125, -28.115234375, -27.18701171875, -26.2587890625, -25.33056640625, -24.40234375, -23.47412109375, -22.5458984375, -21.61767578125, -20.689453125, -19.76123046875, -18.8330078125, -17.90478515625, -16.9765625, -16.04833984375, -15.1201171875, -14.19189453125, -13.263671875, -12.33544921875, -11.4072265625, -10.47900390625, -9.55078125, -8.62255859375, -7.6943359375, -6.76611328125, -5.837890625, -4.90966796875, -3.9814453125, -3.05322265625, -2.125, -1.19677734375, -0.2685546875, 0.65966796875, 1.587890625, 2.51611328125, 3.4443359375, 4.37255859375, 5.30078125, 6.22900390625, 7.1572265625, 8.08544921875, 9.013671875, 9.94189453125, 10.8701171875, 11.79833984375, 12.7265625, 13.65478515625, 14.5830078125, 15.51123046875, 16.439453125, 17.36767578125, 18.2958984375, 19.22412109375, 20.15234375, 21.08056640625, 22.0087890625, 22.93701171875, 23.865234375, 24.79345703125, 25.7216796875, 26.64990234375, 27.578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 11.0, 18.0, 23.0, 44.0, 58.0, 70.0, 99.0, 148.0, 183.0, 274.0, 359.0, 401.0, 480.0, 443.0, 376.0, 290.0, 221.0, 154.0, 122.0, 84.0, 54.0, 47.0, 20.0, 21.0, 11.0, 14.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.7734375, -15.31787109375, -14.8623046875, -14.40673828125, -13.951171875, -13.49560546875, -13.0400390625, -12.58447265625, -12.12890625, -11.67333984375, -11.2177734375, -10.76220703125, -10.306640625, -9.85107421875, -9.3955078125, -8.93994140625, -8.484375, -8.02880859375, -7.5732421875, -7.11767578125, -6.662109375, -6.20654296875, -5.7509765625, -5.29541015625, -4.83984375, -4.38427734375, -3.9287109375, -3.47314453125, -3.017578125, -2.56201171875, -2.1064453125, -1.65087890625, -1.1953125, -0.73974609375, -0.2841796875, 0.17138671875, 0.626953125, 1.08251953125, 1.5380859375, 1.99365234375, 2.44921875, 2.90478515625, 3.3603515625, 3.81591796875, 4.271484375, 4.72705078125, 5.1826171875, 5.63818359375, 6.09375, 6.54931640625, 7.0048828125, 7.46044921875, 7.916015625, 8.37158203125, 8.8271484375, 9.28271484375, 9.73828125, 10.19384765625, 10.6494140625, 11.10498046875, 11.560546875, 12.01611328125, 12.4716796875, 12.92724609375, 13.3828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 16.0, 16.0, 17.0, 25.0, 17.0, 43.0, 38.0, 49.0, 54.0, 82.0, 134.0, 159.0, 239.0, 440.0, 1083.0, 6615.0, 320600.0, 3791151.0, 68534.0, 3071.0, 731.0, 341.0, 201.0, 146.0, 106.0, 76.0, 63.0, 54.0, 29.0, 29.0, 20.0, 18.0, 14.0, 14.0, 9.0, 10.0, 5.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.05517578125, -38.6416015625, -37.22802734375, -35.814453125, -34.40087890625, -32.9873046875, -31.57373046875, -30.16015625, -28.74658203125, -27.3330078125, -25.91943359375, -24.505859375, -23.09228515625, -21.6787109375, -20.26513671875, -18.8515625, -17.43798828125, -16.0244140625, -14.61083984375, -13.197265625, -11.78369140625, -10.3701171875, -8.95654296875, -7.54296875, -6.12939453125, -4.7158203125, -3.30224609375, -1.888671875, -0.47509765625, 0.9384765625, 2.35205078125, 3.765625, 5.17919921875, 6.5927734375, 8.00634765625, 9.419921875, 10.83349609375, 12.2470703125, 13.66064453125, 15.07421875, 16.48779296875, 17.9013671875, 19.31494140625, 20.728515625, 22.14208984375, 23.5556640625, 24.96923828125, 26.3828125, 27.79638671875, 29.2099609375, 30.62353515625, 32.037109375, 33.45068359375, 34.8642578125, 36.27783203125, 37.69140625, 39.10498046875, 40.5185546875, 41.93212890625, 43.345703125, 44.75927734375, 46.1728515625, 47.58642578125, 49.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 242.0, 610.0, 132.0, 17.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.20087432861328, -89.50810241699219, -78.81533813476562, -68.12257385253906, -57.42980194091797, -46.73703384399414, -36.04426574707031, -25.35149383544922, -14.658729553222656, -3.965961456298828, 6.726806640625, 17.419574737548828, 28.112342834472656, 38.805110931396484, 49.49787902832031, 60.190650939941406, 70.88341522216797, 81.57618713378906, 92.26895141601562, 102.96171569824219, 113.65448760986328, 124.34725952148438, 135.04002380371094, 145.7327880859375, 156.42556762695312, 167.1183319091797, 177.81109619140625, 188.50387573242188, 199.19664001464844, 209.889404296875, 220.58218383789062, 231.2749481201172, 241.96771240234375, 252.6604766845703, 263.3532409667969, 274.0460205078125, 284.73876953125, 295.4315490722656, 306.12432861328125, 316.81707763671875, 327.5098571777344, 338.20263671875, 348.8953857421875, 359.5881652832031, 370.28094482421875, 380.97369384765625, 391.6664733886719, 402.3592529296875, 413.052001953125, 423.7447814941406, 434.4375305175781, 445.13031005859375, 455.82305908203125, 466.5158386230469, 477.2086181640625, 487.9013671875, 498.5941467285156, 509.28692626953125, 519.9796752929688, 530.6724243164062, 541.365234375, 552.0579833984375, 562.750732421875, 573.4435424804688, 584.1362915039062]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 13.0, 17.0, 16.0, 12.0, 22.0, 24.0, 33.0, 30.0, 27.0, 25.0, 30.0, 32.0, 26.0, 35.0, 36.0, 49.0, 46.0, 45.0, 39.0, 42.0, 34.0, 27.0, 34.0, 31.0, 25.0, 31.0, 26.0, 24.0, 16.0, 19.0, 8.0, 18.0, 20.0, 13.0, 12.0, 9.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-46.99755859375, -45.72099304199219, -44.44442367553711, -43.1678581237793, -41.89128875732422, -40.614723205566406, -39.33815383911133, -38.061588287353516, -36.78501892089844, -35.508453369140625, -34.23188400268555, -32.955318450927734, -31.678749084472656, -30.402183532714844, -29.1256160736084, -27.849048614501953, -26.57248306274414, -25.295915603637695, -24.01934814453125, -22.742780685424805, -21.46621322631836, -20.189647674560547, -18.9130802154541, -17.636512756347656, -16.35994529724121, -15.083377838134766, -13.80681037902832, -12.530243873596191, -11.253676414489746, -9.9771089553833, -8.700542449951172, -7.423974990844727, -6.147407531738281, -4.870840072631836, -3.594273090362549, -2.3177058696746826, -1.0411386489868164, 0.2354288101196289, 1.511995792388916, 2.788562774658203, 4.065130233764648, 5.341697692871094, 6.618264675140381, 7.894831657409668, 9.171399116516113, 10.447966575622559, 11.724533081054688, 13.001100540161133, 14.277667999267578, 15.554235458374023, 16.83080291748047, 18.107370376586914, 19.38393783569336, 20.660503387451172, 21.937070846557617, 23.213638305664062, 24.490205764770508, 25.766773223876953, 27.0433406829834, 28.319908142089844, 29.596473693847656, 30.873043060302734, 32.14960861206055, 33.426177978515625, 34.70274353027344]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 9.0, 3.0, 6.0, 9.0, 8.0, 15.0, 11.0, 17.0, 19.0, 23.0, 30.0, 31.0, 38.0, 46.0, 37.0, 50.0, 61.0, 50.0, 43.0, 52.0, 39.0, 40.0, 48.0, 46.0, 33.0, 40.0, 32.0, 27.0, 29.0, 22.0, 8.0, 17.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8306884765625, -7.598876953125, -7.3670654296875, -7.13525390625, -6.9034423828125, -6.671630859375, -6.4398193359375, -6.2080078125, -5.9761962890625, -5.744384765625, -5.5125732421875, -5.28076171875, -5.0489501953125, -4.817138671875, -4.5853271484375, -4.353515625, -4.1217041015625, -3.889892578125, -3.6580810546875, -3.42626953125, -3.1944580078125, -2.962646484375, -2.7308349609375, -2.4990234375, -2.2672119140625, -2.035400390625, -1.8035888671875, -1.57177734375, -1.3399658203125, -1.108154296875, -0.8763427734375, -0.64453125, -0.4127197265625, -0.180908203125, 0.0509033203125, 0.28271484375, 0.5145263671875, 0.746337890625, 0.9781494140625, 1.2099609375, 1.4417724609375, 1.673583984375, 1.9053955078125, 2.13720703125, 2.3690185546875, 2.600830078125, 2.8326416015625, 3.064453125, 3.2962646484375, 3.528076171875, 3.7598876953125, 3.99169921875, 4.2235107421875, 4.455322265625, 4.6871337890625, 4.9189453125, 5.1507568359375, 5.382568359375, 5.6143798828125, 5.84619140625, 6.0780029296875, 6.309814453125, 6.5416259765625, 6.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 12.0, 17.0, 15.0, 21.0, 33.0, 51.0, 64.0, 99.0, 140.0, 221.0, 278.0, 401.0, 576.0, 804.0, 1173.0, 1677.0, 2314.0, 3318.0, 4859.0, 7100.0, 10571.0, 15474.0, 23616.0, 36895.0, 59225.0, 102145.0, 187554.0, 235718.0, 139215.0, 78025.0, 47109.0, 29310.0, 19422.0, 13134.0, 8651.0, 5912.0, 4110.0, 2755.0, 1936.0, 1408.0, 964.0, 661.0, 503.0, 298.0, 250.0, 158.0, 112.0, 83.0, 55.0, 35.0, 27.0, 15.0, 20.0, 7.0, 8.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7729415893554688, -0.7455902099609375, -0.7182388305664062, -0.690887451171875, -0.6635360717773438, -0.6361846923828125, -0.6088333129882812, -0.58148193359375, -0.5541305541992188, -0.5267791748046875, -0.49942779541015625, -0.472076416015625, -0.44472503662109375, -0.4173736572265625, -0.39002227783203125, -0.3626708984375, -0.33531951904296875, -0.3079681396484375, -0.28061676025390625, -0.253265380859375, -0.22591400146484375, -0.1985626220703125, -0.17121124267578125, -0.14385986328125, -0.11650848388671875, -0.0891571044921875, -0.06180572509765625, -0.034454345703125, -0.00710296630859375, 0.0202484130859375, 0.04759979248046875, 0.074951171875, 0.10230255126953125, 0.1296539306640625, 0.15700531005859375, 0.184356689453125, 0.21170806884765625, 0.2390594482421875, 0.26641082763671875, 0.29376220703125, 0.32111358642578125, 0.3484649658203125, 0.37581634521484375, 0.403167724609375, 0.43051910400390625, 0.4578704833984375, 0.48522186279296875, 0.5125732421875, 0.5399246215820312, 0.5672760009765625, 0.5946273803710938, 0.621978759765625, 0.6493301391601562, 0.6766815185546875, 0.7040328979492188, 0.73138427734375, 0.7587356567382812, 0.7860870361328125, 0.8134384155273438, 0.840789794921875, 0.8681411743164062, 0.8954925537109375, 0.9228439331054688, 0.9501953125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 3.0, 9.0, 15.0, 15.0, 10.0, 16.0, 22.0, 20.0, 21.0, 31.0, 35.0, 32.0, 31.0, 37.0, 35.0, 42.0, 42.0, 39.0, 1071.0, 37.0, 40.0, 41.0, 34.0, 40.0, 30.0, 32.0, 27.0, 28.0, 28.0, 27.0, 21.0, 25.0, 22.0, 12.0, 12.0, 10.0, 9.0, 7.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.55859375, -4.4268798828125, -4.295166015625, -4.1634521484375, -4.03173828125, -3.9000244140625, -3.768310546875, -3.6365966796875, -3.5048828125, -3.3731689453125, -3.241455078125, -3.1097412109375, -2.97802734375, -2.8463134765625, -2.714599609375, -2.5828857421875, -2.451171875, -2.3194580078125, -2.187744140625, -2.0560302734375, -1.92431640625, -1.7926025390625, -1.660888671875, -1.5291748046875, -1.3974609375, -1.2657470703125, -1.134033203125, -1.0023193359375, -0.87060546875, -0.7388916015625, -0.607177734375, -0.4754638671875, -0.34375, -0.2120361328125, -0.080322265625, 0.0513916015625, 0.18310546875, 0.3148193359375, 0.446533203125, 0.5782470703125, 0.7099609375, 0.8416748046875, 0.973388671875, 1.1051025390625, 1.23681640625, 1.3685302734375, 1.500244140625, 1.6319580078125, 1.763671875, 1.8953857421875, 2.027099609375, 2.1588134765625, 2.29052734375, 2.4222412109375, 2.553955078125, 2.6856689453125, 2.8173828125, 2.9490966796875, 3.080810546875, 3.2125244140625, 3.34423828125, 3.4759521484375, 3.607666015625, 3.7393798828125, 3.87109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 11.0, 19.0, 17.0, 35.0, 44.0, 74.0, 109.0, 160.0, 222.0, 304.0, 518.0, 699.0, 1061.0, 1535.0, 2365.0, 3456.0, 5323.0, 8290.0, 13146.0, 20953.0, 34880.0, 59018.0, 108088.0, 206313.0, 1298947.0, 141850.0, 75409.0, 43310.0, 25848.0, 15894.0, 10056.0, 6475.0, 4240.0, 2729.0, 1806.0, 1232.0, 850.0, 557.0, 444.0, 277.0, 172.0, 138.0, 87.0, 66.0, 37.0, 18.0, 18.0, 13.0, 11.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.849609375, -0.8240280151367188, -0.7984466552734375, -0.7728652954101562, -0.747283935546875, -0.7217025756835938, -0.6961212158203125, -0.6705398559570312, -0.64495849609375, -0.6193771362304688, -0.5937957763671875, -0.5682144165039062, -0.542633056640625, -0.5170516967773438, -0.4914703369140625, -0.46588897705078125, -0.4403076171875, -0.41472625732421875, -0.3891448974609375, -0.36356353759765625, -0.337982177734375, -0.31240081787109375, -0.2868194580078125, -0.26123809814453125, -0.23565673828125, -0.21007537841796875, -0.1844940185546875, -0.15891265869140625, -0.133331298828125, -0.10774993896484375, -0.0821685791015625, -0.05658721923828125, -0.031005859375, -0.00542449951171875, 0.0201568603515625, 0.04573822021484375, 0.071319580078125, 0.09690093994140625, 0.1224822998046875, 0.14806365966796875, 0.17364501953125, 0.19922637939453125, 0.2248077392578125, 0.25038909912109375, 0.275970458984375, 0.30155181884765625, 0.3271331787109375, 0.35271453857421875, 0.3782958984375, 0.40387725830078125, 0.4294586181640625, 0.45503997802734375, 0.480621337890625, 0.5062026977539062, 0.5317840576171875, 0.5573654174804688, 0.58294677734375, 0.6085281372070312, 0.6341094970703125, 0.6596908569335938, 0.685272216796875, 0.7108535766601562, 0.7364349365234375, 0.7620162963867188, 0.78759765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 8.0, 4.0, 8.0, 9.0, 11.0, 5.0, 16.0, 18.0, 12.0, 18.0, 26.0, 35.0, 38.0, 29.0, 40.0, 33.0, 41.0, 58.0, 49.0, 53.0, 63.0, 48.0, 36.0, 48.0, 38.0, 43.0, 37.0, 22.0, 34.0, 19.0, 20.0, 20.0, 14.0, 11.0, 10.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0016164779663085938, -0.0015639960765838623, -0.0015115141868591309, -0.0014590322971343994, -0.001406550407409668, -0.0013540685176849365, -0.001301586627960205, -0.0012491047382354736, -0.0011966228485107422, -0.0011441409587860107, -0.0010916590690612793, -0.0010391771793365479, -0.0009866952896118164, -0.000934213399887085, -0.0008817315101623535, -0.0008292496204376221, -0.0007767677307128906, -0.0007242858409881592, -0.0006718039512634277, -0.0006193220615386963, -0.0005668401718139648, -0.0005143582820892334, -0.00046187639236450195, -0.0004093945026397705, -0.00035691261291503906, -0.0003044307231903076, -0.00025194883346557617, -0.00019946694374084473, -0.00014698505401611328, -9.450316429138184e-05, -4.202127456665039e-05, 1.0460615158081055e-05, 6.29425048828125e-05, 0.00011542439460754395, 0.0001679062843322754, 0.00022038817405700684, 0.0002728700637817383, 0.0003253519535064697, 0.00037783384323120117, 0.0004303157329559326, 0.00048279762268066406, 0.0005352795124053955, 0.000587761402130127, 0.0006402432918548584, 0.0006927251815795898, 0.0007452070713043213, 0.0007976889610290527, 0.0008501708507537842, 0.0009026527404785156, 0.0009551346302032471, 0.0010076165199279785, 0.00106009840965271, 0.0011125802993774414, 0.0011650621891021729, 0.0012175440788269043, 0.0012700259685516357, 0.0013225078582763672, 0.0013749897480010986, 0.00142747163772583, 0.0014799535274505615, 0.001532435417175293, 0.0015849173069000244, 0.0016373991966247559, 0.0016898810863494873, 0.0017423629760742188]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 3.0, 8.0, 8.0, 13.0, 21.0, 23.0, 34.0, 64.0, 57.0, 77.0, 110.0, 198.0, 459.0, 1269.0, 133814.0, 908204.0, 2832.0, 602.0, 232.0, 145.0, 96.0, 66.0, 39.0, 34.0, 39.0, 19.0, 20.0, 14.0, 11.0, 12.0, 9.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03723478317260742, -0.035864830017089844, -0.034494876861572266, -0.03312492370605469, -0.03175497055053711, -0.03038501739501953, -0.029015064239501953, -0.027645111083984375, -0.026275157928466797, -0.02490520477294922, -0.02353525161743164, -0.022165298461914062, -0.020795345306396484, -0.019425392150878906, -0.018055438995361328, -0.01668548583984375, -0.015315532684326172, -0.013945579528808594, -0.012575626373291016, -0.011205673217773438, -0.00983572006225586, -0.008465766906738281, -0.007095813751220703, -0.005725860595703125, -0.004355907440185547, -0.0029859542846679688, -0.0016160011291503906, -0.0002460479736328125, 0.0011239051818847656, 0.0024938583374023438, 0.003863811492919922, 0.0052337646484375, 0.006603717803955078, 0.007973670959472656, 0.009343624114990234, 0.010713577270507812, 0.01208353042602539, 0.013453483581542969, 0.014823436737060547, 0.016193389892578125, 0.017563343048095703, 0.01893329620361328, 0.02030324935913086, 0.021673202514648438, 0.023043155670166016, 0.024413108825683594, 0.025783061981201172, 0.02715301513671875, 0.028522968292236328, 0.029892921447753906, 0.031262874603271484, 0.03263282775878906, 0.03400278091430664, 0.03537273406982422, 0.0367426872253418, 0.038112640380859375, 0.03948259353637695, 0.04085254669189453, 0.04222249984741211, 0.04359245300292969, 0.044962406158447266, 0.046332359313964844, 0.04770231246948242, 0.049072265625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 26.0, 168.0, 350.0, 318.0, 115.0, 24.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029191887006163597, -0.0027646366506814957, -0.0026100848335772753, -0.0024555327836424112, -0.002300980733707547, -0.002146428916603327, -0.0019918768666684628, -0.0018373248167335987, -0.0016827728832140565, -0.0015282209496945143, -0.0013736688997596502, -0.001219116966240108, -0.0010645650327205658, -0.0009100129827857018, -0.0007554610492661595, -0.0006009089993312955, -0.0004463570658117533, -0.00029180507408455014, -0.00013725311146117747, 1.7298851162195206e-05, 0.00017185084288939834, 0.00032640283461660147, 0.0004809547681361437, 0.0006355068180710077, 0.00079005875159055, 0.0009446107433177531, 0.0010991627350449562, 0.0012537146685644984, 0.0014082666020840406, 0.0015628186520189047, 0.001717370585538447, 0.001871922635473311, 0.002026474568992853, 0.002181026618927717, 0.0023355784360319376, 0.0024901304859668016, 0.0026446825359016657, 0.002799234353005886, 0.00295378640294075, 0.003108338452875614, 0.003262890502810478, 0.0034174425527453423, 0.0035719943698495626, 0.0037265464197844267, 0.0038810984697192907, 0.004035650286823511, 0.004190202336758375, 0.004344754386693239, 0.004499305970966816, 0.00465385802090168, 0.004808410070836544, 0.004962962120771408, 0.005117513705044985, 0.005272065754979849, 0.005426617804914713, 0.005581169854849577, 0.005735721904784441, 0.005890273954719305, 0.006044826004654169, 0.006199377588927746, 0.00635392963886261, 0.006508481688797474, 0.006663033738732338, 0.006817585788667202, 0.006972137838602066]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 10.0, 6.0, 6.0, 14.0, 15.0, 16.0, 19.0, 23.0, 26.0, 22.0, 22.0, 36.0, 28.0, 25.0, 38.0, 26.0, 45.0, 38.0, 44.0, 31.0, 58.0, 38.0, 43.0, 39.0, 36.0, 34.0, 31.0, 25.0, 21.0, 19.0, 26.0, 25.0, 16.0, 18.0, 19.0, 13.0, 11.0, 7.0, 11.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010277628898620605, -0.0009970394894480705, -0.0009663160890340805, -0.0009355926886200905, -0.0009048692882061005, -0.0008741458877921104, -0.0008434224873781204, -0.0008126990869641304, -0.0007819756865501404, -0.0007512522861361504, -0.0007205288857221603, -0.0006898054853081703, -0.0006590820848941803, -0.0006283586844801903, -0.0005976352840662003, -0.0005669118836522102, -0.0005361884832382202, -0.0005054650828242302, -0.0004747416824102402, -0.00044401828199625015, -0.00041329488158226013, -0.0003825714811682701, -0.0003518480807542801, -0.00032112468034029007, -0.00029040127992630005, -0.00025967787951231003, -0.00022895447909832, -0.00019823107868433, -0.00016750767827033997, -0.00013678427785634995, -0.00010606087744235992, -7.53374770283699e-05, -4.461407661437988e-05, -1.3890676200389862e-05, 1.683272421360016e-05, 4.755612462759018e-05, 7.82795250415802e-05, 0.00010900292545557022, 0.00013972632586956024, 0.00017044972628355026, 0.00020117312669754028, 0.0002318965271115303, 0.0002626199275255203, 0.00029334332793951035, 0.00032406672835350037, 0.0003547901287674904, 0.0003855135291814804, 0.00041623692959547043, 0.00044696033000946045, 0.00047768373042345047, 0.0005084071308374405, 0.0005391305312514305, 0.0005698539316654205, 0.0006005773320794106, 0.0006313007324934006, 0.0006620241329073906, 0.0006927475333213806, 0.0007234709337353706, 0.0007541943341493607, 0.0007849177345633507, 0.0008156411349773407, 0.0008463645353913307, 0.0008770879358053207, 0.0009078113362193108, 0.0009385347366333008]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 9.0, 3.0, 6.0, 9.0, 8.0, 15.0, 11.0, 17.0, 19.0, 23.0, 30.0, 31.0, 38.0, 46.0, 37.0, 50.0, 61.0, 50.0, 43.0, 52.0, 39.0, 40.0, 48.0, 46.0, 33.0, 40.0, 32.0, 27.0, 29.0, 22.0, 8.0, 17.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8306884765625, -7.598876953125, -7.3670654296875, -7.13525390625, -6.9034423828125, -6.671630859375, -6.4398193359375, -6.2080078125, -5.9761962890625, -5.744384765625, -5.5125732421875, -5.28076171875, -5.0489501953125, -4.817138671875, -4.5853271484375, -4.353515625, -4.1217041015625, -3.889892578125, -3.6580810546875, -3.42626953125, -3.1944580078125, -2.962646484375, -2.7308349609375, -2.4990234375, -2.2672119140625, -2.035400390625, -1.8035888671875, -1.57177734375, -1.3399658203125, -1.108154296875, -0.8763427734375, -0.64453125, -0.4127197265625, -0.180908203125, 0.0509033203125, 0.28271484375, 0.5145263671875, 0.746337890625, 0.9781494140625, 1.2099609375, 1.4417724609375, 1.673583984375, 1.9053955078125, 2.13720703125, 2.3690185546875, 2.600830078125, 2.8326416015625, 3.064453125, 3.2962646484375, 3.528076171875, 3.7598876953125, 3.99169921875, 4.2235107421875, 4.455322265625, 4.6871337890625, 4.9189453125, 5.1507568359375, 5.382568359375, 5.6143798828125, 5.84619140625, 6.0780029296875, 6.309814453125, 6.5416259765625, 6.7734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 13.0, 25.0, 27.0, 35.0, 38.0, 60.0, 85.0, 119.0, 167.0, 293.0, 425.0, 719.0, 1277.0, 2302.0, 4534.0, 9128.0, 19500.0, 42975.0, 100814.0, 304362.0, 359391.0, 112466.0, 47488.0, 21500.0, 9897.0, 4857.0, 2558.0, 1278.0, 779.0, 489.0, 303.0, 161.0, 128.0, 90.0, 70.0, 58.0, 35.0, 22.0, 12.0, 20.0, 14.0, 2.0, 7.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4921875, -5.3309326171875, -5.169677734375, -5.0084228515625, -4.84716796875, -4.6859130859375, -4.524658203125, -4.3634033203125, -4.2021484375, -4.0408935546875, -3.879638671875, -3.7183837890625, -3.55712890625, -3.3958740234375, -3.234619140625, -3.0733642578125, -2.912109375, -2.7508544921875, -2.589599609375, -2.4283447265625, -2.26708984375, -2.1058349609375, -1.944580078125, -1.7833251953125, -1.6220703125, -1.4608154296875, -1.299560546875, -1.1383056640625, -0.97705078125, -0.8157958984375, -0.654541015625, -0.4932861328125, -0.33203125, -0.1707763671875, -0.009521484375, 0.1517333984375, 0.31298828125, 0.4742431640625, 0.635498046875, 0.7967529296875, 0.9580078125, 1.1192626953125, 1.280517578125, 1.4417724609375, 1.60302734375, 1.7642822265625, 1.925537109375, 2.0867919921875, 2.248046875, 2.4093017578125, 2.570556640625, 2.7318115234375, 2.89306640625, 3.0543212890625, 3.215576171875, 3.3768310546875, 3.5380859375, 3.6993408203125, 3.860595703125, 4.0218505859375, 4.18310546875, 4.3443603515625, 4.505615234375, 4.6668701171875, 4.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 8.0, 13.0, 13.0, 16.0, 21.0, 23.0, 31.0, 40.0, 36.0, 37.0, 49.0, 41.0, 60.0, 82.0, 148.0, 1595.0, 280.0, 105.0, 69.0, 51.0, 52.0, 26.0, 35.0, 25.0, 20.0, 25.0, 22.0, 17.0, 15.0, 15.0, 14.0, 7.0, 5.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-20.734375, -20.036865234375, -19.33935546875, -18.641845703125, -17.9443359375, -17.246826171875, -16.54931640625, -15.851806640625, -15.154296875, -14.456787109375, -13.75927734375, -13.061767578125, -12.3642578125, -11.666748046875, -10.96923828125, -10.271728515625, -9.57421875, -8.876708984375, -8.17919921875, -7.481689453125, -6.7841796875, -6.086669921875, -5.38916015625, -4.691650390625, -3.994140625, -3.296630859375, -2.59912109375, -1.901611328125, -1.2041015625, -0.506591796875, 0.19091796875, 0.888427734375, 1.5859375, 2.283447265625, 2.98095703125, 3.678466796875, 4.3759765625, 5.073486328125, 5.77099609375, 6.468505859375, 7.166015625, 7.863525390625, 8.56103515625, 9.258544921875, 9.9560546875, 10.653564453125, 11.35107421875, 12.048583984375, 12.74609375, 13.443603515625, 14.14111328125, 14.838623046875, 15.5361328125, 16.233642578125, 16.93115234375, 17.628662109375, 18.326171875, 19.023681640625, 19.72119140625, 20.418701171875, 21.1162109375, 21.813720703125, 22.51123046875, 23.208740234375, 23.90625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 3.0, 12.0, 14.0, 13.0, 30.0, 39.0, 47.0, 62.0, 90.0, 138.0, 225.0, 386.0, 1086.0, 52010.0, 3086167.0, 3844.0, 607.0, 321.0, 191.0, 128.0, 82.0, 68.0, 49.0, 22.0, 23.0, 16.0, 8.0, 7.0, 7.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.4375, -51.9921875, -49.546875, -47.1015625, -44.65625, -42.2109375, -39.765625, -37.3203125, -34.875, -32.4296875, -29.984375, -27.5390625, -25.09375, -22.6484375, -20.203125, -17.7578125, -15.3125, -12.8671875, -10.421875, -7.9765625, -5.53125, -3.0859375, -0.640625, 1.8046875, 4.25, 6.6953125, 9.140625, 11.5859375, 14.03125, 16.4765625, 18.921875, 21.3671875, 23.8125, 26.2578125, 28.703125, 31.1484375, 33.59375, 36.0390625, 38.484375, 40.9296875, 43.375, 45.8203125, 48.265625, 50.7109375, 53.15625, 55.6015625, 58.046875, 60.4921875, 62.9375, 65.3828125, 67.828125, 70.2734375, 72.71875, 75.1640625, 77.609375, 80.0546875, 82.5, 84.9453125, 87.390625, 89.8359375, 92.28125, 94.7265625, 97.171875, 99.6171875, 102.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 31.0, 282.0, 556.0, 134.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40947723388672, -31.1434268951416, -26.877376556396484, -22.611328125, -18.345277786254883, -14.079227447509766, -9.813179016113281, -5.547128677368164, -1.2810783386230469, 2.984971523284912, 7.251021385192871, 11.517070770263672, 15.783121109008789, 20.049171447753906, 24.31521987915039, 28.581270217895508, 32.847320556640625, 37.11336898803711, 41.37942123413086, 45.645469665527344, 49.911521911621094, 54.17757034301758, 58.44361877441406, 62.70967102050781, 66.97572326660156, 71.24177551269531, 75.50782012939453, 79.77387237548828, 84.03992462158203, 88.30596923828125, 92.572021484375, 96.83807373046875, 101.1041259765625, 105.37017822265625, 109.63622283935547, 113.90227508544922, 118.16832733154297, 122.43437194824219, 126.70042419433594, 130.9664764404297, 135.23252868652344, 139.4985809326172, 143.76463317871094, 148.03067016601562, 152.29672241210938, 156.56277465820312, 160.82882690429688, 165.09487915039062, 169.36093139648438, 173.62698364257812, 177.89303588867188, 182.15908813476562, 186.4251251220703, 190.69117736816406, 194.9572296142578, 199.22328186035156, 203.48931884765625, 207.75537109375, 212.02142333984375, 216.2874755859375, 220.5535125732422, 224.81956481933594, 229.0856170654297, 233.35166931152344, 237.6177215576172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 12.0, 13.0, 10.0, 16.0, 19.0, 24.0, 15.0, 20.0, 26.0, 22.0, 36.0, 24.0, 30.0, 29.0, 36.0, 40.0, 46.0, 48.0, 34.0, 46.0, 42.0, 34.0, 38.0, 39.0, 41.0, 28.0, 30.0, 31.0, 15.0, 15.0, 15.0, 29.0, 13.0, 14.0, 15.0, 7.0, 11.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.328643798828125, -56.432769775390625, -54.536895751953125, -52.64101791381836, -50.74514389038086, -48.84926986694336, -46.953392028808594, -45.057518005371094, -43.161643981933594, -41.265769958496094, -39.369895935058594, -37.47401809692383, -35.57814407348633, -33.68227005004883, -31.786394119262695, -29.890518188476562, -27.994644165039062, -26.098770141601562, -24.20289421081543, -22.307018280029297, -20.411144256591797, -18.515270233154297, -16.619394302368164, -14.723519325256348, -12.827644348144531, -10.931769371032715, -9.035894393920898, -7.140019416809082, -5.244144439697266, -3.348269462585449, -1.4523944854736328, 0.4434804916381836, 2.33935546875, 4.235230445861816, 6.131105422973633, 8.02698040008545, 9.922855377197266, 11.818730354309082, 13.714605331420898, 15.610480308532715, 17.50635528564453, 19.40222930908203, 21.298105239868164, 23.193981170654297, 25.089855194091797, 26.985729217529297, 28.88160514831543, 30.777481079101562, 32.67335510253906, 34.56922912597656, 36.46510314941406, 38.36098098754883, 40.25685501098633, 42.15272903442383, 44.048606872558594, 45.944480895996094, 47.840354919433594, 49.736228942871094, 51.632102966308594, 53.52798080444336, 55.42385482788086, 57.31972885131836, 59.215606689453125, 61.111480712890625, 63.007354736328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 5.0, 12.0, 16.0, 15.0, 16.0, 13.0, 23.0, 28.0, 28.0, 35.0, 34.0, 36.0, 62.0, 50.0, 51.0, 41.0, 46.0, 45.0, 48.0, 49.0, 43.0, 48.0, 30.0, 29.0, 29.0, 38.0, 20.0, 23.0, 18.0, 12.0, 9.0, 7.0, 5.0, 6.0, 1.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2896728515625, -8.040283203125, -7.7908935546875, -7.54150390625, -7.2921142578125, -7.042724609375, -6.7933349609375, -6.5439453125, -6.2945556640625, -6.045166015625, -5.7957763671875, -5.54638671875, -5.2969970703125, -5.047607421875, -4.7982177734375, -4.548828125, -4.2994384765625, -4.050048828125, -3.8006591796875, -3.55126953125, -3.3018798828125, -3.052490234375, -2.8031005859375, -2.5537109375, -2.3043212890625, -2.054931640625, -1.8055419921875, -1.55615234375, -1.3067626953125, -1.057373046875, -0.8079833984375, -0.55859375, -0.3092041015625, -0.059814453125, 0.1895751953125, 0.43896484375, 0.6883544921875, 0.937744140625, 1.1871337890625, 1.4365234375, 1.6859130859375, 1.935302734375, 2.1846923828125, 2.43408203125, 2.6834716796875, 2.932861328125, 3.1822509765625, 3.431640625, 3.6810302734375, 3.930419921875, 4.1798095703125, 4.42919921875, 4.6785888671875, 4.927978515625, 5.1773681640625, 5.4267578125, 5.6761474609375, 5.925537109375, 6.1749267578125, 6.42431640625, 6.6737060546875, 6.923095703125, 7.1724853515625, 7.421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 6.0, 7.0, 14.0, 18.0, 19.0, 16.0, 18.0, 18.0, 32.0, 46.0, 57.0, 141.0, 338.0, 1243.0, 8945.0, 379451.0, 3636256.0, 160926.0, 5274.0, 842.0, 245.0, 78.0, 55.0, 33.0, 37.0, 40.0, 18.0, 20.0, 19.0, 14.0, 9.0, 5.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -30.25390625, -29.3203125, -28.38671875, -27.453125, -26.51953125, -25.5859375, -24.65234375, -23.71875, -22.78515625, -21.8515625, -20.91796875, -19.984375, -19.05078125, -18.1171875, -17.18359375, -16.25, -15.31640625, -14.3828125, -13.44921875, -12.515625, -11.58203125, -10.6484375, -9.71484375, -8.78125, -7.84765625, -6.9140625, -5.98046875, -5.046875, -4.11328125, -3.1796875, -2.24609375, -1.3125, -0.37890625, 0.5546875, 1.48828125, 2.421875, 3.35546875, 4.2890625, 5.22265625, 6.15625, 7.08984375, 8.0234375, 8.95703125, 9.890625, 10.82421875, 11.7578125, 12.69140625, 13.625, 14.55859375, 15.4921875, 16.42578125, 17.359375, 18.29296875, 19.2265625, 20.16015625, 21.09375, 22.02734375, 22.9609375, 23.89453125, 24.828125, 25.76171875, 26.6953125, 27.62890625, 28.5625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 11.0, 20.0, 51.0, 54.0, 85.0, 115.0, 198.0, 259.0, 404.0, 514.0, 614.0, 495.0, 407.0, 265.0, 162.0, 127.0, 86.0, 52.0, 45.0, 23.0, 15.0, 15.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -17.020263671875, -16.46240234375, -15.904541015625, -15.3466796875, -14.788818359375, -14.23095703125, -13.673095703125, -13.115234375, -12.557373046875, -11.99951171875, -11.441650390625, -10.8837890625, -10.325927734375, -9.76806640625, -9.210205078125, -8.65234375, -8.094482421875, -7.53662109375, -6.978759765625, -6.4208984375, -5.863037109375, -5.30517578125, -4.747314453125, -4.189453125, -3.631591796875, -3.07373046875, -2.515869140625, -1.9580078125, -1.400146484375, -0.84228515625, -0.284423828125, 0.2734375, 0.831298828125, 1.38916015625, 1.947021484375, 2.5048828125, 3.062744140625, 3.62060546875, 4.178466796875, 4.736328125, 5.294189453125, 5.85205078125, 6.409912109375, 6.9677734375, 7.525634765625, 8.08349609375, 8.641357421875, 9.19921875, 9.757080078125, 10.31494140625, 10.872802734375, 11.4306640625, 11.988525390625, 12.54638671875, 13.104248046875, 13.662109375, 14.219970703125, 14.77783203125, 15.335693359375, 15.8935546875, 16.451416015625, 17.00927734375, 17.567138671875, 18.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 4.0, 9.0, 13.0, 18.0, 19.0, 32.0, 46.0, 58.0, 56.0, 101.0, 124.0, 162.0, 205.0, 318.0, 653.0, 3065.0, 275106.0, 3891356.0, 20363.0, 1137.0, 432.0, 250.0, 204.0, 146.0, 100.0, 78.0, 53.0, 31.0, 29.0, 37.0, 21.0, 10.0, 9.0, 10.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.96875, -57.0830078125, -55.197265625, -53.3115234375, -51.42578125, -49.5400390625, -47.654296875, -45.7685546875, -43.8828125, -41.9970703125, -40.111328125, -38.2255859375, -36.33984375, -34.4541015625, -32.568359375, -30.6826171875, -28.796875, -26.9111328125, -25.025390625, -23.1396484375, -21.25390625, -19.3681640625, -17.482421875, -15.5966796875, -13.7109375, -11.8251953125, -9.939453125, -8.0537109375, -6.16796875, -4.2822265625, -2.396484375, -0.5107421875, 1.375, 3.2607421875, 5.146484375, 7.0322265625, 8.91796875, 10.8037109375, 12.689453125, 14.5751953125, 16.4609375, 18.3466796875, 20.232421875, 22.1181640625, 24.00390625, 25.8896484375, 27.775390625, 29.6611328125, 31.546875, 33.4326171875, 35.318359375, 37.2041015625, 39.08984375, 40.9755859375, 42.861328125, 44.7470703125, 46.6328125, 48.5185546875, 50.404296875, 52.2900390625, 54.17578125, 56.0615234375, 57.947265625, 59.8330078125, 61.71875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 131.0, 712.0, 168.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.0184631347656, -386.9118347167969, -373.80523681640625, -360.6986083984375, -347.5920104980469, -334.4853820800781, -321.3787841796875, -308.27215576171875, -295.16552734375, -282.05889892578125, -268.9523010253906, -255.84567260742188, -242.7390594482422, -229.6324462890625, -216.5258331298828, -203.41921997070312, -190.31260681152344, -177.20599365234375, -164.09938049316406, -150.99276733398438, -137.88613891601562, -124.77952575683594, -111.67291259765625, -98.56629180908203, -85.45967864990234, -72.35306549072266, -59.24644470214844, -46.13983154296875, -33.0332145690918, -19.926597595214844, -6.819984436035156, 6.2866363525390625, 19.39324951171875, 32.4998664855957, 45.606483459472656, 58.713096618652344, 71.81971740722656, 84.92633056640625, 98.03294372558594, 111.13956451416016, 124.24617767333984, 137.35279846191406, 150.45941162109375, 163.56602478027344, 176.67263793945312, 189.77926635742188, 202.8858642578125, 215.99249267578125, 229.09910583496094, 242.20571899414062, 255.3123321533203, 268.4189453125, 281.52557373046875, 294.6322021484375, 307.7388000488281, 320.8454284667969, 333.9520263671875, 347.05865478515625, 360.1652526855469, 373.2718811035156, 386.37847900390625, 399.485107421875, 412.59173583984375, 425.6983337402344, 438.8049621582031]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 9.0, 14.0, 15.0, 14.0, 18.0, 20.0, 26.0, 18.0, 20.0, 26.0, 27.0, 34.0, 38.0, 37.0, 32.0, 35.0, 33.0, 50.0, 33.0, 35.0, 42.0, 35.0, 29.0, 36.0, 25.0, 36.0, 34.0, 17.0, 33.0, 26.0, 23.0, 21.0, 23.0, 9.0, 8.0, 10.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-43.46864318847656, -42.09502029418945, -40.72139358520508, -39.34777069091797, -37.97414779663086, -36.600521087646484, -35.226898193359375, -33.853271484375, -32.47964859008789, -31.10602378845215, -29.73240089416504, -28.358776092529297, -26.985151290893555, -25.611526489257812, -24.237903594970703, -22.86427879333496, -21.49065589904785, -20.11703109741211, -18.743408203125, -17.369783401489258, -15.996158599853516, -14.62253475189209, -13.248910903930664, -11.875286102294922, -10.501662254333496, -9.12803840637207, -7.754413604736328, -6.380789756774902, -5.007165431976318, -3.6335411071777344, -2.2599172592163086, -0.8862924575805664, 0.4873313903808594, 1.8609555959701538, 3.2345798015594482, 4.608203887939453, 5.981828212738037, 7.355452537536621, 8.729076385498047, 10.102701187133789, 11.476325035095215, 12.84994888305664, 14.223573684692383, 15.597197532653809, 16.970821380615234, 18.344446182250977, 19.71807098388672, 21.091693878173828, 22.46531867980957, 23.838943481445312, 25.212566375732422, 26.586191177368164, 27.959815979003906, 29.333438873291016, 30.707063674926758, 32.0806884765625, 33.45431137084961, 34.82793426513672, 36.201560974121094, 37.5751838684082, 38.94880676269531, 40.32243347167969, 41.6960563659668, 43.069679260253906, 44.44330596923828]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 22.0, 10.0, 22.0, 25.0, 25.0, 25.0, 28.0, 38.0, 29.0, 37.0, 47.0, 58.0, 34.0, 41.0, 35.0, 54.0, 54.0, 45.0, 37.0, 46.0, 31.0, 27.0, 35.0, 24.0, 25.0, 22.0, 15.0, 15.0, 10.0, 11.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.771484375, -6.546875, -6.322265625, -6.09765625, -5.873046875, -5.6484375, -5.423828125, -5.19921875, -4.974609375, -4.75, -4.525390625, -4.30078125, -4.076171875, -3.8515625, -3.626953125, -3.40234375, -3.177734375, -2.953125, -2.728515625, -2.50390625, -2.279296875, -2.0546875, -1.830078125, -1.60546875, -1.380859375, -1.15625, -0.931640625, -0.70703125, -0.482421875, -0.2578125, -0.033203125, 0.19140625, 0.416015625, 0.640625, 0.865234375, 1.08984375, 1.314453125, 1.5390625, 1.763671875, 1.98828125, 2.212890625, 2.4375, 2.662109375, 2.88671875, 3.111328125, 3.3359375, 3.560546875, 3.78515625, 4.009765625, 4.234375, 4.458984375, 4.68359375, 4.908203125, 5.1328125, 5.357421875, 5.58203125, 5.806640625, 6.03125, 6.255859375, 6.48046875, 6.705078125, 6.9296875, 7.154296875, 7.37890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 12.0, 12.0, 16.0, 29.0, 42.0, 66.0, 90.0, 114.0, 194.0, 325.0, 385.0, 598.0, 932.0, 1371.0, 2032.0, 3006.0, 4805.0, 7178.0, 10951.0, 17592.0, 28411.0, 47938.0, 86745.0, 170054.0, 268211.0, 176793.0, 90873.0, 50007.0, 28951.0, 17878.0, 11301.0, 7340.0, 4805.0, 3142.0, 2086.0, 1357.0, 955.0, 645.0, 423.0, 288.0, 189.0, 136.0, 76.0, 66.0, 37.0, 24.0, 21.0, 25.0, 6.0, 6.0, 7.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.013671875, -0.9815216064453125, -0.949371337890625, -0.9172210693359375, -0.88507080078125, -0.8529205322265625, -0.820770263671875, -0.7886199951171875, -0.7564697265625, -0.7243194580078125, -0.692169189453125, -0.6600189208984375, -0.62786865234375, -0.5957183837890625, -0.563568115234375, -0.5314178466796875, -0.499267578125, -0.4671173095703125, -0.434967041015625, -0.4028167724609375, -0.37066650390625, -0.3385162353515625, -0.306365966796875, -0.2742156982421875, -0.2420654296875, -0.2099151611328125, -0.177764892578125, -0.1456146240234375, -0.11346435546875, -0.0813140869140625, -0.049163818359375, -0.0170135498046875, 0.01513671875, 0.0472869873046875, 0.079437255859375, 0.1115875244140625, 0.14373779296875, 0.1758880615234375, 0.208038330078125, 0.2401885986328125, 0.2723388671875, 0.3044891357421875, 0.336639404296875, 0.3687896728515625, 0.40093994140625, 0.4330902099609375, 0.465240478515625, 0.4973907470703125, 0.529541015625, 0.5616912841796875, 0.593841552734375, 0.6259918212890625, 0.65814208984375, 0.6902923583984375, 0.722442626953125, 0.7545928955078125, 0.7867431640625, 0.8188934326171875, 0.851043701171875, 0.8831939697265625, 0.91534423828125, 0.9474945068359375, 0.979644775390625, 1.0117950439453125, 1.0439453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 15.0, 9.0, 20.0, 19.0, 19.0, 13.0, 33.0, 32.0, 41.0, 33.0, 40.0, 49.0, 60.0, 52.0, 50.0, 1066.0, 42.0, 45.0, 47.0, 46.0, 40.0, 23.0, 27.0, 38.0, 28.0, 23.0, 26.0, 17.0, 15.0, 9.0, 4.0, 7.0, 4.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39080810546875, -4.2347412109375, -4.07867431640625, -3.922607421875, -3.76654052734375, -3.6104736328125, -3.45440673828125, -3.29833984375, -3.14227294921875, -2.9862060546875, -2.83013916015625, -2.674072265625, -2.51800537109375, -2.3619384765625, -2.20587158203125, -2.0498046875, -1.89373779296875, -1.7376708984375, -1.58160400390625, -1.425537109375, -1.26947021484375, -1.1134033203125, -0.95733642578125, -0.80126953125, -0.64520263671875, -0.4891357421875, -0.33306884765625, -0.177001953125, -0.02093505859375, 0.1351318359375, 0.29119873046875, 0.447265625, 0.60333251953125, 0.7593994140625, 0.91546630859375, 1.071533203125, 1.22760009765625, 1.3836669921875, 1.53973388671875, 1.69580078125, 1.85186767578125, 2.0079345703125, 2.16400146484375, 2.320068359375, 2.47613525390625, 2.6322021484375, 2.78826904296875, 2.9443359375, 3.10040283203125, 3.2564697265625, 3.41253662109375, 3.568603515625, 3.72467041015625, 3.8807373046875, 4.03680419921875, 4.19287109375, 4.34893798828125, 4.5050048828125, 4.66107177734375, 4.817138671875, 4.97320556640625, 5.1292724609375, 5.28533935546875, 5.44140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 16.0, 12.0, 27.0, 33.0, 42.0, 84.0, 110.0, 166.0, 242.0, 390.0, 641.0, 915.0, 1405.0, 2234.0, 3559.0, 5618.0, 9217.0, 15619.0, 26462.0, 45356.0, 79990.0, 152430.0, 1307931.0, 200672.0, 104155.0, 57037.0, 32956.0, 19408.0, 11458.0, 7003.0, 4331.0, 2739.0, 1741.0, 1076.0, 707.0, 462.0, 307.0, 196.0, 104.0, 108.0, 47.0, 42.0, 34.0, 15.0, 3.0, 9.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.85400390625, -0.8261947631835938, -0.7983856201171875, -0.7705764770507812, -0.742767333984375, -0.7149581909179688, -0.6871490478515625, -0.6593399047851562, -0.63153076171875, -0.6037216186523438, -0.5759124755859375, -0.5481033325195312, -0.520294189453125, -0.49248504638671875, -0.4646759033203125, -0.43686676025390625, -0.4090576171875, -0.38124847412109375, -0.3534393310546875, -0.32563018798828125, -0.297821044921875, -0.27001190185546875, -0.2422027587890625, -0.21439361572265625, -0.18658447265625, -0.15877532958984375, -0.1309661865234375, -0.10315704345703125, -0.075347900390625, -0.04753875732421875, -0.0197296142578125, 0.00807952880859375, 0.035888671875, 0.06369781494140625, 0.0915069580078125, 0.11931610107421875, 0.147125244140625, 0.17493438720703125, 0.2027435302734375, 0.23055267333984375, 0.25836181640625, 0.28617095947265625, 0.3139801025390625, 0.34178924560546875, 0.369598388671875, 0.39740753173828125, 0.4252166748046875, 0.45302581787109375, 0.4808349609375, 0.5086441040039062, 0.5364532470703125, 0.5642623901367188, 0.592071533203125, 0.6198806762695312, 0.6476898193359375, 0.6754989624023438, 0.70330810546875, 0.7311172485351562, 0.7589263916015625, 0.7867355346679688, 0.814544677734375, 0.8423538208007812, 0.8701629638671875, 0.8979721069335938, 0.92578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 11.0, 16.0, 20.0, 14.0, 29.0, 38.0, 35.0, 44.0, 46.0, 46.0, 65.0, 54.0, 55.0, 70.0, 69.0, 58.0, 60.0, 42.0, 44.0, 34.0, 25.0, 18.0, 17.0, 11.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0029659271240234375, -0.002886861562728882, -0.002807796001434326, -0.0027287304401397705, -0.002649664878845215, -0.002570599317550659, -0.0024915337562561035, -0.002412468194961548, -0.002333402633666992, -0.0022543370723724365, -0.002175271511077881, -0.002096205949783325, -0.0020171403884887695, -0.0019380748271942139, -0.0018590092658996582, -0.0017799437046051025, -0.0017008781433105469, -0.0016218125820159912, -0.0015427470207214355, -0.0014636814594268799, -0.0013846158981323242, -0.0013055503368377686, -0.0012264847755432129, -0.0011474192142486572, -0.0010683536529541016, -0.000989288091659546, -0.0009102225303649902, -0.0008311569690704346, -0.0007520914077758789, -0.0006730258464813232, -0.0005939602851867676, -0.0005148947238922119, -0.00043582916259765625, -0.0003567636013031006, -0.0002776980400085449, -0.00019863247871398926, -0.0001195669174194336, -4.050135612487793e-05, 3.8564205169677734e-05, 0.0001176297664642334, 0.00019669532775878906, 0.0002757608890533447, 0.0003548264503479004, 0.00043389201164245605, 0.0005129575729370117, 0.0005920231342315674, 0.000671088695526123, 0.0007501542568206787, 0.0008292198181152344, 0.00090828537940979, 0.0009873509407043457, 0.0010664165019989014, 0.001145482063293457, 0.0012245476245880127, 0.0013036131858825684, 0.001382678747177124, 0.0014617443084716797, 0.0015408098697662354, 0.001619875431060791, 0.0016989409923553467, 0.0017780065536499023, 0.001857072114944458, 0.0019361376762390137, 0.0020152032375335693, 0.002094268798828125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 3.0, 10.0, 16.0, 19.0, 18.0, 25.0, 40.0, 61.0, 69.0, 113.0, 146.0, 332.0, 1001.0, 124840.0, 919193.0, 1609.0, 431.0, 188.0, 101.0, 74.0, 60.0, 46.0, 33.0, 26.0, 17.0, 12.0, 10.0, 17.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050537109375, -0.04874134063720703, -0.04694557189941406, -0.045149803161621094, -0.043354034423828125, -0.041558265686035156, -0.03976249694824219, -0.03796672821044922, -0.03617095947265625, -0.03437519073486328, -0.03257942199707031, -0.030783653259277344, -0.028987884521484375, -0.027192115783691406, -0.025396347045898438, -0.02360057830810547, -0.0218048095703125, -0.02000904083251953, -0.018213272094726562, -0.016417503356933594, -0.014621734619140625, -0.012825965881347656, -0.011030197143554688, -0.009234428405761719, -0.00743865966796875, -0.005642890930175781, -0.0038471221923828125, -0.0020513534545898438, -0.000255584716796875, 0.0015401840209960938, 0.0033359527587890625, 0.005131721496582031, 0.006927490234375, 0.008723258972167969, 0.010519027709960938, 0.012314796447753906, 0.014110565185546875, 0.015906333923339844, 0.017702102661132812, 0.01949787139892578, 0.02129364013671875, 0.02308940887451172, 0.024885177612304688, 0.026680946350097656, 0.028476715087890625, 0.030272483825683594, 0.03206825256347656, 0.03386402130126953, 0.0356597900390625, 0.03745555877685547, 0.03925132751464844, 0.041047096252441406, 0.042842864990234375, 0.044638633728027344, 0.04643440246582031, 0.04823017120361328, 0.05002593994140625, 0.05182170867919922, 0.05361747741699219, 0.055413246154785156, 0.057209014892578125, 0.059004783630371094, 0.06080055236816406, 0.06259632110595703, 0.06439208984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 124.0, 433.0, 360.0, 73.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.010284267365932465, -0.010106420144438744, -0.009928571991622448, -0.009750724770128727, -0.009572876617312431, -0.00939502939581871, -0.009217181243002415, -0.009039334021508694, -0.008861485868692398, -0.008683638647198677, -0.008505790494382381, -0.00832794327288866, -0.008150095120072365, -0.007972247898578644, -0.007794399745762348, -0.00761655205860734, -0.0074387043714523315, -0.007260856684297323, -0.007083008997142315, -0.006905161309987307, -0.006727313622832298, -0.00654946593567729, -0.006371618248522282, -0.006193770561367273, -0.006015923339873552, -0.005838075652718544, -0.005660227965563536, -0.005482380278408527, -0.005304532591253519, -0.005126684904098511, -0.004948837216943502, -0.004770989529788494, -0.0045931413769721985, -0.00441529368981719, -0.004237446002662182, -0.0040595983155071735, -0.0038817506283521652, -0.003703902941197157, -0.0035260552540421486, -0.0033482075668871403, -0.0031703601125627756, -0.0029925124254077673, -0.002814664738252759, -0.0026368170510977507, -0.0024589693639427423, -0.002281121676787734, -0.0021032742224633694, -0.0019254264188930392, -0.001747578731738031, -0.0015697310445830226, -0.0013918833574280143, -0.0012140357866883278, -0.0010361880995333195, -0.0008583403541706502, -0.0006804927252233028, -0.0005026450380682945, -0.0003247973509132862, -0.00014694967831019312, 3.0897994292899966e-05, 0.00020874565234407783, 0.00038659333949908614, 0.0005644410266540945, 0.0007422886556014419, 0.0009201363427564502, 0.0010979840299114585]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 8.0, 5.0, 8.0, 16.0, 8.0, 4.0, 20.0, 20.0, 14.0, 22.0, 19.0, 23.0, 27.0, 30.0, 29.0, 33.0, 35.0, 40.0, 47.0, 44.0, 35.0, 41.0, 43.0, 44.0, 40.0, 39.0, 27.0, 33.0, 34.0, 28.0, 22.0, 21.0, 18.0, 17.0, 23.0, 16.0, 12.0, 9.0, 7.0, 11.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010445117950439453, -0.0010075448080897331, -0.0009705778211355209, -0.0009336108341813087, -0.0008966438472270966, -0.0008596768602728844, -0.0008227098733186722, -0.00078574288636446, -0.0007487758994102478, -0.0007118089124560356, -0.0006748419255018234, -0.0006378749385476112, -0.000600907951593399, -0.0005639409646391869, -0.0005269739776849747, -0.0004900069907307625, -0.0004530400037765503, -0.0004160730168223381, -0.0003791060298681259, -0.0003421390429139137, -0.00030517205595970154, -0.00026820506900548935, -0.00023123808205127716, -0.00019427109509706497, -0.00015730410814285278, -0.0001203371211886406, -8.33701342344284e-05, -4.640314728021622e-05, -9.436160326004028e-06, 2.753082662820816e-05, 6.449781358242035e-05, 0.00010146480053663254, 0.00013843178749084473, 0.00017539877444505692, 0.0002123657613992691, 0.0002493327483534813, 0.0002862997353076935, 0.00032326672226190567, 0.00036023370921611786, 0.00039720069617033005, 0.00043416768312454224, 0.0004711346700787544, 0.0005081016570329666, 0.0005450686439871788, 0.000582035630941391, 0.0006190026178956032, 0.0006559696048498154, 0.0006929365918040276, 0.0007299035787582397, 0.0007668705657124519, 0.0008038375526666641, 0.0008408045396208763, 0.0008777715265750885, 0.0009147385135293007, 0.0009517055004835129, 0.000988672487437725, 0.0010256394743919373, 0.0010626064613461494, 0.0010995734483003616, 0.0011365404352545738, 0.001173507422208786, 0.0012104744091629982, 0.0012474413961172104, 0.0012844083830714226, 0.0013213753700256348]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 22.0, 10.0, 22.0, 25.0, 25.0, 25.0, 28.0, 37.0, 30.0, 37.0, 47.0, 57.0, 35.0, 41.0, 35.0, 54.0, 54.0, 45.0, 37.0, 46.0, 30.0, 28.0, 34.0, 25.0, 25.0, 22.0, 15.0, 15.0, 10.0, 11.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.77154541015625, -6.5469970703125, -6.32244873046875, -6.097900390625, -5.87335205078125, -5.6488037109375, -5.42425537109375, -5.19970703125, -4.97515869140625, -4.7506103515625, -4.52606201171875, -4.301513671875, -4.07696533203125, -3.8524169921875, -3.62786865234375, -3.4033203125, -3.17877197265625, -2.9542236328125, -2.72967529296875, -2.505126953125, -2.28057861328125, -2.0560302734375, -1.83148193359375, -1.60693359375, -1.38238525390625, -1.1578369140625, -0.93328857421875, -0.708740234375, -0.48419189453125, -0.2596435546875, -0.03509521484375, 0.189453125, 0.41400146484375, 0.6385498046875, 0.86309814453125, 1.087646484375, 1.31219482421875, 1.5367431640625, 1.76129150390625, 1.98583984375, 2.21038818359375, 2.4349365234375, 2.65948486328125, 2.884033203125, 3.10858154296875, 3.3331298828125, 3.55767822265625, 3.7822265625, 4.00677490234375, 4.2313232421875, 4.45587158203125, 4.680419921875, 4.90496826171875, 5.1295166015625, 5.35406494140625, 5.57861328125, 5.80316162109375, 6.0277099609375, 6.25225830078125, 6.476806640625, 6.70135498046875, 6.9259033203125, 7.15045166015625, 7.375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 6.0, 10.0, 6.0, 8.0, 9.0, 22.0, 25.0, 24.0, 49.0, 73.0, 103.0, 140.0, 215.0, 317.0, 491.0, 781.0, 1210.0, 1960.0, 3402.0, 5850.0, 10314.0, 20166.0, 44728.0, 121303.0, 368936.0, 295138.0, 96451.0, 37142.0, 17281.0, 9292.0, 5130.0, 3029.0, 1770.0, 1135.0, 666.0, 461.0, 303.0, 175.0, 126.0, 78.0, 51.0, 51.0, 33.0, 28.0, 21.0, 19.0, 8.0, 9.0, 9.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.1875, -5.04296875, -4.8984375, -4.75390625, -4.609375, -4.46484375, -4.3203125, -4.17578125, -4.03125, -3.88671875, -3.7421875, -3.59765625, -3.453125, -3.30859375, -3.1640625, -3.01953125, -2.875, -2.73046875, -2.5859375, -2.44140625, -2.296875, -2.15234375, -2.0078125, -1.86328125, -1.71875, -1.57421875, -1.4296875, -1.28515625, -1.140625, -0.99609375, -0.8515625, -0.70703125, -0.5625, -0.41796875, -0.2734375, -0.12890625, 0.015625, 0.16015625, 0.3046875, 0.44921875, 0.59375, 0.73828125, 0.8828125, 1.02734375, 1.171875, 1.31640625, 1.4609375, 1.60546875, 1.75, 1.89453125, 2.0390625, 2.18359375, 2.328125, 2.47265625, 2.6171875, 2.76171875, 2.90625, 3.05078125, 3.1953125, 3.33984375, 3.484375, 3.62890625, 3.7734375, 3.91796875, 4.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 5.0, 8.0, 14.0, 13.0, 20.0, 8.0, 24.0, 33.0, 24.0, 27.0, 42.0, 33.0, 47.0, 43.0, 68.0, 100.0, 418.0, 1501.0, 124.0, 62.0, 56.0, 49.0, 45.0, 35.0, 33.0, 31.0, 20.0, 24.0, 18.0, 18.0, 20.0, 11.0, 10.0, 7.0, 11.0, 6.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-23.765625, -23.087158203125, -22.40869140625, -21.730224609375, -21.0517578125, -20.373291015625, -19.69482421875, -19.016357421875, -18.337890625, -17.659423828125, -16.98095703125, -16.302490234375, -15.6240234375, -14.945556640625, -14.26708984375, -13.588623046875, -12.91015625, -12.231689453125, -11.55322265625, -10.874755859375, -10.1962890625, -9.517822265625, -8.83935546875, -8.160888671875, -7.482421875, -6.803955078125, -6.12548828125, -5.447021484375, -4.7685546875, -4.090087890625, -3.41162109375, -2.733154296875, -2.0546875, -1.376220703125, -0.69775390625, -0.019287109375, 0.6591796875, 1.337646484375, 2.01611328125, 2.694580078125, 3.373046875, 4.051513671875, 4.72998046875, 5.408447265625, 6.0869140625, 6.765380859375, 7.44384765625, 8.122314453125, 8.80078125, 9.479248046875, 10.15771484375, 10.836181640625, 11.5146484375, 12.193115234375, 12.87158203125, 13.550048828125, 14.228515625, 14.906982421875, 15.58544921875, 16.263916015625, 16.9423828125, 17.620849609375, 18.29931640625, 18.977783203125, 19.65625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 14.0, 17.0, 30.0, 32.0, 56.0, 64.0, 89.0, 146.0, 208.0, 305.0, 537.0, 3038.0, 3095564.0, 43684.0, 817.0, 365.0, 248.0, 159.0, 93.0, 69.0, 50.0, 26.0, 24.0, 17.0, 7.0, 10.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.8125, -69.314453125, -66.81640625, -64.318359375, -61.8203125, -59.322265625, -56.82421875, -54.326171875, -51.828125, -49.330078125, -46.83203125, -44.333984375, -41.8359375, -39.337890625, -36.83984375, -34.341796875, -31.84375, -29.345703125, -26.84765625, -24.349609375, -21.8515625, -19.353515625, -16.85546875, -14.357421875, -11.859375, -9.361328125, -6.86328125, -4.365234375, -1.8671875, 0.630859375, 3.12890625, 5.626953125, 8.125, 10.623046875, 13.12109375, 15.619140625, 18.1171875, 20.615234375, 23.11328125, 25.611328125, 28.109375, 30.607421875, 33.10546875, 35.603515625, 38.1015625, 40.599609375, 43.09765625, 45.595703125, 48.09375, 50.591796875, 53.08984375, 55.587890625, 58.0859375, 60.583984375, 63.08203125, 65.580078125, 68.078125, 70.576171875, 73.07421875, 75.572265625, 78.0703125, 80.568359375, 83.06640625, 85.564453125, 88.0625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 7.0, 709.0, 298.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.23029327392578, -29.586578369140625, -21.94286346435547, -14.299150466918945, -6.655435562133789, 0.9882774353027344, 8.63199234008789, 16.275707244873047, 23.919422149658203, 31.56313705444336, 39.206851959228516, 46.850563049316406, 54.49427795410156, 62.13799285888672, 69.78170776367188, 77.42542266845703, 85.06913757324219, 92.71285247802734, 100.3565673828125, 108.00028228759766, 115.64399719238281, 123.28770446777344, 130.93142700195312, 138.57513427734375, 146.21885681152344, 153.86256408691406, 161.50628662109375, 169.14999389648438, 176.79371643066406, 184.4374237060547, 192.08114624023438, 199.724853515625, 207.3685760498047, 215.0122833251953, 222.656005859375, 230.29971313476562, 237.9434356689453, 245.58714294433594, 253.23086547851562, 260.87457275390625, 268.5182800292969, 276.1619873046875, 283.8056945800781, 291.4494323730469, 299.0931396484375, 306.7368469238281, 314.38055419921875, 322.0242919921875, 329.6679992675781, 337.31170654296875, 344.9554138183594, 352.5991516113281, 360.24285888671875, 367.8865661621094, 375.5302734375, 383.17401123046875, 390.8177185058594, 398.46142578125, 406.1051330566406, 413.7488708496094, 421.392578125, 429.0362854003906, 436.67999267578125, 444.32373046875, 451.9674377441406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 13.0, 9.0, 12.0, 15.0, 13.0, 23.0, 16.0, 19.0, 23.0, 23.0, 31.0, 38.0, 35.0, 38.0, 40.0, 39.0, 40.0, 38.0, 48.0, 33.0, 31.0, 46.0, 38.0, 38.0, 34.0, 30.0, 35.0, 22.0, 21.0, 14.0, 17.0, 18.0, 12.0, 18.0, 12.0, 12.0, 7.0, 8.0, 4.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.44548797607422, -47.808387756347656, -46.171287536621094, -44.53418731689453, -42.89708709716797, -41.259986877441406, -39.622886657714844, -37.98578643798828, -36.34868621826172, -34.711585998535156, -33.074485778808594, -31.43738555908203, -29.80028533935547, -28.163185119628906, -26.526084899902344, -24.88898468017578, -23.25188446044922, -21.614784240722656, -19.977684020996094, -18.34058380126953, -16.70348358154297, -15.066383361816406, -13.429283142089844, -11.792182922363281, -10.155082702636719, -8.517982482910156, -6.880882263183594, -5.243782043457031, -3.6066818237304688, -1.9695816040039062, -0.33248138427734375, 1.3046188354492188, 2.9417190551757812, 4.578819274902344, 6.215919494628906, 7.853019714355469, 9.490119934082031, 11.127220153808594, 12.764320373535156, 14.401420593261719, 16.03852081298828, 17.675621032714844, 19.312721252441406, 20.94982147216797, 22.58692169189453, 24.224021911621094, 25.861122131347656, 27.49822235107422, 29.13532257080078, 30.772422790527344, 32.409523010253906, 34.04662322998047, 35.68372344970703, 37.320823669433594, 38.957923889160156, 40.59502410888672, 42.23212432861328, 43.869224548339844, 45.506324768066406, 47.14342498779297, 48.78052520751953, 50.417625427246094, 52.054725646972656, 53.69182586669922, 55.32892608642578]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 4.0, 5.0, 8.0, 7.0, 8.0, 13.0, 16.0, 21.0, 25.0, 25.0, 30.0, 36.0, 33.0, 36.0, 37.0, 31.0, 45.0, 41.0, 47.0, 51.0, 41.0, 45.0, 51.0, 38.0, 36.0, 41.0, 29.0, 30.0, 27.0, 25.0, 11.0, 18.0, 18.0, 14.0, 12.0, 6.0, 11.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.42388916015625, -7.1915283203125, -6.95916748046875, -6.726806640625, -6.49444580078125, -6.2620849609375, -6.02972412109375, -5.79736328125, -5.56500244140625, -5.3326416015625, -5.10028076171875, -4.867919921875, -4.63555908203125, -4.4031982421875, -4.17083740234375, -3.9384765625, -3.70611572265625, -3.4737548828125, -3.24139404296875, -3.009033203125, -2.77667236328125, -2.5443115234375, -2.31195068359375, -2.07958984375, -1.84722900390625, -1.6148681640625, -1.38250732421875, -1.150146484375, -0.91778564453125, -0.6854248046875, -0.45306396484375, -0.220703125, 0.01165771484375, 0.2440185546875, 0.47637939453125, 0.708740234375, 0.94110107421875, 1.1734619140625, 1.40582275390625, 1.63818359375, 1.87054443359375, 2.1029052734375, 2.33526611328125, 2.567626953125, 2.79998779296875, 3.0323486328125, 3.26470947265625, 3.4970703125, 3.72943115234375, 3.9617919921875, 4.19415283203125, 4.426513671875, 4.65887451171875, 4.8912353515625, 5.12359619140625, 5.35595703125, 5.58831787109375, 5.8206787109375, 6.05303955078125, 6.285400390625, 6.51776123046875, 6.7501220703125, 6.98248291015625, 7.21484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 7.0, 7.0, 11.0, 9.0, 12.0, 19.0, 20.0, 36.0, 25.0, 41.0, 84.0, 108.0, 208.0, 416.0, 1025.0, 3206.0, 16757.0, 250208.0, 2602015.0, 1237472.0, 72396.0, 7118.0, 1719.0, 631.0, 263.0, 140.0, 79.0, 55.0, 33.0, 23.0, 20.0, 19.0, 24.0, 11.0, 9.0, 8.0, 10.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.984375, -18.42236328125, -17.8603515625, -17.29833984375, -16.736328125, -16.17431640625, -15.6123046875, -15.05029296875, -14.48828125, -13.92626953125, -13.3642578125, -12.80224609375, -12.240234375, -11.67822265625, -11.1162109375, -10.55419921875, -9.9921875, -9.43017578125, -8.8681640625, -8.30615234375, -7.744140625, -7.18212890625, -6.6201171875, -6.05810546875, -5.49609375, -4.93408203125, -4.3720703125, -3.81005859375, -3.248046875, -2.68603515625, -2.1240234375, -1.56201171875, -1.0, -0.43798828125, 0.1240234375, 0.68603515625, 1.248046875, 1.81005859375, 2.3720703125, 2.93408203125, 3.49609375, 4.05810546875, 4.6201171875, 5.18212890625, 5.744140625, 6.30615234375, 6.8681640625, 7.43017578125, 7.9921875, 8.55419921875, 9.1162109375, 9.67822265625, 10.240234375, 10.80224609375, 11.3642578125, 11.92626953125, 12.48828125, 13.05029296875, 13.6123046875, 14.17431640625, 14.736328125, 15.29833984375, 15.8603515625, 16.42236328125, 16.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 5.0, 9.0, 20.0, 29.0, 40.0, 80.0, 80.0, 106.0, 165.0, 224.0, 338.0, 428.0, 493.0, 528.0, 419.0, 315.0, 226.0, 155.0, 106.0, 88.0, 56.0, 38.0, 26.0, 23.0, 12.0, 16.0, 10.0, 3.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.78125, -16.3271484375, -15.873046875, -15.4189453125, -14.96484375, -14.5107421875, -14.056640625, -13.6025390625, -13.1484375, -12.6943359375, -12.240234375, -11.7861328125, -11.33203125, -10.8779296875, -10.423828125, -9.9697265625, -9.515625, -9.0615234375, -8.607421875, -8.1533203125, -7.69921875, -7.2451171875, -6.791015625, -6.3369140625, -5.8828125, -5.4287109375, -4.974609375, -4.5205078125, -4.06640625, -3.6123046875, -3.158203125, -2.7041015625, -2.25, -1.7958984375, -1.341796875, -0.8876953125, -0.43359375, 0.0205078125, 0.474609375, 0.9287109375, 1.3828125, 1.8369140625, 2.291015625, 2.7451171875, 3.19921875, 3.6533203125, 4.107421875, 4.5615234375, 5.015625, 5.4697265625, 5.923828125, 6.3779296875, 6.83203125, 7.2861328125, 7.740234375, 8.1943359375, 8.6484375, 9.1025390625, 9.556640625, 10.0107421875, 10.46484375, 10.9189453125, 11.373046875, 11.8271484375, 12.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 12.0, 16.0, 29.0, 31.0, 36.0, 42.0, 57.0, 75.0, 87.0, 117.0, 146.0, 200.0, 301.0, 520.0, 1257.0, 21363.0, 3603105.0, 559970.0, 4623.0, 782.0, 402.0, 258.0, 181.0, 148.0, 109.0, 101.0, 60.0, 44.0, 41.0, 34.0, 24.0, 17.0, 14.0, 12.0, 11.0, 10.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.15625, -46.5927734375, -45.029296875, -43.4658203125, -41.90234375, -40.3388671875, -38.775390625, -37.2119140625, -35.6484375, -34.0849609375, -32.521484375, -30.9580078125, -29.39453125, -27.8310546875, -26.267578125, -24.7041015625, -23.140625, -21.5771484375, -20.013671875, -18.4501953125, -16.88671875, -15.3232421875, -13.759765625, -12.1962890625, -10.6328125, -9.0693359375, -7.505859375, -5.9423828125, -4.37890625, -2.8154296875, -1.251953125, 0.3115234375, 1.875, 3.4384765625, 5.001953125, 6.5654296875, 8.12890625, 9.6923828125, 11.255859375, 12.8193359375, 14.3828125, 15.9462890625, 17.509765625, 19.0732421875, 20.63671875, 22.2001953125, 23.763671875, 25.3271484375, 26.890625, 28.4541015625, 30.017578125, 31.5810546875, 33.14453125, 34.7080078125, 36.271484375, 37.8349609375, 39.3984375, 40.9619140625, 42.525390625, 44.0888671875, 45.65234375, 47.2158203125, 48.779296875, 50.3427734375, 51.90625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 14.0, 41.0, 77.0, 124.0, 179.0, 191.0, 168.0, 110.0, 60.0, 24.0, 14.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-143.77023315429688, -140.96571350097656, -138.1612091064453, -135.356689453125, -132.55218505859375, -129.74766540527344, -126.94316101074219, -124.1386489868164, -121.33413696289062, -118.52962493896484, -115.72511291503906, -112.92060089111328, -110.1160888671875, -107.31157684326172, -104.50706481933594, -101.70255279541016, -98.89804077148438, -96.0935287475586, -93.28901672363281, -90.48450469970703, -87.67999267578125, -84.87548065185547, -82.07096862792969, -79.2664566040039, -76.4619369506836, -73.65742492675781, -70.85291290283203, -68.04840087890625, -65.24388885498047, -62.43937683105469, -59.634864807128906, -56.830352783203125, -54.02584457397461, -51.22133255004883, -48.41682052612305, -45.612308502197266, -42.807796478271484, -40.0032844543457, -37.198768615722656, -34.394256591796875, -31.589746475219727, -28.785234451293945, -25.980722427368164, -23.17620849609375, -20.37169647216797, -17.567184448242188, -14.762672424316406, -11.958160400390625, -9.153648376464844, -6.3491363525390625, -3.544623851776123, -0.7401113510131836, 2.0644006729125977, 4.868912696838379, 7.673425674438477, 10.477937698364258, 13.282449722290039, 16.08696174621582, 18.8914737701416, 21.695987701416016, 24.500499725341797, 27.305011749267578, 30.10952377319336, 32.91403579711914, 35.71854782104492]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 6.0, 6.0, 11.0, 11.0, 17.0, 11.0, 20.0, 21.0, 24.0, 23.0, 26.0, 33.0, 35.0, 42.0, 33.0, 37.0, 46.0, 37.0, 38.0, 40.0, 55.0, 40.0, 39.0, 45.0, 34.0, 34.0, 23.0, 17.0, 24.0, 23.0, 20.0, 22.0, 18.0, 12.0, 15.0, 13.0, 10.0, 4.0, 6.0, 3.0, 13.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-39.9771728515625, -38.68795394897461, -37.39873123168945, -36.10951232910156, -34.820289611816406, -33.531070709228516, -32.241851806640625, -30.9526309967041, -29.663410186767578, -28.374189376831055, -27.08496856689453, -25.79574966430664, -24.506528854370117, -23.217308044433594, -21.928089141845703, -20.63886833190918, -19.349647521972656, -18.060426712036133, -16.77120590209961, -15.481986999511719, -14.192766189575195, -12.903545379638672, -11.614325523376465, -10.325105667114258, -9.035884857177734, -7.746664524078369, -6.457444190979004, -5.168223857879639, -3.8790035247802734, -2.589783191680908, -1.300562858581543, -0.011343002319335938, 1.2778778076171875, 2.5670981407165527, 3.856318473815918, 5.145538806915283, 6.434759140014648, 7.723979473114014, 9.013199806213379, 10.302419662475586, 11.59164047241211, 12.880861282348633, 14.17008113861084, 15.459300994873047, 16.74852180480957, 18.037742614746094, 19.326961517333984, 20.616182327270508, 21.90540313720703, 23.194623947143555, 24.483844757080078, 25.77306365966797, 27.062284469604492, 28.351505279541016, 29.640724182128906, 30.92994499206543, 32.21916580200195, 33.508384704589844, 34.797607421875, 36.08682632446289, 37.37604522705078, 38.66526794433594, 39.95448684692383, 41.24370574951172, 42.532928466796875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 23.0, 17.0, 15.0, 14.0, 24.0, 27.0, 25.0, 42.0, 36.0, 34.0, 40.0, 42.0, 47.0, 39.0, 51.0, 40.0, 48.0, 47.0, 41.0, 46.0, 36.0, 32.0, 33.0, 23.0, 26.0, 22.0, 10.0, 21.0, 15.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2734375, -7.04705810546875, -6.8206787109375, -6.59429931640625, -6.367919921875, -6.14154052734375, -5.9151611328125, -5.68878173828125, -5.46240234375, -5.23602294921875, -5.0096435546875, -4.78326416015625, -4.556884765625, -4.33050537109375, -4.1041259765625, -3.87774658203125, -3.6513671875, -3.42498779296875, -3.1986083984375, -2.97222900390625, -2.745849609375, -2.51947021484375, -2.2930908203125, -2.06671142578125, -1.84033203125, -1.61395263671875, -1.3875732421875, -1.16119384765625, -0.934814453125, -0.70843505859375, -0.4820556640625, -0.25567626953125, -0.029296875, 0.19708251953125, 0.4234619140625, 0.64984130859375, 0.876220703125, 1.10260009765625, 1.3289794921875, 1.55535888671875, 1.78173828125, 2.00811767578125, 2.2344970703125, 2.46087646484375, 2.687255859375, 2.91363525390625, 3.1400146484375, 3.36639404296875, 3.5927734375, 3.81915283203125, 4.0455322265625, 4.27191162109375, 4.498291015625, 4.72467041015625, 4.9510498046875, 5.17742919921875, 5.40380859375, 5.63018798828125, 5.8565673828125, 6.08294677734375, 6.309326171875, 6.53570556640625, 6.7620849609375, 6.98846435546875, 7.21484375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 15.0, 20.0, 39.0, 47.0, 64.0, 104.0, 149.0, 227.0, 367.0, 597.0, 1016.0, 1653.0, 2657.0, 4565.0, 7797.0, 13340.0, 23410.0, 42577.0, 85791.0, 200466.0, 331554.0, 169827.0, 73874.0, 37940.0, 20965.0, 12132.0, 6989.0, 4117.0, 2376.0, 1490.0, 933.0, 532.0, 324.0, 216.0, 107.0, 89.0, 60.0, 43.0, 27.0, 17.0, 17.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.32421875, -1.284576416015625, -1.24493408203125, -1.205291748046875, -1.1656494140625, -1.126007080078125, -1.08636474609375, -1.046722412109375, -1.007080078125, -0.967437744140625, -0.92779541015625, -0.888153076171875, -0.8485107421875, -0.808868408203125, -0.76922607421875, -0.729583740234375, -0.68994140625, -0.650299072265625, -0.61065673828125, -0.571014404296875, -0.5313720703125, -0.491729736328125, -0.45208740234375, -0.412445068359375, -0.372802734375, -0.333160400390625, -0.29351806640625, -0.253875732421875, -0.2142333984375, -0.174591064453125, -0.13494873046875, -0.095306396484375, -0.0556640625, -0.016021728515625, 0.02362060546875, 0.063262939453125, 0.1029052734375, 0.142547607421875, 0.18218994140625, 0.221832275390625, 0.261474609375, 0.301116943359375, 0.34075927734375, 0.380401611328125, 0.4200439453125, 0.459686279296875, 0.49932861328125, 0.538970947265625, 0.57861328125, 0.618255615234375, 0.65789794921875, 0.697540283203125, 0.7371826171875, 0.776824951171875, 0.81646728515625, 0.856109619140625, 0.895751953125, 0.935394287109375, 0.97503662109375, 1.014678955078125, 1.0543212890625, 1.093963623046875, 1.13360595703125, 1.173248291015625, 1.212890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 4.0, 8.0, 10.0, 17.0, 13.0, 17.0, 26.0, 23.0, 30.0, 29.0, 35.0, 39.0, 44.0, 58.0, 44.0, 57.0, 1071.0, 63.0, 30.0, 45.0, 49.0, 35.0, 44.0, 27.0, 30.0, 32.0, 31.0, 21.0, 14.0, 14.0, 17.0, 12.0, 6.0, 4.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.1788330078125, -5.025634765625, -4.8724365234375, -4.71923828125, -4.5660400390625, -4.412841796875, -4.2596435546875, -4.1064453125, -3.9532470703125, -3.800048828125, -3.6468505859375, -3.49365234375, -3.3404541015625, -3.187255859375, -3.0340576171875, -2.880859375, -2.7276611328125, -2.574462890625, -2.4212646484375, -2.26806640625, -2.1148681640625, -1.961669921875, -1.8084716796875, -1.6552734375, -1.5020751953125, -1.348876953125, -1.1956787109375, -1.04248046875, -0.8892822265625, -0.736083984375, -0.5828857421875, -0.4296875, -0.2764892578125, -0.123291015625, 0.0299072265625, 0.18310546875, 0.3363037109375, 0.489501953125, 0.6427001953125, 0.7958984375, 0.9490966796875, 1.102294921875, 1.2554931640625, 1.40869140625, 1.5618896484375, 1.715087890625, 1.8682861328125, 2.021484375, 2.1746826171875, 2.327880859375, 2.4810791015625, 2.63427734375, 2.7874755859375, 2.940673828125, 3.0938720703125, 3.2470703125, 3.4002685546875, 3.553466796875, 3.7066650390625, 3.85986328125, 4.0130615234375, 4.166259765625, 4.3194580078125, 4.47265625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 9.0, 18.0, 13.0, 20.0, 38.0, 57.0, 97.0, 131.0, 210.0, 293.0, 406.0, 636.0, 859.0, 1225.0, 1899.0, 2701.0, 3960.0, 5985.0, 8940.0, 13788.0, 21232.0, 33347.0, 54337.0, 92945.0, 166896.0, 1286126.0, 163465.0, 90705.0, 52642.0, 32753.0, 20920.0, 13602.0, 8762.0, 5767.0, 3841.0, 2620.0, 1815.0, 1264.0, 826.0, 649.0, 426.0, 284.0, 207.0, 126.0, 105.0, 51.0, 40.0, 26.0, 29.0, 17.0, 7.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.75244140625, -0.7285385131835938, -0.7046356201171875, -0.6807327270507812, -0.656829833984375, -0.6329269409179688, -0.6090240478515625, -0.5851211547851562, -0.56121826171875, -0.5373153686523438, -0.5134124755859375, -0.48950958251953125, -0.465606689453125, -0.44170379638671875, -0.4178009033203125, -0.39389801025390625, -0.3699951171875, -0.34609222412109375, -0.3221893310546875, -0.29828643798828125, -0.274383544921875, -0.25048065185546875, -0.2265777587890625, -0.20267486572265625, -0.17877197265625, -0.15486907958984375, -0.1309661865234375, -0.10706329345703125, -0.083160400390625, -0.05925750732421875, -0.0353546142578125, -0.01145172119140625, 0.012451171875, 0.03635406494140625, 0.0602569580078125, 0.08415985107421875, 0.108062744140625, 0.13196563720703125, 0.1558685302734375, 0.17977142333984375, 0.20367431640625, 0.22757720947265625, 0.2514801025390625, 0.27538299560546875, 0.299285888671875, 0.32318878173828125, 0.3470916748046875, 0.37099456787109375, 0.3948974609375, 0.41880035400390625, 0.4427032470703125, 0.46660614013671875, 0.490509033203125, 0.5144119262695312, 0.5383148193359375, 0.5622177124023438, 0.58612060546875, 0.6100234985351562, 0.6339263916015625, 0.6578292846679688, 0.681732177734375, 0.7056350708007812, 0.7295379638671875, 0.7534408569335938, 0.77734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 4.0, 16.0, 10.0, 14.0, 23.0, 24.0, 27.0, 29.0, 34.0, 29.0, 34.0, 50.0, 54.0, 51.0, 62.0, 62.0, 58.0, 63.0, 45.0, 40.0, 48.0, 33.0, 27.0, 28.0, 28.0, 22.0, 11.0, 8.0, 6.0, 16.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022449493408203125, -0.0021731555461883545, -0.0021013617515563965, -0.0020295679569244385, -0.0019577741622924805, -0.0018859803676605225, -0.0018141865730285645, -0.0017423927783966064, -0.0016705989837646484, -0.0015988051891326904, -0.0015270113945007324, -0.0014552175998687744, -0.0013834238052368164, -0.0013116300106048584, -0.0012398362159729004, -0.0011680424213409424, -0.0010962486267089844, -0.0010244548320770264, -0.0009526610374450684, -0.0008808672428131104, -0.0008090734481811523, -0.0007372796535491943, -0.0006654858589172363, -0.0005936920642852783, -0.0005218982696533203, -0.0004501044750213623, -0.0003783106803894043, -0.0003065168857574463, -0.00023472309112548828, -0.00016292929649353027, -9.113550186157227e-05, -1.9341707229614258e-05, 5.245208740234375e-05, 0.00012424588203430176, 0.00019603967666625977, 0.0002678334712982178, 0.0003396272659301758, 0.0004114210605621338, 0.0004832148551940918, 0.0005550086498260498, 0.0006268024444580078, 0.0006985962390899658, 0.0007703900337219238, 0.0008421838283538818, 0.0009139776229858398, 0.0009857714176177979, 0.0010575652122497559, 0.0011293590068817139, 0.0012011528015136719, 0.0012729465961456299, 0.0013447403907775879, 0.001416534185409546, 0.001488327980041504, 0.001560121774673462, 0.00163191556930542, 0.001703709363937378, 0.001775503158569336, 0.001847296953201294, 0.001919090747833252, 0.00199088454246521, 0.002062678337097168, 0.002134472131729126, 0.002206265926361084, 0.002278059720993042, 0.002349853515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 14.0, 13.0, 7.0, 20.0, 23.0, 24.0, 22.0, 51.0, 54.0, 87.0, 102.0, 182.0, 443.0, 2359.0, 1002963.0, 40532.0, 899.0, 242.0, 114.0, 93.0, 63.0, 50.0, 41.0, 31.0, 21.0, 20.0, 16.0, 11.0, 9.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05712890625, -0.055384159088134766, -0.05363941192626953, -0.0518946647644043, -0.05014991760253906, -0.04840517044067383, -0.046660423278808594, -0.04491567611694336, -0.043170928955078125, -0.04142618179321289, -0.039681434631347656, -0.03793668746948242, -0.03619194030761719, -0.03444719314575195, -0.03270244598388672, -0.030957698822021484, -0.02921295166015625, -0.027468204498291016, -0.02572345733642578, -0.023978710174560547, -0.022233963012695312, -0.020489215850830078, -0.018744468688964844, -0.01699972152709961, -0.015254974365234375, -0.01351022720336914, -0.011765480041503906, -0.010020732879638672, -0.008275985717773438, -0.006531238555908203, -0.004786491394042969, -0.0030417442321777344, -0.0012969970703125, 0.0004477500915527344, 0.0021924972534179688, 0.003937244415283203, 0.0056819915771484375, 0.007426738739013672, 0.009171485900878906, 0.01091623306274414, 0.012660980224609375, 0.01440572738647461, 0.016150474548339844, 0.017895221710205078, 0.019639968872070312, 0.021384716033935547, 0.02312946319580078, 0.024874210357666016, 0.02661895751953125, 0.028363704681396484, 0.03010845184326172, 0.03185319900512695, 0.03359794616699219, 0.03534269332885742, 0.037087440490722656, 0.03883218765258789, 0.040576934814453125, 0.04232168197631836, 0.044066429138183594, 0.04581117630004883, 0.04755592346191406, 0.0493006706237793, 0.05104541778564453, 0.052790164947509766, 0.054534912109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 19.0, 154.0, 387.0, 339.0, 91.0, 18.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008039196953177452, -0.007878146134316921, -0.00771709531545639, -0.0075560444965958595, -0.007394993677735329, -0.0072339423932135105, -0.00707289157435298, -0.006911840755492449, -0.006750789936631918, -0.006589739117771387, -0.006428688298910856, -0.006267637480050325, -0.006106586195528507, -0.005945535376667976, -0.0057844845578074455, -0.005623433738946915, -0.005462382920086384, -0.005301332101225853, -0.005140281282365322, -0.004979230463504791, -0.00481817964464426, -0.004657128360122442, -0.004496077541261911, -0.0043350267224013805, -0.00417397590354085, -0.004012925084680319, -0.003851874265819788, -0.0036908232141286135, -0.0035297723952680826, -0.0033687215764075518, -0.0032076705247163773, -0.0030466197058558464, -0.002885569352656603, -0.002724518533796072, -0.002563467714935541, -0.0024024166632443666, -0.002241365844383836, -0.002080315025523305, -0.0019192640902474523, -0.0017582131549715996, -0.0015971623361110687, -0.0014361115172505379, -0.0012750605819746852, -0.0011140096466988325, -0.0009529588278383017, -0.0007919079507701099, -0.0006308570737019181, -0.00046980613842606544, -0.0003087553195655346, -0.00014770444249734282, 1.3346434570848942e-05, 0.0001743973116390407, 0.0003354481887072325, 0.0004964990657754242, 0.000657549942843616, 0.0008186008781194687, 0.0009796516969799995, 0.0011407025158405304, 0.001301753451116383, 0.0014628043863922358, 0.0016238552052527666, 0.0017849060241132975, 0.0019459569593891501, 0.002107007894665003, 0.0022680587135255337]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 10.0, 7.0, 7.0, 6.0, 6.0, 9.0, 24.0, 16.0, 23.0, 21.0, 19.0, 22.0, 24.0, 28.0, 40.0, 42.0, 28.0, 33.0, 26.0, 44.0, 28.0, 39.0, 45.0, 30.0, 48.0, 39.0, 38.0, 46.0, 36.0, 24.0, 21.0, 26.0, 20.0, 27.0, 16.0, 17.0, 7.0, 17.0, 5.0, 6.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0011587142944335938, -0.0011224783957004547, -0.0010862424969673157, -0.0010500065982341766, -0.0010137706995010376, -0.0009775348007678986, -0.0009412989020347595, -0.0009050630033016205, -0.0008688271045684814, -0.0008325912058353424, -0.0007963553071022034, -0.0007601194083690643, -0.0007238835096359253, -0.0006876476109027863, -0.0006514117121696472, -0.0006151758134365082, -0.0005789399147033691, -0.0005427040159702301, -0.0005064681172370911, -0.000470232218503952, -0.000433996319770813, -0.00039776042103767395, -0.0003615245223045349, -0.0003252886235713959, -0.00028905272483825684, -0.0002528168261051178, -0.00021658092737197876, -0.00018034502863883972, -0.00014410912990570068, -0.00010787323117256165, -7.163733243942261e-05, -3.540143370628357e-05, 8.344650268554688e-07, 3.707036375999451e-05, 7.330626249313354e-05, 0.00010954216122627258, 0.00014577805995941162, 0.00018201395869255066, 0.0002182498574256897, 0.00025448575615882874, 0.0002907216548919678, 0.0003269575536251068, 0.00036319345235824585, 0.0003994293510913849, 0.0004356652498245239, 0.00047190114855766296, 0.000508137047290802, 0.000544372946023941, 0.0005806088447570801, 0.0006168447434902191, 0.0006530806422233582, 0.0006893165409564972, 0.0007255524396896362, 0.0007617883384227753, 0.0007980242371559143, 0.0008342601358890533, 0.0008704960346221924, 0.0009067319333553314, 0.0009429678320884705, 0.0009792037308216095, 0.0010154396295547485, 0.0010516755282878876, 0.0010879114270210266, 0.0011241473257541656, 0.0011603832244873047]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 23.0, 17.0, 15.0, 14.0, 24.0, 27.0, 25.0, 42.0, 36.0, 34.0, 40.0, 42.0, 47.0, 39.0, 51.0, 40.0, 48.0, 47.0, 41.0, 46.0, 36.0, 32.0, 33.0, 23.0, 26.0, 22.0, 10.0, 21.0, 15.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2734375, -7.04705810546875, -6.8206787109375, -6.59429931640625, -6.367919921875, -6.14154052734375, -5.9151611328125, -5.68878173828125, -5.46240234375, -5.23602294921875, -5.0096435546875, -4.78326416015625, -4.556884765625, -4.33050537109375, -4.1041259765625, -3.87774658203125, -3.6513671875, -3.42498779296875, -3.1986083984375, -2.97222900390625, -2.745849609375, -2.51947021484375, -2.2930908203125, -2.06671142578125, -1.84033203125, -1.61395263671875, -1.3875732421875, -1.16119384765625, -0.934814453125, -0.70843505859375, -0.4820556640625, -0.25567626953125, -0.029296875, 0.19708251953125, 0.4234619140625, 0.64984130859375, 0.876220703125, 1.10260009765625, 1.3289794921875, 1.55535888671875, 1.78173828125, 2.00811767578125, 2.2344970703125, 2.46087646484375, 2.687255859375, 2.91363525390625, 3.1400146484375, 3.36639404296875, 3.5927734375, 3.81915283203125, 4.0455322265625, 4.27191162109375, 4.498291015625, 4.72467041015625, 4.9510498046875, 5.17742919921875, 5.40380859375, 5.63018798828125, 5.8565673828125, 6.08294677734375, 6.309326171875, 6.53570556640625, 6.7620849609375, 6.98846435546875, 7.21484375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 11.0, 11.0, 15.0, 18.0, 36.0, 34.0, 42.0, 78.0, 118.0, 203.0, 328.0, 690.0, 1236.0, 2507.0, 5625.0, 14856.0, 56201.0, 326771.0, 522375.0, 84228.0, 19846.0, 6907.0, 3033.0, 1464.0, 775.0, 415.0, 261.0, 154.0, 102.0, 50.0, 35.0, 40.0, 25.0, 17.0, 12.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.03515625, -6.816162109375, -6.59716796875, -6.378173828125, -6.1591796875, -5.940185546875, -5.72119140625, -5.502197265625, -5.283203125, -5.064208984375, -4.84521484375, -4.626220703125, -4.4072265625, -4.188232421875, -3.96923828125, -3.750244140625, -3.53125, -3.312255859375, -3.09326171875, -2.874267578125, -2.6552734375, -2.436279296875, -2.21728515625, -1.998291015625, -1.779296875, -1.560302734375, -1.34130859375, -1.122314453125, -0.9033203125, -0.684326171875, -0.46533203125, -0.246337890625, -0.02734375, 0.191650390625, 0.41064453125, 0.629638671875, 0.8486328125, 1.067626953125, 1.28662109375, 1.505615234375, 1.724609375, 1.943603515625, 2.16259765625, 2.381591796875, 2.6005859375, 2.819580078125, 3.03857421875, 3.257568359375, 3.4765625, 3.695556640625, 3.91455078125, 4.133544921875, 4.3525390625, 4.571533203125, 4.79052734375, 5.009521484375, 5.228515625, 5.447509765625, 5.66650390625, 5.885498046875, 6.1044921875, 6.323486328125, 6.54248046875, 6.761474609375, 6.98046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 6.0, 6.0, 5.0, 7.0, 10.0, 14.0, 9.0, 11.0, 22.0, 28.0, 18.0, 28.0, 30.0, 43.0, 31.0, 35.0, 33.0, 63.0, 56.0, 156.0, 1752.0, 205.0, 62.0, 48.0, 50.0, 36.0, 44.0, 32.0, 30.0, 36.0, 25.0, 21.0, 20.0, 18.0, 15.0, 10.0, 6.0, 7.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.375, -23.66943359375, -22.9638671875, -22.25830078125, -21.552734375, -20.84716796875, -20.1416015625, -19.43603515625, -18.73046875, -18.02490234375, -17.3193359375, -16.61376953125, -15.908203125, -15.20263671875, -14.4970703125, -13.79150390625, -13.0859375, -12.38037109375, -11.6748046875, -10.96923828125, -10.263671875, -9.55810546875, -8.8525390625, -8.14697265625, -7.44140625, -6.73583984375, -6.0302734375, -5.32470703125, -4.619140625, -3.91357421875, -3.2080078125, -2.50244140625, -1.796875, -1.09130859375, -0.3857421875, 0.31982421875, 1.025390625, 1.73095703125, 2.4365234375, 3.14208984375, 3.84765625, 4.55322265625, 5.2587890625, 5.96435546875, 6.669921875, 7.37548828125, 8.0810546875, 8.78662109375, 9.4921875, 10.19775390625, 10.9033203125, 11.60888671875, 12.314453125, 13.02001953125, 13.7255859375, 14.43115234375, 15.13671875, 15.84228515625, 16.5478515625, 17.25341796875, 17.958984375, 18.66455078125, 19.3701171875, 20.07568359375, 20.78125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 14.0, 11.0, 15.0, 23.0, 28.0, 48.0, 49.0, 76.0, 109.0, 163.0, 228.0, 365.0, 807.0, 8967.0, 3119899.0, 12804.0, 912.0, 390.0, 230.0, 150.0, 106.0, 75.0, 49.0, 54.0, 21.0, 17.0, 18.0, 16.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.8125, -69.84716796875, -67.8818359375, -65.91650390625, -63.951171875, -61.98583984375, -60.0205078125, -58.05517578125, -56.08984375, -54.12451171875, -52.1591796875, -50.19384765625, -48.228515625, -46.26318359375, -44.2978515625, -42.33251953125, -40.3671875, -38.40185546875, -36.4365234375, -34.47119140625, -32.505859375, -30.54052734375, -28.5751953125, -26.60986328125, -24.64453125, -22.67919921875, -20.7138671875, -18.74853515625, -16.783203125, -14.81787109375, -12.8525390625, -10.88720703125, -8.921875, -6.95654296875, -4.9912109375, -3.02587890625, -1.060546875, 0.90478515625, 2.8701171875, 4.83544921875, 6.80078125, 8.76611328125, 10.7314453125, 12.69677734375, 14.662109375, 16.62744140625, 18.5927734375, 20.55810546875, 22.5234375, 24.48876953125, 26.4541015625, 28.41943359375, 30.384765625, 32.35009765625, 34.3154296875, 36.28076171875, 38.24609375, 40.21142578125, 42.1767578125, 44.14208984375, 46.107421875, 48.07275390625, 50.0380859375, 52.00341796875, 53.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 114.0, 410.0, 370.0, 98.0, 12.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.324606895446777, -10.261812210083008, -8.199018478393555, -6.136223793029785, -4.073429107666016, -2.010634422302246, 0.05215930938720703, 2.1149539947509766, 4.177748680114746, 6.240543365478516, 8.303337097167969, 10.366131782531738, 12.428926467895508, 14.491721153259277, 16.554515838623047, 18.6173095703125, 20.680103302001953, 22.742897033691406, 24.805692672729492, 26.868486404418945, 28.93128204345703, 30.994075775146484, 33.05686950683594, 35.11966323852539, 37.18246078491211, 39.24525451660156, 41.308048248291016, 43.37084197998047, 45.43363952636719, 47.49643325805664, 49.559226989746094, 51.62202072143555, 53.68482208251953, 55.747615814208984, 57.81040954589844, 59.873207092285156, 61.93600082397461, 63.99879455566406, 66.06158447265625, 68.12438201904297, 70.18717956542969, 72.2499771118164, 74.3127670288086, 76.37556457519531, 78.4383544921875, 80.50115203857422, 82.56394958496094, 84.62673950195312, 86.68952941894531, 88.75232696533203, 90.81511688232422, 92.87791442871094, 94.94070434570312, 97.00350189208984, 99.06629943847656, 101.12908935546875, 103.19188690185547, 105.25468444824219, 107.31747436523438, 109.3802719116211, 111.44306182861328, 113.505859375, 115.56864929199219, 117.6314468383789, 119.69424438476562]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 4.0, 9.0, 8.0, 20.0, 15.0, 16.0, 26.0, 22.0, 24.0, 27.0, 33.0, 35.0, 35.0, 31.0, 32.0, 46.0, 38.0, 44.0, 41.0, 37.0, 44.0, 39.0, 34.0, 38.0, 30.0, 27.0, 35.0, 28.0, 19.0, 23.0, 15.0, 16.0, 18.0, 13.0, 8.0, 9.0, 6.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-56.34214782714844, -54.72157669067383, -53.10100173950195, -51.480430603027344, -49.85985565185547, -48.23928451538086, -46.61871337890625, -44.998138427734375, -43.3775634765625, -41.75699234008789, -40.136417388916016, -38.515846252441406, -36.89527130126953, -35.27470016479492, -33.65412902832031, -32.03355407714844, -30.412982940673828, -28.792409896850586, -27.171836853027344, -25.551265716552734, -23.93069076538086, -22.31011962890625, -20.689546585083008, -19.068973541259766, -17.448400497436523, -15.827827453613281, -14.207254409790039, -12.586682319641113, -10.966109275817871, -9.345536231994629, -7.724964141845703, -6.104391098022461, -4.483818054199219, -2.8632452487945557, -1.2426724433898926, 0.3779001235961914, 1.9984731674194336, 3.619046211242676, 5.239618301391602, 6.860191345214844, 8.480764389038086, 10.101337432861328, 11.72191047668457, 13.342482566833496, 14.963055610656738, 16.583629608154297, 18.204200744628906, 19.82477378845215, 21.44534683227539, 23.065919876098633, 24.686492919921875, 26.307064056396484, 27.92763900756836, 29.54821014404297, 31.16878318786621, 32.78935623168945, 34.40992736816406, 36.03049850463867, 37.65107345581055, 39.271644592285156, 40.89221954345703, 42.51279067993164, 44.13336181640625, 45.753936767578125, 47.37451171875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 21.0, 15.0, 18.0, 18.0, 18.0, 24.0, 30.0, 35.0, 38.0, 38.0, 47.0, 45.0, 44.0, 36.0, 45.0, 48.0, 51.0, 46.0, 46.0, 40.0, 41.0, 39.0, 31.0, 24.0, 22.0, 27.0, 14.0, 15.0, 15.0, 9.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.775146484375, -7.53466796875, -7.294189453125, -7.0537109375, -6.813232421875, -6.57275390625, -6.332275390625, -6.091796875, -5.851318359375, -5.61083984375, -5.370361328125, -5.1298828125, -4.889404296875, -4.64892578125, -4.408447265625, -4.16796875, -3.927490234375, -3.68701171875, -3.446533203125, -3.2060546875, -2.965576171875, -2.72509765625, -2.484619140625, -2.244140625, -2.003662109375, -1.76318359375, -1.522705078125, -1.2822265625, -1.041748046875, -0.80126953125, -0.560791015625, -0.3203125, -0.079833984375, 0.16064453125, 0.401123046875, 0.6416015625, 0.882080078125, 1.12255859375, 1.363037109375, 1.603515625, 1.843994140625, 2.08447265625, 2.324951171875, 2.5654296875, 2.805908203125, 3.04638671875, 3.286865234375, 3.52734375, 3.767822265625, 4.00830078125, 4.248779296875, 4.4892578125, 4.729736328125, 4.97021484375, 5.210693359375, 5.451171875, 5.691650390625, 5.93212890625, 6.172607421875, 6.4130859375, 6.653564453125, 6.89404296875, 7.134521484375, 7.375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 9.0, 7.0, 10.0, 18.0, 19.0, 24.0, 37.0, 34.0, 43.0, 51.0, 77.0, 109.0, 150.0, 235.0, 398.0, 974.0, 3040.0, 15620.0, 230531.0, 2642983.0, 1226068.0, 63813.0, 6686.0, 1699.0, 662.0, 294.0, 177.0, 107.0, 82.0, 64.0, 51.0, 49.0, 31.0, 23.0, 30.0, 15.0, 9.0, 10.0, 5.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.158203125, -16.58203125, -16.005859375, -15.4296875, -14.853515625, -14.27734375, -13.701171875, -13.125, -12.548828125, -11.97265625, -11.396484375, -10.8203125, -10.244140625, -9.66796875, -9.091796875, -8.515625, -7.939453125, -7.36328125, -6.787109375, -6.2109375, -5.634765625, -5.05859375, -4.482421875, -3.90625, -3.330078125, -2.75390625, -2.177734375, -1.6015625, -1.025390625, -0.44921875, 0.126953125, 0.703125, 1.279296875, 1.85546875, 2.431640625, 3.0078125, 3.583984375, 4.16015625, 4.736328125, 5.3125, 5.888671875, 6.46484375, 7.041015625, 7.6171875, 8.193359375, 8.76953125, 9.345703125, 9.921875, 10.498046875, 11.07421875, 11.650390625, 12.2265625, 12.802734375, 13.37890625, 13.955078125, 14.53125, 15.107421875, 15.68359375, 16.259765625, 16.8359375, 17.412109375, 17.98828125, 18.564453125, 19.140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 7.0, 14.0, 19.0, 11.0, 37.0, 36.0, 64.0, 78.0, 98.0, 137.0, 205.0, 274.0, 406.0, 453.0, 504.0, 454.0, 379.0, 254.0, 176.0, 131.0, 94.0, 65.0, 43.0, 41.0, 23.0, 22.0, 14.0, 10.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.648193359375, -16.20263671875, -15.757080078125, -15.3115234375, -14.865966796875, -14.42041015625, -13.974853515625, -13.529296875, -13.083740234375, -12.63818359375, -12.192626953125, -11.7470703125, -11.301513671875, -10.85595703125, -10.410400390625, -9.96484375, -9.519287109375, -9.07373046875, -8.628173828125, -8.1826171875, -7.737060546875, -7.29150390625, -6.845947265625, -6.400390625, -5.954833984375, -5.50927734375, -5.063720703125, -4.6181640625, -4.172607421875, -3.72705078125, -3.281494140625, -2.8359375, -2.390380859375, -1.94482421875, -1.499267578125, -1.0537109375, -0.608154296875, -0.16259765625, 0.282958984375, 0.728515625, 1.174072265625, 1.61962890625, 2.065185546875, 2.5107421875, 2.956298828125, 3.40185546875, 3.847412109375, 4.29296875, 4.738525390625, 5.18408203125, 5.629638671875, 6.0751953125, 6.520751953125, 6.96630859375, 7.411865234375, 7.857421875, 8.302978515625, 8.74853515625, 9.194091796875, 9.6396484375, 10.085205078125, 10.53076171875, 10.976318359375, 11.421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 22.0, 24.0, 31.0, 39.0, 53.0, 59.0, 87.0, 119.0, 131.0, 216.0, 258.0, 397.0, 746.0, 3867.0, 1024166.0, 3154203.0, 7396.0, 873.0, 443.0, 278.0, 191.0, 155.0, 114.0, 84.0, 63.0, 59.0, 44.0, 23.0, 31.0, 31.0, 9.0, 14.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -50.54052734375, -48.6748046875, -46.80908203125, -44.943359375, -43.07763671875, -41.2119140625, -39.34619140625, -37.48046875, -35.61474609375, -33.7490234375, -31.88330078125, -30.017578125, -28.15185546875, -26.2861328125, -24.42041015625, -22.5546875, -20.68896484375, -18.8232421875, -16.95751953125, -15.091796875, -13.22607421875, -11.3603515625, -9.49462890625, -7.62890625, -5.76318359375, -3.8974609375, -2.03173828125, -0.166015625, 1.69970703125, 3.5654296875, 5.43115234375, 7.296875, 9.16259765625, 11.0283203125, 12.89404296875, 14.759765625, 16.62548828125, 18.4912109375, 20.35693359375, 22.22265625, 24.08837890625, 25.9541015625, 27.81982421875, 29.685546875, 31.55126953125, 33.4169921875, 35.28271484375, 37.1484375, 39.01416015625, 40.8798828125, 42.74560546875, 44.611328125, 46.47705078125, 48.3427734375, 50.20849609375, 52.07421875, 53.93994140625, 55.8056640625, 57.67138671875, 59.537109375, 61.40283203125, 63.2685546875, 65.13427734375, 67.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 10.0, 13.0, 31.0, 48.0, 62.0, 108.0, 123.0, 123.0, 128.0, 115.0, 93.0, 64.0, 39.0, 30.0, 8.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.71900177001953, -70.8021469116211, -68.88528442382812, -66.96842956542969, -65.05157470703125, -63.13471221923828, -61.217857360839844, -59.30099868774414, -57.38414001464844, -55.467281341552734, -53.55042266845703, -51.633567810058594, -49.71670913696289, -47.79985046386719, -45.88299560546875, -43.96613693237305, -42.049278259277344, -40.13241958618164, -38.21556091308594, -36.2987060546875, -34.3818473815918, -32.464988708496094, -30.548131942749023, -28.631275177001953, -26.71441650390625, -24.797557830810547, -22.880701065063477, -20.963844299316406, -19.046985626220703, -17.130126953125, -15.21327018737793, -13.296412467956543, -11.379558563232422, -9.462700843811035, -7.545843124389648, -5.628985404968262, -3.712127685546875, -1.7952699661254883, 0.12158775329589844, 2.038445472717285, 3.955303192138672, 5.872160911560059, 7.789018630981445, 9.705876350402832, 11.622734069824219, 13.539591789245605, 15.456449508666992, 17.373306274414062, 19.290164947509766, 21.20702362060547, 23.12388038635254, 25.04073715209961, 26.957595825195312, 28.874454498291016, 30.791311264038086, 32.708168029785156, 34.62502670288086, 36.54188537597656, 38.458740234375, 40.3755989074707, 42.292457580566406, 44.20931625366211, 46.12617492675781, 48.04302978515625, 49.95988845825195]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 4.0, 20.0, 14.0, 18.0, 15.0, 22.0, 26.0, 17.0, 26.0, 25.0, 28.0, 31.0, 42.0, 21.0, 25.0, 42.0, 39.0, 43.0, 34.0, 44.0, 45.0, 42.0, 32.0, 29.0, 34.0, 34.0, 26.0, 19.0, 26.0, 21.0, 21.0, 9.0, 22.0, 23.0, 16.0, 7.0, 10.0, 9.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-41.55791473388672, -40.33024978637695, -39.10258102416992, -37.874916076660156, -36.647247314453125, -35.41958236694336, -34.19191360473633, -32.96424865722656, -31.73657989501953, -30.508913040161133, -29.281246185302734, -28.053579330444336, -26.825912475585938, -25.59824562072754, -24.37057876586914, -23.142913818359375, -21.915246963500977, -20.687580108642578, -19.45991325378418, -18.23224639892578, -17.004579544067383, -15.776912689208984, -14.549246788024902, -13.321579933166504, -12.093913078308105, -10.866246223449707, -9.638579368591309, -8.410913467407227, -7.18324613571167, -5.9555792808532715, -4.727912902832031, -3.500246047973633, -2.2725791931152344, -1.0449124574661255, 0.1827542781829834, 1.4104208946228027, 2.638087749481201, 3.8657546043395996, 5.09342098236084, 6.321087837219238, 7.548754692077637, 8.776421546936035, 10.004088401794434, 11.231754302978516, 12.459421157836914, 13.687088012695312, 14.914754867553711, 16.14242172241211, 17.370088577270508, 18.597755432128906, 19.825422286987305, 21.053089141845703, 22.2807559967041, 23.5084228515625, 24.736087799072266, 25.963756561279297, 27.191421508789062, 28.41908836364746, 29.64675521850586, 30.874422073364258, 32.102088928222656, 33.32975387573242, 34.55742263793945, 35.78508758544922, 37.01275634765625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 9.0, 9.0, 9.0, 14.0, 25.0, 22.0, 18.0, 22.0, 27.0, 26.0, 33.0, 30.0, 35.0, 35.0, 40.0, 42.0, 58.0, 55.0, 46.0, 56.0, 44.0, 30.0, 41.0, 34.0, 39.0, 30.0, 30.0, 22.0, 23.0, 21.0, 15.0, 11.0, 9.0, 7.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.74609375, -7.51507568359375, -7.2840576171875, -7.05303955078125, -6.822021484375, -6.59100341796875, -6.3599853515625, -6.12896728515625, -5.89794921875, -5.66693115234375, -5.4359130859375, -5.20489501953125, -4.973876953125, -4.74285888671875, -4.5118408203125, -4.28082275390625, -4.0498046875, -3.81878662109375, -3.5877685546875, -3.35675048828125, -3.125732421875, -2.89471435546875, -2.6636962890625, -2.43267822265625, -2.20166015625, -1.97064208984375, -1.7396240234375, -1.50860595703125, -1.277587890625, -1.04656982421875, -0.8155517578125, -0.58453369140625, -0.353515625, -0.12249755859375, 0.1085205078125, 0.33953857421875, 0.570556640625, 0.80157470703125, 1.0325927734375, 1.26361083984375, 1.49462890625, 1.72564697265625, 1.9566650390625, 2.18768310546875, 2.418701171875, 2.64971923828125, 2.8807373046875, 3.11175537109375, 3.3427734375, 3.57379150390625, 3.8048095703125, 4.03582763671875, 4.266845703125, 4.49786376953125, 4.7288818359375, 4.95989990234375, 5.19091796875, 5.42193603515625, 5.6529541015625, 5.88397216796875, 6.114990234375, 6.34600830078125, 6.5770263671875, 6.80804443359375, 7.0390625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 14.0, 19.0, 22.0, 21.0, 38.0, 57.0, 76.0, 111.0, 194.0, 282.0, 410.0, 568.0, 869.0, 1433.0, 2236.0, 3437.0, 5385.0, 8643.0, 14493.0, 24841.0, 44640.0, 84580.0, 170664.0, 291179.0, 186523.0, 92193.0, 48125.0, 26604.0, 15457.0, 9315.0, 5797.0, 3691.0, 2255.0, 1458.0, 975.0, 658.0, 448.0, 283.0, 166.0, 134.0, 87.0, 52.0, 43.0, 26.0, 19.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.1220703125, -1.0886383056640625, -1.055206298828125, -1.0217742919921875, -0.98834228515625, -0.9549102783203125, -0.921478271484375, -0.8880462646484375, -0.8546142578125, -0.8211822509765625, -0.787750244140625, -0.7543182373046875, -0.72088623046875, -0.6874542236328125, -0.654022216796875, -0.6205902099609375, -0.587158203125, -0.5537261962890625, -0.520294189453125, -0.4868621826171875, -0.45343017578125, -0.4199981689453125, -0.386566162109375, -0.3531341552734375, -0.3197021484375, -0.2862701416015625, -0.252838134765625, -0.2194061279296875, -0.18597412109375, -0.1525421142578125, -0.119110107421875, -0.0856781005859375, -0.05224609375, -0.0188140869140625, 0.014617919921875, 0.0480499267578125, 0.08148193359375, 0.1149139404296875, 0.148345947265625, 0.1817779541015625, 0.2152099609375, 0.2486419677734375, 0.282073974609375, 0.3155059814453125, 0.34893798828125, 0.3823699951171875, 0.415802001953125, 0.4492340087890625, 0.482666015625, 0.5160980224609375, 0.549530029296875, 0.5829620361328125, 0.61639404296875, 0.6498260498046875, 0.683258056640625, 0.7166900634765625, 0.7501220703125, 0.7835540771484375, 0.816986083984375, 0.8504180908203125, 0.88385009765625, 0.9172821044921875, 0.950714111328125, 0.9841461181640625, 1.017578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 2.0, 9.0, 8.0, 9.0, 8.0, 16.0, 10.0, 13.0, 21.0, 27.0, 32.0, 29.0, 27.0, 20.0, 32.0, 37.0, 42.0, 44.0, 30.0, 45.0, 1064.0, 44.0, 35.0, 28.0, 47.0, 34.0, 38.0, 28.0, 25.0, 30.0, 22.0, 30.0, 16.0, 21.0, 18.0, 17.0, 12.0, 6.0, 7.0, 12.0, 4.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.90496826171875, -3.7786865234375, -3.65240478515625, -3.526123046875, -3.39984130859375, -3.2735595703125, -3.14727783203125, -3.02099609375, -2.89471435546875, -2.7684326171875, -2.64215087890625, -2.515869140625, -2.38958740234375, -2.2633056640625, -2.13702392578125, -2.0107421875, -1.88446044921875, -1.7581787109375, -1.63189697265625, -1.505615234375, -1.37933349609375, -1.2530517578125, -1.12677001953125, -1.00048828125, -0.87420654296875, -0.7479248046875, -0.62164306640625, -0.495361328125, -0.36907958984375, -0.2427978515625, -0.11651611328125, 0.009765625, 0.13604736328125, 0.2623291015625, 0.38861083984375, 0.514892578125, 0.64117431640625, 0.7674560546875, 0.89373779296875, 1.02001953125, 1.14630126953125, 1.2725830078125, 1.39886474609375, 1.525146484375, 1.65142822265625, 1.7777099609375, 1.90399169921875, 2.0302734375, 2.15655517578125, 2.2828369140625, 2.40911865234375, 2.535400390625, 2.66168212890625, 2.7879638671875, 2.91424560546875, 3.04052734375, 3.16680908203125, 3.2930908203125, 3.41937255859375, 3.545654296875, 3.67193603515625, 3.7982177734375, 3.92449951171875, 4.05078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 10.0, 13.0, 17.0, 25.0, 35.0, 47.0, 86.0, 107.0, 137.0, 187.0, 281.0, 401.0, 506.0, 710.0, 1007.0, 1494.0, 2060.0, 3047.0, 4352.0, 6494.0, 10115.0, 14822.0, 23880.0, 37974.0, 63292.0, 110948.0, 196398.0, 1275546.0, 138147.0, 76685.0, 45870.0, 28236.0, 17791.0, 11792.0, 7757.0, 5219.0, 3483.0, 2401.0, 1717.0, 1187.0, 834.0, 596.0, 407.0, 311.0, 208.0, 156.0, 115.0, 65.0, 54.0, 39.0, 22.0, 20.0, 15.0, 8.0, 6.0, 3.0, 4.0, 1.0], "bins": [-0.79052734375, -0.7667083740234375, -0.742889404296875, -0.7190704345703125, -0.69525146484375, -0.6714324951171875, -0.647613525390625, -0.6237945556640625, -0.5999755859375, -0.5761566162109375, -0.552337646484375, -0.5285186767578125, -0.50469970703125, -0.4808807373046875, -0.457061767578125, -0.4332427978515625, -0.409423828125, -0.3856048583984375, -0.361785888671875, -0.3379669189453125, -0.31414794921875, -0.2903289794921875, -0.266510009765625, -0.2426910400390625, -0.2188720703125, -0.1950531005859375, -0.171234130859375, -0.1474151611328125, -0.12359619140625, -0.0997772216796875, -0.075958251953125, -0.0521392822265625, -0.0283203125, -0.0045013427734375, 0.019317626953125, 0.0431365966796875, 0.06695556640625, 0.0907745361328125, 0.114593505859375, 0.1384124755859375, 0.1622314453125, 0.1860504150390625, 0.209869384765625, 0.2336883544921875, 0.25750732421875, 0.2813262939453125, 0.305145263671875, 0.3289642333984375, 0.352783203125, 0.3766021728515625, 0.400421142578125, 0.4242401123046875, 0.44805908203125, 0.4718780517578125, 0.495697021484375, 0.5195159912109375, 0.5433349609375, 0.5671539306640625, 0.590972900390625, 0.6147918701171875, 0.63861083984375, 0.6624298095703125, 0.686248779296875, 0.7100677490234375, 0.73388671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 5.0, 13.0, 11.0, 17.0, 19.0, 19.0, 29.0, 27.0, 23.0, 30.0, 26.0, 42.0, 33.0, 52.0, 55.0, 55.0, 47.0, 58.0, 51.0, 38.0, 44.0, 37.0, 27.0, 38.0, 25.0, 19.0, 23.0, 14.0, 15.0, 11.0, 7.0, 5.0, 14.0, 9.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0017375946044921875, -0.0016822516918182373, -0.0016269087791442871, -0.001571565866470337, -0.0015162229537963867, -0.0014608800411224365, -0.0014055371284484863, -0.0013501942157745361, -0.001294851303100586, -0.0012395083904266357, -0.0011841654777526855, -0.0011288225650787354, -0.0010734796524047852, -0.001018136739730835, -0.0009627938270568848, -0.0009074509143829346, -0.0008521080017089844, -0.0007967650890350342, -0.000741422176361084, -0.0006860792636871338, -0.0006307363510131836, -0.0005753934383392334, -0.0005200505256652832, -0.000464707612991333, -0.0004093647003173828, -0.0003540217876434326, -0.0002986788749694824, -0.00024333596229553223, -0.00018799304962158203, -0.00013265013694763184, -7.730722427368164e-05, -2.1964311599731445e-05, 3.337860107421875e-05, 8.872151374816895e-05, 0.00014406442642211914, 0.00019940733909606934, 0.00025475025177001953, 0.0003100931644439697, 0.0003654360771179199, 0.0004207789897918701, 0.0004761219024658203, 0.0005314648151397705, 0.0005868077278137207, 0.0006421506404876709, 0.0006974935531616211, 0.0007528364658355713, 0.0008081793785095215, 0.0008635222911834717, 0.0009188652038574219, 0.0009742081165313721, 0.0010295510292053223, 0.0010848939418792725, 0.0011402368545532227, 0.0011955797672271729, 0.001250922679901123, 0.0013062655925750732, 0.0013616085052490234, 0.0014169514179229736, 0.0014722943305969238, 0.001527637243270874, 0.0015829801559448242, 0.0016383230686187744, 0.0016936659812927246, 0.0017490088939666748, 0.001804351806640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 10.0, 8.0, 10.0, 20.0, 14.0, 20.0, 21.0, 33.0, 36.0, 56.0, 55.0, 82.0, 101.0, 221.0, 527.0, 2313.0, 999491.0, 43670.0, 911.0, 333.0, 158.0, 88.0, 71.0, 58.0, 46.0, 36.0, 37.0, 22.0, 16.0, 19.0, 12.0, 11.0, 9.0, 2.0, 4.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044525146484375, -0.043076515197753906, -0.04162788391113281, -0.04017925262451172, -0.038730621337890625, -0.03728199005126953, -0.03583335876464844, -0.034384727478027344, -0.03293609619140625, -0.031487464904785156, -0.030038833618164062, -0.02859020233154297, -0.027141571044921875, -0.02569293975830078, -0.024244308471679688, -0.022795677185058594, -0.0213470458984375, -0.019898414611816406, -0.018449783325195312, -0.01700115203857422, -0.015552520751953125, -0.014103889465332031, -0.012655258178710938, -0.011206626892089844, -0.00975799560546875, -0.008309364318847656, -0.0068607330322265625, -0.005412101745605469, -0.003963470458984375, -0.0025148391723632812, -0.0010662078857421875, 0.00038242340087890625, 0.0018310546875, 0.0032796859741210938, 0.0047283172607421875, 0.006176948547363281, 0.007625579833984375, 0.009074211120605469, 0.010522842407226562, 0.011971473693847656, 0.01342010498046875, 0.014868736267089844, 0.016317367553710938, 0.01776599884033203, 0.019214630126953125, 0.02066326141357422, 0.022111892700195312, 0.023560523986816406, 0.0250091552734375, 0.026457786560058594, 0.027906417846679688, 0.02935504913330078, 0.030803680419921875, 0.03225231170654297, 0.03370094299316406, 0.035149574279785156, 0.03659820556640625, 0.038046836853027344, 0.03949546813964844, 0.04094409942626953, 0.042392730712890625, 0.04384136199951172, 0.04528999328613281, 0.046738624572753906, 0.048187255859375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 49.0, 532.0, 409.0, 24.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007347395294345915, -0.0004809266538359225, -0.00022711377823725343, 2.6699097361415625e-05, 0.0002805119729600847, 0.0005343248485587537, 0.0007881377241574228, 0.0010419506579637527, 0.0012957635335624218, 0.0015495764091610909, 0.00180338928475976, 0.002057202160358429, 0.002311015035957098, 0.002564827911555767, 0.002818640787154436, 0.003072453662753105, 0.003326266538351774, 0.0035800794139504433, 0.0038338922895491123, 0.004087705165147781, 0.00434151804074645, 0.0045953309163451195, 0.0048491437919437885, 0.005102956667542458, 0.005356769543141127, 0.005610582418739796, 0.005864395294338465, 0.006118208169937134, 0.006372021045535803, 0.006625833921134472, 0.006879646796733141, 0.00713345967233181, 0.007387273013591766, 0.007641085889190435, 0.007894898764789104, 0.008148711174726486, 0.008402524515986443, 0.008656337857246399, 0.00891015026718378, 0.009163962677121162, 0.009417776018381119, 0.009671589359641075, 0.009925401769578457, 0.010179214179515839, 0.010433027520775795, 0.010686840862035751, 0.010940653271973133, 0.011194465681910515, 0.011448279023170471, 0.011702092364430428, 0.01195590477436781, 0.012209717184305191, 0.012463530525565147, 0.012717343866825104, 0.012971156276762486, 0.013224968686699867, 0.013478782027959824, 0.01373259536921978, 0.013986407779157162, 0.014240220189094543, 0.0144940335303545, 0.014747846871614456, 0.015001659281551838, 0.01525547169148922, 0.015509285032749176]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 13.0, 9.0, 13.0, 13.0, 8.0, 16.0, 16.0, 25.0, 21.0, 29.0, 22.0, 35.0, 22.0, 30.0, 37.0, 38.0, 50.0, 55.0, 38.0, 33.0, 44.0, 39.0, 41.0, 44.0, 25.0, 28.0, 35.0, 33.0, 35.0, 26.0, 20.0, 19.0, 15.0, 6.0, 11.0, 9.0, 9.0, 4.0, 8.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011382102966308594, -0.0011033406481146812, -0.0010684709995985031, -0.001033601351082325, -0.0009987317025661469, -0.0009638620540499687, -0.0009289924055337906, -0.0008941227570176125, -0.0008592531085014343, -0.0008243834599852562, -0.0007895138114690781, -0.0007546441629528999, -0.0007197745144367218, -0.0006849048659205437, -0.0006500352174043655, -0.0006151655688881874, -0.0005802959203720093, -0.0005454262718558311, -0.000510556623339653, -0.0004756869748234749, -0.00044081732630729675, -0.0004059476777911186, -0.0003710780292749405, -0.00033620838075876236, -0.00030133873224258423, -0.0002664690837264061, -0.00023159943521022797, -0.00019672978669404984, -0.0001618601381778717, -0.00012699048966169357, -9.212084114551544e-05, -5.725119262933731e-05, -2.238154411315918e-05, 1.2488104403018951e-05, 4.735775291919708e-05, 8.222740143537521e-05, 0.00011709704995155334, 0.00015196669846773148, 0.0001868363469839096, 0.00022170599550008774, 0.00025657564401626587, 0.000291445292532444, 0.00032631494104862213, 0.00036118458956480026, 0.0003960542380809784, 0.0004309238865971565, 0.00046579353511333466, 0.0005006631836295128, 0.0005355328321456909, 0.000570402480661869, 0.0006052721291780472, 0.0006401417776942253, 0.0006750114262104034, 0.0007098810747265816, 0.0007447507232427597, 0.0007796203717589378, 0.000814490020275116, 0.0008493596687912941, 0.0008842293173074722, 0.0009190989658236504, 0.0009539686143398285, 0.0009888382628560066, 0.0010237079113721848, 0.0010585775598883629, 0.001093447208404541]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 9.0, 9.0, 9.0, 14.0, 25.0, 22.0, 18.0, 22.0, 27.0, 26.0, 33.0, 30.0, 35.0, 35.0, 40.0, 42.0, 58.0, 55.0, 46.0, 56.0, 44.0, 30.0, 41.0, 34.0, 39.0, 30.0, 30.0, 22.0, 22.0, 22.0, 15.0, 11.0, 9.0, 7.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.74609375, -7.51507568359375, -7.2840576171875, -7.05303955078125, -6.822021484375, -6.59100341796875, -6.3599853515625, -6.12896728515625, -5.89794921875, -5.66693115234375, -5.4359130859375, -5.20489501953125, -4.973876953125, -4.74285888671875, -4.5118408203125, -4.28082275390625, -4.0498046875, -3.81878662109375, -3.5877685546875, -3.35675048828125, -3.125732421875, -2.89471435546875, -2.6636962890625, -2.43267822265625, -2.20166015625, -1.97064208984375, -1.7396240234375, -1.50860595703125, -1.277587890625, -1.04656982421875, -0.8155517578125, -0.58453369140625, -0.353515625, -0.12249755859375, 0.1085205078125, 0.33953857421875, 0.570556640625, 0.80157470703125, 1.0325927734375, 1.26361083984375, 1.49462890625, 1.72564697265625, 1.9566650390625, 2.18768310546875, 2.418701171875, 2.64971923828125, 2.8807373046875, 3.11175537109375, 3.3427734375, 3.57379150390625, 3.8048095703125, 4.03582763671875, 4.266845703125, 4.49786376953125, 4.7288818359375, 4.95989990234375, 5.19091796875, 5.42193603515625, 5.6529541015625, 5.88397216796875, 6.114990234375, 6.34600830078125, 6.5770263671875, 6.80804443359375, 7.0390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 10.0, 19.0, 26.0, 49.0, 67.0, 92.0, 146.0, 215.0, 320.0, 561.0, 1019.0, 1716.0, 3199.0, 6357.0, 12710.0, 27131.0, 61645.0, 159639.0, 410556.0, 217347.0, 79261.0, 34139.0, 15687.0, 7683.0, 4015.0, 2014.0, 1126.0, 659.0, 388.0, 272.0, 150.0, 102.0, 70.0, 47.0, 43.0, 19.0, 14.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.3515625, -5.201416015625, -5.05126953125, -4.901123046875, -4.7509765625, -4.600830078125, -4.45068359375, -4.300537109375, -4.150390625, -4.000244140625, -3.85009765625, -3.699951171875, -3.5498046875, -3.399658203125, -3.24951171875, -3.099365234375, -2.94921875, -2.799072265625, -2.64892578125, -2.498779296875, -2.3486328125, -2.198486328125, -2.04833984375, -1.898193359375, -1.748046875, -1.597900390625, -1.44775390625, -1.297607421875, -1.1474609375, -0.997314453125, -0.84716796875, -0.697021484375, -0.546875, -0.396728515625, -0.24658203125, -0.096435546875, 0.0537109375, 0.203857421875, 0.35400390625, 0.504150390625, 0.654296875, 0.804443359375, 0.95458984375, 1.104736328125, 1.2548828125, 1.405029296875, 1.55517578125, 1.705322265625, 1.85546875, 2.005615234375, 2.15576171875, 2.305908203125, 2.4560546875, 2.606201171875, 2.75634765625, 2.906494140625, 3.056640625, 3.206787109375, 3.35693359375, 3.507080078125, 3.6572265625, 3.807373046875, 3.95751953125, 4.107666015625, 4.2578125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 10.0, 4.0, 12.0, 12.0, 13.0, 16.0, 12.0, 16.0, 22.0, 26.0, 27.0, 35.0, 28.0, 35.0, 51.0, 43.0, 63.0, 98.0, 262.0, 1576.0, 170.0, 91.0, 56.0, 42.0, 44.0, 39.0, 37.0, 26.0, 27.0, 17.0, 21.0, 20.0, 28.0, 13.0, 12.0, 9.0, 8.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.34375, -24.62646484375, -23.9091796875, -23.19189453125, -22.474609375, -21.75732421875, -21.0400390625, -20.32275390625, -19.60546875, -18.88818359375, -18.1708984375, -17.45361328125, -16.736328125, -16.01904296875, -15.3017578125, -14.58447265625, -13.8671875, -13.14990234375, -12.4326171875, -11.71533203125, -10.998046875, -10.28076171875, -9.5634765625, -8.84619140625, -8.12890625, -7.41162109375, -6.6943359375, -5.97705078125, -5.259765625, -4.54248046875, -3.8251953125, -3.10791015625, -2.390625, -1.67333984375, -0.9560546875, -0.23876953125, 0.478515625, 1.19580078125, 1.9130859375, 2.63037109375, 3.34765625, 4.06494140625, 4.7822265625, 5.49951171875, 6.216796875, 6.93408203125, 7.6513671875, 8.36865234375, 9.0859375, 9.80322265625, 10.5205078125, 11.23779296875, 11.955078125, 12.67236328125, 13.3896484375, 14.10693359375, 14.82421875, 15.54150390625, 16.2587890625, 16.97607421875, 17.693359375, 18.41064453125, 19.1279296875, 19.84521484375, 20.5625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 16.0, 7.0, 20.0, 27.0, 46.0, 52.0, 77.0, 94.0, 169.0, 258.0, 429.0, 1117.0, 73115.0, 3066024.0, 2788.0, 554.0, 295.0, 189.0, 138.0, 75.0, 56.0, 43.0, 30.0, 28.0, 18.0, 9.0, 8.0, 6.0, 6.0, 1.0, 0.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.3125, -81.7734375, -79.234375, -76.6953125, -74.15625, -71.6171875, -69.078125, -66.5390625, -64.0, -61.4609375, -58.921875, -56.3828125, -53.84375, -51.3046875, -48.765625, -46.2265625, -43.6875, -41.1484375, -38.609375, -36.0703125, -33.53125, -30.9921875, -28.453125, -25.9140625, -23.375, -20.8359375, -18.296875, -15.7578125, -13.21875, -10.6796875, -8.140625, -5.6015625, -3.0625, -0.5234375, 2.015625, 4.5546875, 7.09375, 9.6328125, 12.171875, 14.7109375, 17.25, 19.7890625, 22.328125, 24.8671875, 27.40625, 29.9453125, 32.484375, 35.0234375, 37.5625, 40.1015625, 42.640625, 45.1796875, 47.71875, 50.2578125, 52.796875, 55.3359375, 57.875, 60.4140625, 62.953125, 65.4921875, 68.03125, 70.5703125, 73.109375, 75.6484375, 78.1875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 94.0, 917.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.50545120239258, -31.873199462890625, -22.240949630737305, -12.608699798583984, -2.9764480590820312, 6.655803680419922, 16.28805160522461, 25.920307159423828, 35.552555084228516, 45.18480682373047, 54.817054748535156, 64.44931030273438, 74.08155822753906, 83.71380615234375, 93.34605407714844, 102.97831726074219, 112.61056518554688, 122.24281311035156, 131.87506103515625, 141.50732421875, 151.1395721435547, 160.77182006835938, 170.40406799316406, 180.03631591796875, 189.66856384277344, 199.30081176757812, 208.9330596923828, 218.5653076171875, 228.19757080078125, 237.82981872558594, 247.46206665039062, 257.0943298339844, 266.7265930175781, 276.3588562011719, 285.9910888671875, 295.62335205078125, 305.2555847167969, 314.8878479003906, 324.52008056640625, 334.15234375, 343.78460693359375, 353.4168701171875, 363.0491027832031, 372.6813659667969, 382.3135986328125, 391.94586181640625, 401.578125, 411.2103576660156, 420.84259033203125, 430.474853515625, 440.1070861816406, 449.7393493652344, 459.37158203125, 469.00384521484375, 478.6361083984375, 488.2683410644531, 497.9006042480469, 507.5328674316406, 517.1651000976562, 526.79736328125, 536.4296264648438, 546.0618896484375, 555.694091796875, 565.3263549804688, 574.9586181640625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 5.0, 9.0, 13.0, 14.0, 18.0, 19.0, 23.0, 35.0, 23.0, 40.0, 24.0, 32.0, 34.0, 39.0, 38.0, 49.0, 39.0, 45.0, 45.0, 51.0, 37.0, 35.0, 33.0, 31.0, 39.0, 25.0, 35.0, 33.0, 16.0, 15.0, 12.0, 15.0, 9.0, 12.0, 9.0, 11.0, 10.0, 1.0, 3.0, 9.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-57.825531005859375, -56.14991760253906, -54.474308013916016, -52.7986946105957, -51.12308120727539, -49.447471618652344, -47.77185821533203, -46.09624481201172, -44.420631408691406, -42.745018005371094, -41.06940841674805, -39.393795013427734, -37.71818161010742, -36.042572021484375, -34.36695861816406, -32.69134521484375, -31.015735626220703, -29.340124130249023, -27.66451072692871, -25.98889923095703, -24.31328582763672, -22.63767433166504, -20.96206283569336, -19.286449432373047, -17.610837936401367, -15.935225486755371, -14.259613037109375, -12.584001541137695, -10.9083890914917, -9.232776641845703, -7.557165145874023, -5.881552696228027, -4.205944061279297, -2.53033185005188, -0.8547196388244629, 0.820892333984375, 2.496504783630371, 4.172117233276367, 5.847728729248047, 7.523341178894043, 9.198953628540039, 10.874566078186035, 12.550178527832031, 14.225790023803711, 15.901402473449707, 17.577014923095703, 19.252626419067383, 20.928237915039062, 22.603851318359375, 24.279462814331055, 25.955076217651367, 27.630687713623047, 29.30630111694336, 30.98191261291504, 32.65752410888672, 34.33313751220703, 36.008750915527344, 37.684364318847656, 39.3599739074707, 41.035587310791016, 42.71120071411133, 44.386810302734375, 46.06242370605469, 47.738037109375, 49.41364669799805]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 15.0, 17.0, 19.0, 24.0, 24.0, 25.0, 22.0, 26.0, 31.0, 37.0, 27.0, 36.0, 51.0, 50.0, 52.0, 49.0, 44.0, 47.0, 42.0, 41.0, 25.0, 38.0, 39.0, 36.0, 24.0, 29.0, 20.0, 18.0, 15.0, 15.0, 7.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-8.4609375, -8.22119140625, -7.9814453125, -7.74169921875, -7.501953125, -7.26220703125, -7.0224609375, -6.78271484375, -6.54296875, -6.30322265625, -6.0634765625, -5.82373046875, -5.583984375, -5.34423828125, -5.1044921875, -4.86474609375, -4.625, -4.38525390625, -4.1455078125, -3.90576171875, -3.666015625, -3.42626953125, -3.1865234375, -2.94677734375, -2.70703125, -2.46728515625, -2.2275390625, -1.98779296875, -1.748046875, -1.50830078125, -1.2685546875, -1.02880859375, -0.7890625, -0.54931640625, -0.3095703125, -0.06982421875, 0.169921875, 0.40966796875, 0.6494140625, 0.88916015625, 1.12890625, 1.36865234375, 1.6083984375, 1.84814453125, 2.087890625, 2.32763671875, 2.5673828125, 2.80712890625, 3.046875, 3.28662109375, 3.5263671875, 3.76611328125, 4.005859375, 4.24560546875, 4.4853515625, 4.72509765625, 4.96484375, 5.20458984375, 5.4443359375, 5.68408203125, 5.923828125, 6.16357421875, 6.4033203125, 6.64306640625, 6.8828125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 7.0, 9.0, 11.0, 16.0, 16.0, 19.0, 15.0, 23.0, 33.0, 36.0, 55.0, 109.0, 154.0, 378.0, 1043.0, 3665.0, 25887.0, 994601.0, 3017218.0, 139627.0, 8278.0, 1807.0, 604.0, 229.0, 109.0, 64.0, 51.0, 33.0, 34.0, 22.0, 13.0, 13.0, 19.0, 12.0, 11.0, 4.0, 8.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.625, -22.892333984375, -22.15966796875, -21.427001953125, -20.6943359375, -19.961669921875, -19.22900390625, -18.496337890625, -17.763671875, -17.031005859375, -16.29833984375, -15.565673828125, -14.8330078125, -14.100341796875, -13.36767578125, -12.635009765625, -11.90234375, -11.169677734375, -10.43701171875, -9.704345703125, -8.9716796875, -8.239013671875, -7.50634765625, -6.773681640625, -6.041015625, -5.308349609375, -4.57568359375, -3.843017578125, -3.1103515625, -2.377685546875, -1.64501953125, -0.912353515625, -0.1796875, 0.552978515625, 1.28564453125, 2.018310546875, 2.7509765625, 3.483642578125, 4.21630859375, 4.948974609375, 5.681640625, 6.414306640625, 7.14697265625, 7.879638671875, 8.6123046875, 9.344970703125, 10.07763671875, 10.810302734375, 11.54296875, 12.275634765625, 13.00830078125, 13.740966796875, 14.4736328125, 15.206298828125, 15.93896484375, 16.671630859375, 17.404296875, 18.136962890625, 18.86962890625, 19.602294921875, 20.3349609375, 21.067626953125, 21.80029296875, 22.532958984375, 23.265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 9.0, 7.0, 19.0, 19.0, 26.0, 65.0, 112.0, 183.0, 320.0, 538.0, 733.0, 740.0, 514.0, 308.0, 182.0, 116.0, 84.0, 45.0, 21.0, 14.0, 6.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.71875, -23.041259765625, -22.36376953125, -21.686279296875, -21.0087890625, -20.331298828125, -19.65380859375, -18.976318359375, -18.298828125, -17.621337890625, -16.94384765625, -16.266357421875, -15.5888671875, -14.911376953125, -14.23388671875, -13.556396484375, -12.87890625, -12.201416015625, -11.52392578125, -10.846435546875, -10.1689453125, -9.491455078125, -8.81396484375, -8.136474609375, -7.458984375, -6.781494140625, -6.10400390625, -5.426513671875, -4.7490234375, -4.071533203125, -3.39404296875, -2.716552734375, -2.0390625, -1.361572265625, -0.68408203125, -0.006591796875, 0.6708984375, 1.348388671875, 2.02587890625, 2.703369140625, 3.380859375, 4.058349609375, 4.73583984375, 5.413330078125, 6.0908203125, 6.768310546875, 7.44580078125, 8.123291015625, 8.80078125, 9.478271484375, 10.15576171875, 10.833251953125, 11.5107421875, 12.188232421875, 12.86572265625, 13.543212890625, 14.220703125, 14.898193359375, 15.57568359375, 16.253173828125, 16.9306640625, 17.608154296875, 18.28564453125, 18.963134765625, 19.640625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 13.0, 20.0, 35.0, 44.0, 59.0, 109.0, 134.0, 201.0, 325.0, 558.0, 1591.0, 329494.0, 3856412.0, 3511.0, 724.0, 359.0, 253.0, 153.0, 93.0, 68.0, 45.0, 32.0, 15.0, 13.0, 12.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.5, -84.69140625, -81.8828125, -79.07421875, -76.265625, -73.45703125, -70.6484375, -67.83984375, -65.03125, -62.22265625, -59.4140625, -56.60546875, -53.796875, -50.98828125, -48.1796875, -45.37109375, -42.5625, -39.75390625, -36.9453125, -34.13671875, -31.328125, -28.51953125, -25.7109375, -22.90234375, -20.09375, -17.28515625, -14.4765625, -11.66796875, -8.859375, -6.05078125, -3.2421875, -0.43359375, 2.375, 5.18359375, 7.9921875, 10.80078125, 13.609375, 16.41796875, 19.2265625, 22.03515625, 24.84375, 27.65234375, 30.4609375, 33.26953125, 36.078125, 38.88671875, 41.6953125, 44.50390625, 47.3125, 50.12109375, 52.9296875, 55.73828125, 58.546875, 61.35546875, 64.1640625, 66.97265625, 69.78125, 72.58984375, 75.3984375, 78.20703125, 81.015625, 83.82421875, 86.6328125, 89.44140625, 92.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 73.0, 559.0, 359.0, 19.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.29222106933594, -91.90959167480469, -82.5269546508789, -73.14432525634766, -63.76169204711914, -54.379058837890625, -44.996429443359375, -35.613792419433594, -26.231163024902344, -16.848529815673828, -7.465898513793945, 1.9167327880859375, 11.299365997314453, 20.68199920654297, 30.06462860107422, 39.447265625, 48.82989501953125, 58.212528228759766, 67.59516143798828, 76.97779083251953, 86.36042785644531, 95.74305725097656, 105.12568664550781, 114.5083236694336, 123.89095306396484, 133.27359008789062, 142.65621948242188, 152.03884887695312, 161.42147827148438, 170.80410766601562, 180.18673706054688, 189.5693817138672, 198.95199584960938, 208.33462524414062, 217.71725463867188, 227.09988403320312, 236.48252868652344, 245.8651580810547, 255.24778747558594, 264.63043212890625, 274.0130615234375, 283.39569091796875, 292.7783203125, 302.16094970703125, 311.5435791015625, 320.92620849609375, 330.308837890625, 339.6914978027344, 349.0740966796875, 358.45672607421875, 367.83935546875, 377.22198486328125, 386.6046142578125, 395.98724365234375, 405.369873046875, 414.7525329589844, 424.1351623535156, 433.5177917480469, 442.9004211425781, 452.2830505371094, 461.6656799316406, 471.04833984375, 480.43096923828125, 489.8135986328125, 499.19622802734375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 6.0, 9.0, 8.0, 11.0, 16.0, 18.0, 16.0, 21.0, 25.0, 22.0, 31.0, 28.0, 40.0, 31.0, 49.0, 28.0, 39.0, 45.0, 45.0, 55.0, 45.0, 44.0, 35.0, 45.0, 31.0, 40.0, 25.0, 27.0, 24.0, 24.0, 21.0, 17.0, 9.0, 10.0, 9.0, 6.0, 10.0, 5.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.98966979980469, -41.68730545043945, -40.38494110107422, -39.082576751708984, -37.78021240234375, -36.477848052978516, -35.17548370361328, -33.87312316894531, -32.57075500488281, -31.268390655517578, -29.966026306152344, -28.66366195678711, -27.361297607421875, -26.05893325805664, -24.75657081604004, -23.454206466674805, -22.151844024658203, -20.84947967529297, -19.547115325927734, -18.2447509765625, -16.942386627197266, -15.640023231506348, -14.33765983581543, -13.035295486450195, -11.732931137084961, -10.430566787719727, -9.128202438354492, -7.825839042663574, -6.52347469329834, -5.2211103439331055, -3.9187464714050293, -2.616382598876953, -1.3140182495117188, -0.011654138565063477, 1.2907099723815918, 2.593074083328247, 3.8954381942749023, 5.197802543640137, 6.500166416168213, 7.802530288696289, 9.104894638061523, 10.407258987426758, 11.709623336791992, 13.01198673248291, 14.314351081848145, 15.616715431213379, 16.919078826904297, 18.22144317626953, 19.523807525634766, 20.826171875, 22.128536224365234, 23.43090057373047, 24.733264923095703, 26.035629272460938, 27.33799171447754, 28.640356063842773, 29.942720413208008, 31.245084762573242, 32.547447204589844, 33.84981155395508, 35.15217590332031, 36.45454025268555, 37.75690460205078, 39.059268951416016, 40.36163330078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 5.0, 7.0, 6.0, 11.0, 10.0, 11.0, 18.0, 16.0, 10.0, 25.0, 26.0, 27.0, 24.0, 24.0, 35.0, 34.0, 45.0, 34.0, 47.0, 38.0, 46.0, 40.0, 50.0, 36.0, 44.0, 35.0, 39.0, 32.0, 32.0, 22.0, 26.0, 12.0, 18.0, 29.0, 12.0, 17.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0703125, -7.85040283203125, -7.6304931640625, -7.41058349609375, -7.190673828125, -6.97076416015625, -6.7508544921875, -6.53094482421875, -6.31103515625, -6.09112548828125, -5.8712158203125, -5.65130615234375, -5.431396484375, -5.21148681640625, -4.9915771484375, -4.77166748046875, -4.5517578125, -4.33184814453125, -4.1119384765625, -3.89202880859375, -3.672119140625, -3.45220947265625, -3.2322998046875, -3.01239013671875, -2.79248046875, -2.57257080078125, -2.3526611328125, -2.13275146484375, -1.912841796875, -1.69293212890625, -1.4730224609375, -1.25311279296875, -1.033203125, -0.81329345703125, -0.5933837890625, -0.37347412109375, -0.153564453125, 0.06634521484375, 0.2862548828125, 0.50616455078125, 0.72607421875, 0.94598388671875, 1.1658935546875, 1.38580322265625, 1.605712890625, 1.82562255859375, 2.0455322265625, 2.26544189453125, 2.4853515625, 2.70526123046875, 2.9251708984375, 3.14508056640625, 3.364990234375, 3.58489990234375, 3.8048095703125, 4.02471923828125, 4.24462890625, 4.46453857421875, 4.6844482421875, 4.90435791015625, 5.124267578125, 5.34417724609375, 5.5640869140625, 5.78399658203125, 6.00390625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 12.0, 18.0, 13.0, 32.0, 38.0, 57.0, 83.0, 137.0, 181.0, 311.0, 438.0, 691.0, 1202.0, 1826.0, 2794.0, 4257.0, 6622.0, 10568.0, 16768.0, 27485.0, 46293.0, 81158.0, 153561.0, 271272.0, 187902.0, 96606.0, 53858.0, 31800.0, 19160.0, 12017.0, 7724.0, 4924.0, 3038.0, 2020.0, 1272.0, 810.0, 544.0, 379.0, 237.0, 157.0, 101.0, 68.0, 49.0, 30.0, 8.0, 15.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9814453125, -0.9494171142578125, -0.917388916015625, -0.8853607177734375, -0.85333251953125, -0.8213043212890625, -0.789276123046875, -0.7572479248046875, -0.7252197265625, -0.6931915283203125, -0.661163330078125, -0.6291351318359375, -0.59710693359375, -0.5650787353515625, -0.533050537109375, -0.5010223388671875, -0.468994140625, -0.4369659423828125, -0.404937744140625, -0.3729095458984375, -0.34088134765625, -0.3088531494140625, -0.276824951171875, -0.2447967529296875, -0.2127685546875, -0.1807403564453125, -0.148712158203125, -0.1166839599609375, -0.08465576171875, -0.0526275634765625, -0.020599365234375, 0.0114288330078125, 0.04345703125, 0.0754852294921875, 0.107513427734375, 0.1395416259765625, 0.17156982421875, 0.2035980224609375, 0.235626220703125, 0.2676544189453125, 0.2996826171875, 0.3317108154296875, 0.363739013671875, 0.3957672119140625, 0.42779541015625, 0.4598236083984375, 0.491851806640625, 0.5238800048828125, 0.555908203125, 0.5879364013671875, 0.619964599609375, 0.6519927978515625, 0.68402099609375, 0.7160491943359375, 0.748077392578125, 0.7801055908203125, 0.8121337890625, 0.8441619873046875, 0.876190185546875, 0.9082183837890625, 0.94024658203125, 0.9722747802734375, 1.004302978515625, 1.0363311767578125, 1.068359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 4.0, 8.0, 11.0, 8.0, 18.0, 12.0, 15.0, 14.0, 27.0, 28.0, 23.0, 22.0, 28.0, 39.0, 39.0, 37.0, 32.0, 28.0, 36.0, 1068.0, 56.0, 30.0, 40.0, 39.0, 38.0, 27.0, 47.0, 39.0, 16.0, 23.0, 23.0, 18.0, 23.0, 12.0, 17.0, 10.0, 10.0, 10.0, 15.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.5, -4.365966796875, -4.23193359375, -4.097900390625, -3.9638671875, -3.829833984375, -3.69580078125, -3.561767578125, -3.427734375, -3.293701171875, -3.15966796875, -3.025634765625, -2.8916015625, -2.757568359375, -2.62353515625, -2.489501953125, -2.35546875, -2.221435546875, -2.08740234375, -1.953369140625, -1.8193359375, -1.685302734375, -1.55126953125, -1.417236328125, -1.283203125, -1.149169921875, -1.01513671875, -0.881103515625, -0.7470703125, -0.613037109375, -0.47900390625, -0.344970703125, -0.2109375, -0.076904296875, 0.05712890625, 0.191162109375, 0.3251953125, 0.459228515625, 0.59326171875, 0.727294921875, 0.861328125, 0.995361328125, 1.12939453125, 1.263427734375, 1.3974609375, 1.531494140625, 1.66552734375, 1.799560546875, 1.93359375, 2.067626953125, 2.20166015625, 2.335693359375, 2.4697265625, 2.603759765625, 2.73779296875, 2.871826171875, 3.005859375, 3.139892578125, 3.27392578125, 3.407958984375, 3.5419921875, 3.676025390625, 3.81005859375, 3.944091796875, 4.078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 1.0, 3.0, 6.0, 12.0, 14.0, 22.0, 27.0, 49.0, 53.0, 85.0, 156.0, 221.0, 277.0, 484.0, 704.0, 1002.0, 1466.0, 2045.0, 2958.0, 4496.0, 6990.0, 10623.0, 16256.0, 25742.0, 40777.0, 67166.0, 116804.0, 203490.0, 1264490.0, 130907.0, 74756.0, 44905.0, 27828.0, 17872.0, 11430.0, 7526.0, 5010.0, 3273.0, 2236.0, 1544.0, 1062.0, 737.0, 536.0, 323.0, 272.0, 160.0, 103.0, 80.0, 54.0, 36.0, 21.0, 15.0, 12.0, 9.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.78564453125, -0.7603836059570312, -0.7351226806640625, -0.7098617553710938, -0.684600830078125, -0.6593399047851562, -0.6340789794921875, -0.6088180541992188, -0.58355712890625, -0.5582962036132812, -0.5330352783203125, -0.5077743530273438, -0.482513427734375, -0.45725250244140625, -0.4319915771484375, -0.40673065185546875, -0.3814697265625, -0.35620880126953125, -0.3309478759765625, -0.30568695068359375, -0.280426025390625, -0.25516510009765625, -0.2299041748046875, -0.20464324951171875, -0.17938232421875, -0.15412139892578125, -0.1288604736328125, -0.10359954833984375, -0.078338623046875, -0.05307769775390625, -0.0278167724609375, -0.00255584716796875, 0.022705078125, 0.04796600341796875, 0.0732269287109375, 0.09848785400390625, 0.123748779296875, 0.14900970458984375, 0.1742706298828125, 0.19953155517578125, 0.22479248046875, 0.25005340576171875, 0.2753143310546875, 0.30057525634765625, 0.325836181640625, 0.35109710693359375, 0.3763580322265625, 0.40161895751953125, 0.4268798828125, 0.45214080810546875, 0.4774017333984375, 0.5026626586914062, 0.527923583984375, 0.5531845092773438, 0.5784454345703125, 0.6037063598632812, 0.62896728515625, 0.6542282104492188, 0.6794891357421875, 0.7047500610351562, 0.730010986328125, 0.7552719116210938, 0.7805328369140625, 0.8057937622070312, 0.8310546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 10.0, 13.0, 11.0, 16.0, 17.0, 32.0, 33.0, 34.0, 38.0, 41.0, 35.0, 49.0, 64.0, 54.0, 57.0, 73.0, 47.0, 56.0, 52.0, 31.0, 38.0, 44.0, 29.0, 24.0, 19.0, 12.0, 10.0, 9.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0027980804443359375, -0.002721160650253296, -0.0026442408561706543, -0.0025673210620880127, -0.002490401268005371, -0.0024134814739227295, -0.002336561679840088, -0.0022596418857574463, -0.0021827220916748047, -0.002105802297592163, -0.0020288825035095215, -0.0019519627094268799, -0.0018750429153442383, -0.0017981231212615967, -0.001721203327178955, -0.0016442835330963135, -0.0015673637390136719, -0.0014904439449310303, -0.0014135241508483887, -0.001336604356765747, -0.0012596845626831055, -0.0011827647686004639, -0.0011058449745178223, -0.0010289251804351807, -0.0009520053863525391, -0.0008750855922698975, -0.0007981657981872559, -0.0007212460041046143, -0.0006443262100219727, -0.0005674064159393311, -0.0004904866218566895, -0.00041356682777404785, -0.00033664703369140625, -0.00025972723960876465, -0.00018280744552612305, -0.00010588765144348145, -2.8967857360839844e-05, 4.795193672180176e-05, 0.00012487173080444336, 0.00020179152488708496, 0.00027871131896972656, 0.00035563111305236816, 0.00043255090713500977, 0.0005094707012176514, 0.000586390495300293, 0.0006633102893829346, 0.0007402300834655762, 0.0008171498775482178, 0.0008940696716308594, 0.000970989465713501, 0.0010479092597961426, 0.0011248290538787842, 0.0012017488479614258, 0.0012786686420440674, 0.001355588436126709, 0.0014325082302093506, 0.0015094280242919922, 0.0015863478183746338, 0.0016632676124572754, 0.001740187406539917, 0.0018171072006225586, 0.0018940269947052002, 0.001970946788787842, 0.0020478665828704834, 0.002124786376953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 8.0, 9.0, 12.0, 15.0, 12.0, 38.0, 37.0, 49.0, 57.0, 71.0, 130.0, 206.0, 563.0, 14552.0, 1029590.0, 2236.0, 363.0, 172.0, 99.0, 84.0, 50.0, 39.0, 29.0, 28.0, 19.0, 10.0, 16.0, 10.0, 13.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.053021907806396484, -0.05108165740966797, -0.04914140701293945, -0.04720115661621094, -0.04526090621948242, -0.043320655822753906, -0.04138040542602539, -0.039440155029296875, -0.03749990463256836, -0.035559654235839844, -0.03361940383911133, -0.03167915344238281, -0.029738903045654297, -0.02779865264892578, -0.025858402252197266, -0.02391815185546875, -0.021977901458740234, -0.02003765106201172, -0.018097400665283203, -0.016157150268554688, -0.014216899871826172, -0.012276649475097656, -0.01033639907836914, -0.008396148681640625, -0.006455898284912109, -0.004515647888183594, -0.002575397491455078, -0.0006351470947265625, 0.0013051033020019531, 0.0032453536987304688, 0.005185604095458984, 0.0071258544921875, 0.009066104888916016, 0.011006355285644531, 0.012946605682373047, 0.014886856079101562, 0.016827106475830078, 0.018767356872558594, 0.02070760726928711, 0.022647857666015625, 0.02458810806274414, 0.026528358459472656, 0.028468608856201172, 0.030408859252929688, 0.0323491096496582, 0.03428936004638672, 0.036229610443115234, 0.03816986083984375, 0.040110111236572266, 0.04205036163330078, 0.0439906120300293, 0.04593086242675781, 0.04787111282348633, 0.049811363220214844, 0.05175161361694336, 0.053691864013671875, 0.05563211441040039, 0.057572364807128906, 0.05951261520385742, 0.06145286560058594, 0.06339311599731445, 0.06533336639404297, 0.06727361679077148, 0.0692138671875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 256.0, 696.0, 59.0, 2.0], "bins": [-0.020843908190727234, -0.020503737032413483, -0.02016356773674488, -0.01982339657843113, -0.019483225420117378, -0.019143056124448776, -0.018802884966135025, -0.018462713807821274, -0.018122544512152672, -0.01778237335383892, -0.01744220405817032, -0.017102032899856567, -0.016761861741542816, -0.016421692445874214, -0.016081521287560463, -0.01574135012924671, -0.01540117897093296, -0.015061008743941784, -0.014720837585628033, -0.014380667358636856, -0.01404049713164568, -0.013700325973331928, -0.013360155746340752, -0.013019984588027, -0.012679815292358398, -0.012339645065367222, -0.01199947390705347, -0.011659303680062294, -0.011319133453071117, -0.010978962294757366, -0.01063879206776619, -0.010298620909452438, -0.009958450682461262, -0.009618280455470085, -0.009278109297156334, -0.008937939070165157, -0.00859776884317398, -0.00825759768486023, -0.007917427457869053, -0.007577256765216589, -0.007237086072564125, -0.006896915379911661, -0.0065567451529204845, -0.006216574460268021, -0.005876403767615557, -0.005536233074963093, -0.005196062847971916, -0.004855892155319452, -0.004515721928328276, -0.004175551235675812, -0.0038353807758539915, -0.0034952103160321712, -0.0031550396233797073, -0.002814869163557887, -0.002474698703736067, -0.002134528011083603, -0.0017943574348464608, -0.0014541868586093187, -0.0011140163987874985, -0.0007738458225503564, -0.0004336752463132143, -9.350467007607222e-05, 0.00024666578974574804, 0.000586836482398212, 0.0009270069422200322]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 12.0, 9.0, 19.0, 19.0, 28.0, 22.0, 24.0, 21.0, 18.0, 35.0, 38.0, 48.0, 40.0, 47.0, 42.0, 39.0, 44.0, 55.0, 49.0, 40.0, 41.0, 50.0, 40.0, 36.0, 36.0, 25.0, 15.0, 18.0, 9.0, 9.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012969970703125, -0.0012514535337686539, -0.0012059099972248077, -0.0011603664606809616, -0.0011148229241371155, -0.0010692793875932693, -0.0010237358510494232, -0.000978192314505577, -0.000932648777961731, -0.0008871052414178848, -0.0008415617048740387, -0.0007960181683301926, -0.0007504746317863464, -0.0007049310952425003, -0.0006593875586986542, -0.000613844022154808, -0.0005683004856109619, -0.0005227569490671158, -0.00047721341252326965, -0.0004316698759794235, -0.0003861263394355774, -0.00034058280289173126, -0.00029503926634788513, -0.000249495729804039, -0.00020395219326019287, -0.00015840865671634674, -0.00011286512017250061, -6.732158362865448e-05, -2.177804708480835e-05, 2.376548945903778e-05, 6.930902600288391e-05, 0.00011485256254673004, 0.00016039609909057617, 0.0002059396356344223, 0.00025148317217826843, 0.00029702670872211456, 0.0003425702452659607, 0.0003881137818098068, 0.00043365731835365295, 0.0004792008548974991, 0.0005247443914413452, 0.0005702879279851913, 0.0006158314645290375, 0.0006613750010728836, 0.0007069185376167297, 0.0007524620741605759, 0.000798005610704422, 0.0008435491472482681, 0.0008890926837921143, 0.0009346362203359604, 0.0009801797568798065, 0.0010257232934236526, 0.0010712668299674988, 0.001116810366511345, 0.001162353903055191, 0.0012078974395990372, 0.0012534409761428833, 0.0012989845126867294, 0.0013445280492305756, 0.0013900715857744217, 0.0014356151223182678, 0.001481158658862114, 0.00152670219540596, 0.0015722457319498062, 0.0016177892684936523]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 5.0, 7.0, 6.0, 11.0, 10.0, 11.0, 18.0, 16.0, 10.0, 25.0, 26.0, 27.0, 24.0, 24.0, 35.0, 34.0, 45.0, 34.0, 47.0, 38.0, 46.0, 40.0, 50.0, 36.0, 44.0, 34.0, 40.0, 32.0, 32.0, 22.0, 26.0, 12.0, 18.0, 29.0, 12.0, 17.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0703125, -7.85040283203125, -7.6304931640625, -7.41058349609375, -7.190673828125, -6.97076416015625, -6.7508544921875, -6.53094482421875, -6.31103515625, -6.09112548828125, -5.8712158203125, -5.65130615234375, -5.431396484375, -5.21148681640625, -4.9915771484375, -4.77166748046875, -4.5517578125, -4.33184814453125, -4.1119384765625, -3.89202880859375, -3.672119140625, -3.45220947265625, -3.2322998046875, -3.01239013671875, -2.79248046875, -2.57257080078125, -2.3526611328125, -2.13275146484375, -1.912841796875, -1.69293212890625, -1.4730224609375, -1.25311279296875, -1.033203125, -0.81329345703125, -0.5933837890625, -0.37347412109375, -0.153564453125, 0.06634521484375, 0.2862548828125, 0.50616455078125, 0.72607421875, 0.94598388671875, 1.1658935546875, 1.38580322265625, 1.605712890625, 1.82562255859375, 2.0455322265625, 2.26544189453125, 2.4853515625, 2.70526123046875, 2.9251708984375, 3.14508056640625, 3.364990234375, 3.58489990234375, 3.8048095703125, 4.02471923828125, 4.24462890625, 4.46453857421875, 4.6844482421875, 4.90435791015625, 5.124267578125, 5.34417724609375, 5.5640869140625, 5.78399658203125, 6.00390625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 4.0, 13.0, 13.0, 25.0, 31.0, 37.0, 41.0, 70.0, 80.0, 129.0, 186.0, 289.0, 482.0, 805.0, 1541.0, 3408.0, 7936.0, 19861.0, 55908.0, 190053.0, 516114.0, 168220.0, 50632.0, 18592.0, 7341.0, 3098.0, 1481.0, 781.0, 431.0, 277.0, 177.0, 151.0, 95.0, 64.0, 39.0, 38.0, 22.0, 20.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.44921875, -7.2265625, -7.00390625, -6.78125, -6.55859375, -6.3359375, -6.11328125, -5.890625, -5.66796875, -5.4453125, -5.22265625, -5.0, -4.77734375, -4.5546875, -4.33203125, -4.109375, -3.88671875, -3.6640625, -3.44140625, -3.21875, -2.99609375, -2.7734375, -2.55078125, -2.328125, -2.10546875, -1.8828125, -1.66015625, -1.4375, -1.21484375, -0.9921875, -0.76953125, -0.546875, -0.32421875, -0.1015625, 0.12109375, 0.34375, 0.56640625, 0.7890625, 1.01171875, 1.234375, 1.45703125, 1.6796875, 1.90234375, 2.125, 2.34765625, 2.5703125, 2.79296875, 3.015625, 3.23828125, 3.4609375, 3.68359375, 3.90625, 4.12890625, 4.3515625, 4.57421875, 4.796875, 5.01953125, 5.2421875, 5.46484375, 5.6875, 5.91015625, 6.1328125, 6.35546875, 6.578125, 6.80078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 6.0, 13.0, 9.0, 16.0, 19.0, 15.0, 18.0, 25.0, 22.0, 35.0, 36.0, 39.0, 36.0, 44.0, 43.0, 58.0, 83.0, 367.0, 1601.0, 134.0, 53.0, 52.0, 43.0, 42.0, 22.0, 22.0, 18.0, 35.0, 23.0, 16.0, 19.0, 20.0, 13.0, 7.0, 10.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.75, -20.0615234375, -19.373046875, -18.6845703125, -17.99609375, -17.3076171875, -16.619140625, -15.9306640625, -15.2421875, -14.5537109375, -13.865234375, -13.1767578125, -12.48828125, -11.7998046875, -11.111328125, -10.4228515625, -9.734375, -9.0458984375, -8.357421875, -7.6689453125, -6.98046875, -6.2919921875, -5.603515625, -4.9150390625, -4.2265625, -3.5380859375, -2.849609375, -2.1611328125, -1.47265625, -0.7841796875, -0.095703125, 0.5927734375, 1.28125, 1.9697265625, 2.658203125, 3.3466796875, 4.03515625, 4.7236328125, 5.412109375, 6.1005859375, 6.7890625, 7.4775390625, 8.166015625, 8.8544921875, 9.54296875, 10.2314453125, 10.919921875, 11.6083984375, 12.296875, 12.9853515625, 13.673828125, 14.3623046875, 15.05078125, 15.7392578125, 16.427734375, 17.1162109375, 17.8046875, 18.4931640625, 19.181640625, 19.8701171875, 20.55859375, 21.2470703125, 21.935546875, 22.6240234375, 23.3125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 5.0, 11.0, 10.0, 27.0, 19.0, 37.0, 55.0, 66.0, 75.0, 121.0, 167.0, 272.0, 554.0, 3295.0, 3026852.0, 111512.0, 1321.0, 455.0, 260.0, 170.0, 99.0, 75.0, 74.0, 34.0, 38.0, 32.0, 17.0, 10.0, 12.0, 1.0, 4.0, 4.0, 7.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -48.7392578125, -46.603515625, -44.4677734375, -42.33203125, -40.1962890625, -38.060546875, -35.9248046875, -33.7890625, -31.6533203125, -29.517578125, -27.3818359375, -25.24609375, -23.1103515625, -20.974609375, -18.8388671875, -16.703125, -14.5673828125, -12.431640625, -10.2958984375, -8.16015625, -6.0244140625, -3.888671875, -1.7529296875, 0.3828125, 2.5185546875, 4.654296875, 6.7900390625, 8.92578125, 11.0615234375, 13.197265625, 15.3330078125, 17.46875, 19.6044921875, 21.740234375, 23.8759765625, 26.01171875, 28.1474609375, 30.283203125, 32.4189453125, 34.5546875, 36.6904296875, 38.826171875, 40.9619140625, 43.09765625, 45.2333984375, 47.369140625, 49.5048828125, 51.640625, 53.7763671875, 55.912109375, 58.0478515625, 60.18359375, 62.3193359375, 64.455078125, 66.5908203125, 68.7265625, 70.8623046875, 72.998046875, 75.1337890625, 77.26953125, 79.4052734375, 81.541015625, 83.6767578125, 85.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 241.0, 746.0, 29.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.654178619384766, -28.29014778137207, -22.926116943359375, -17.562084197998047, -12.198053359985352, -6.834022521972656, -1.4699897766113281, 3.8940391540527344, 9.258071899414062, 14.622102737426758, 19.986133575439453, 25.35016632080078, 30.714197158813477, 36.07822799682617, 41.4422607421875, 46.80628967285156, 52.17032241821289, 57.53435516357422, 62.89838409423828, 68.26242065429688, 73.62644958496094, 78.990478515625, 84.35450744628906, 89.71853637695312, 95.08257293701172, 100.44660186767578, 105.81063842773438, 111.17466735839844, 116.5386962890625, 121.90272521972656, 127.26676177978516, 132.63079833984375, 137.9948272705078, 143.35885620117188, 148.72288513183594, 154.0869140625, 159.45095825195312, 164.8149871826172, 170.17901611328125, 175.5430450439453, 180.90707397460938, 186.27110290527344, 191.6351318359375, 196.99917602539062, 202.3632049560547, 207.72723388671875, 213.0912628173828, 218.45529174804688, 223.8193359375, 229.18336486816406, 234.54739379882812, 239.91143798828125, 245.2754669189453, 250.63949584960938, 256.0035400390625, 261.3675537109375, 266.7315673828125, 272.0956115722656, 277.4596252441406, 282.82366943359375, 288.18768310546875, 293.5517272949219, 298.915771484375, 304.27978515625, 309.6438293457031]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 6.0, 9.0, 17.0, 19.0, 27.0, 27.0, 32.0, 27.0, 32.0, 42.0, 41.0, 47.0, 45.0, 61.0, 41.0, 50.0, 44.0, 45.0, 40.0, 52.0, 42.0, 38.0, 29.0, 31.0, 23.0, 18.0, 20.0, 12.0, 10.0, 14.0, 7.0, 8.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.50402069091797, -62.609405517578125, -60.71479034423828, -58.82017517089844, -56.925559997558594, -55.03094482421875, -53.136329650878906, -51.24171829223633, -49.347103118896484, -47.45248794555664, -45.5578727722168, -43.66325759887695, -41.76864242553711, -39.87403106689453, -37.97941589355469, -36.084800720214844, -34.190185546875, -32.295570373535156, -30.400955200195312, -28.50634002685547, -26.611726760864258, -24.717111587524414, -22.82249641418457, -20.92788314819336, -19.03326416015625, -17.138648986816406, -15.244034767150879, -13.349419593811035, -11.454805374145508, -9.560190200805664, -7.66557502746582, -5.770960807800293, -3.8763465881347656, -1.9817317724227905, -0.08711695671081543, 1.8074979782104492, 3.7021126747131348, 5.59672737121582, 7.491342544555664, 9.385956764221191, 11.280571937561035, 13.175187110900879, 15.069801330566406, 16.96441650390625, 18.859031677246094, 20.753646850585938, 22.64826202392578, 24.542875289916992, 26.437490463256836, 28.33210563659668, 30.226720809936523, 32.121334075927734, 34.01594924926758, 35.91056442260742, 37.805179595947266, 39.69979476928711, 41.59440994262695, 43.4890251159668, 45.38364028930664, 47.278255462646484, 49.17287063598633, 51.067481994628906, 52.96209716796875, 54.856712341308594, 56.75132751464844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 7.0, 11.0, 11.0, 5.0, 17.0, 14.0, 16.0, 20.0, 20.0, 31.0, 18.0, 32.0, 34.0, 33.0, 28.0, 39.0, 32.0, 53.0, 43.0, 42.0, 55.0, 26.0, 41.0, 42.0, 38.0, 27.0, 32.0, 34.0, 29.0, 24.0, 17.0, 20.0, 14.0, 13.0, 11.0, 18.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.1953125, -7.96917724609375, -7.7430419921875, -7.51690673828125, -7.290771484375, -7.06463623046875, -6.8385009765625, -6.61236572265625, -6.38623046875, -6.16009521484375, -5.9339599609375, -5.70782470703125, -5.481689453125, -5.25555419921875, -5.0294189453125, -4.80328369140625, -4.5771484375, -4.35101318359375, -4.1248779296875, -3.89874267578125, -3.672607421875, -3.44647216796875, -3.2203369140625, -2.99420166015625, -2.76806640625, -2.54193115234375, -2.3157958984375, -2.08966064453125, -1.863525390625, -1.63739013671875, -1.4112548828125, -1.18511962890625, -0.958984375, -0.73284912109375, -0.5067138671875, -0.28057861328125, -0.054443359375, 0.17169189453125, 0.3978271484375, 0.62396240234375, 0.85009765625, 1.07623291015625, 1.3023681640625, 1.52850341796875, 1.754638671875, 1.98077392578125, 2.2069091796875, 2.43304443359375, 2.6591796875, 2.88531494140625, 3.1114501953125, 3.33758544921875, 3.563720703125, 3.78985595703125, 4.0159912109375, 4.24212646484375, 4.46826171875, 4.69439697265625, 4.9205322265625, 5.14666748046875, 5.372802734375, 5.59893798828125, 5.8250732421875, 6.05120849609375, 6.27734375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 6.0, 18.0, 16.0, 14.0, 18.0, 26.0, 26.0, 42.0, 52.0, 63.0, 71.0, 118.0, 157.0, 285.0, 676.0, 1691.0, 7979.0, 121125.0, 2798810.0, 1220386.0, 36152.0, 4138.0, 1110.0, 449.0, 235.0, 149.0, 99.0, 63.0, 60.0, 52.0, 29.0, 22.0, 19.0, 15.0, 7.0, 17.0, 7.0, 16.0, 10.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-23.171875, -22.486572265625, -21.80126953125, -21.115966796875, -20.4306640625, -19.745361328125, -19.06005859375, -18.374755859375, -17.689453125, -17.004150390625, -16.31884765625, -15.633544921875, -14.9482421875, -14.262939453125, -13.57763671875, -12.892333984375, -12.20703125, -11.521728515625, -10.83642578125, -10.151123046875, -9.4658203125, -8.780517578125, -8.09521484375, -7.409912109375, -6.724609375, -6.039306640625, -5.35400390625, -4.668701171875, -3.9833984375, -3.298095703125, -2.61279296875, -1.927490234375, -1.2421875, -0.556884765625, 0.12841796875, 0.813720703125, 1.4990234375, 2.184326171875, 2.86962890625, 3.554931640625, 4.240234375, 4.925537109375, 5.61083984375, 6.296142578125, 6.9814453125, 7.666748046875, 8.35205078125, 9.037353515625, 9.72265625, 10.407958984375, 11.09326171875, 11.778564453125, 12.4638671875, 13.149169921875, 13.83447265625, 14.519775390625, 15.205078125, 15.890380859375, 16.57568359375, 17.260986328125, 17.9462890625, 18.631591796875, 19.31689453125, 20.002197265625, 20.6875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 14.0, 15.0, 35.0, 45.0, 55.0, 96.0, 186.0, 305.0, 414.0, 677.0, 773.0, 569.0, 351.0, 188.0, 129.0, 89.0, 41.0, 28.0, 21.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.328125, -26.7105712890625, -26.093017578125, -25.4754638671875, -24.85791015625, -24.2403564453125, -23.622802734375, -23.0052490234375, -22.3876953125, -21.7701416015625, -21.152587890625, -20.5350341796875, -19.91748046875, -19.2999267578125, -18.682373046875, -18.0648193359375, -17.447265625, -16.8297119140625, -16.212158203125, -15.5946044921875, -14.97705078125, -14.3594970703125, -13.741943359375, -13.1243896484375, -12.5068359375, -11.8892822265625, -11.271728515625, -10.6541748046875, -10.03662109375, -9.4190673828125, -8.801513671875, -8.1839599609375, -7.56640625, -6.9488525390625, -6.331298828125, -5.7137451171875, -5.09619140625, -4.4786376953125, -3.861083984375, -3.2435302734375, -2.6259765625, -2.0084228515625, -1.390869140625, -0.7733154296875, -0.15576171875, 0.4617919921875, 1.079345703125, 1.6968994140625, 2.314453125, 2.9320068359375, 3.549560546875, 4.1671142578125, 4.78466796875, 5.4022216796875, 6.019775390625, 6.6373291015625, 7.2548828125, 7.8724365234375, 8.489990234375, 9.1075439453125, 9.72509765625, 10.3426513671875, 10.960205078125, 11.5777587890625, 12.1953125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 8.0, 10.0, 8.0, 16.0, 21.0, 30.0, 60.0, 73.0, 98.0, 183.0, 226.0, 338.0, 621.0, 2859.0, 3823455.0, 363385.0, 1387.0, 515.0, 351.0, 207.0, 151.0, 93.0, 80.0, 33.0, 33.0, 19.0, 11.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -61.728515625, -58.76953125, -55.810546875, -52.8515625, -49.892578125, -46.93359375, -43.974609375, -41.015625, -38.056640625, -35.09765625, -32.138671875, -29.1796875, -26.220703125, -23.26171875, -20.302734375, -17.34375, -14.384765625, -11.42578125, -8.466796875, -5.5078125, -2.548828125, 0.41015625, 3.369140625, 6.328125, 9.287109375, 12.24609375, 15.205078125, 18.1640625, 21.123046875, 24.08203125, 27.041015625, 30.0, 32.958984375, 35.91796875, 38.876953125, 41.8359375, 44.794921875, 47.75390625, 50.712890625, 53.671875, 56.630859375, 59.58984375, 62.548828125, 65.5078125, 68.466796875, 71.42578125, 74.384765625, 77.34375, 80.302734375, 83.26171875, 86.220703125, 89.1796875, 92.138671875, 95.09765625, 98.056640625, 101.015625, 103.974609375, 106.93359375, 109.892578125, 112.8515625, 115.810546875, 118.76953125, 121.728515625, 124.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 291.0, 674.0, 40.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.37624740600586, -41.611297607421875, -28.846351623535156, -16.081401824951172, -3.316455841064453, 9.448490142822266, 22.213443756103516, 34.978389739990234, 47.74333572387695, 60.50828552246094, 73.27323150634766, 86.03817749023438, 98.80313110351562, 111.56806945800781, 124.33302307128906, 137.0979766845703, 149.8629150390625, 162.62786865234375, 175.39280700683594, 188.1577606201172, 200.92269897460938, 213.68765258789062, 226.45260620117188, 239.21755981445312, 251.9824981689453, 264.7474365234375, 277.51239013671875, 290.27734375, 303.04229736328125, 315.8072509765625, 328.57220458984375, 341.3371276855469, 354.10211181640625, 366.8670654296875, 379.63201904296875, 392.39697265625, 405.1618957519531, 417.9268493652344, 430.6918029785156, 443.4567565917969, 456.2216796875, 468.98663330078125, 481.7515869140625, 494.51654052734375, 507.2814636230469, 520.04638671875, 532.8114013671875, 545.5762939453125, 558.34130859375, 571.1062622070312, 583.8712158203125, 596.6361694335938, 609.401123046875, 622.166015625, 634.9310302734375, 647.6959228515625, 660.4608764648438, 673.225830078125, 685.9907836914062, 698.7557373046875, 711.5206909179688, 724.28564453125, 737.050537109375, 749.8154907226562, 762.5804443359375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 3.0, 8.0, 14.0, 15.0, 14.0, 14.0, 22.0, 26.0, 24.0, 26.0, 42.0, 22.0, 37.0, 31.0, 33.0, 46.0, 45.0, 29.0, 29.0, 39.0, 34.0, 38.0, 32.0, 32.0, 36.0, 43.0, 24.0, 35.0, 27.0, 23.0, 23.0, 20.0, 24.0, 12.0, 15.0, 10.0, 13.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0], "bins": [-45.539703369140625, -44.339481353759766, -43.13925552368164, -41.93903350830078, -40.738807678222656, -39.5385856628418, -38.33836364746094, -37.13813781738281, -35.93791580200195, -34.737693786621094, -33.53746795654297, -32.33724594116211, -31.137022018432617, -29.936798095703125, -28.736576080322266, -27.536352157592773, -26.33612823486328, -25.13590431213379, -23.935680389404297, -22.735458374023438, -21.535234451293945, -20.335010528564453, -19.134788513183594, -17.9345645904541, -16.73434066772461, -15.534116744995117, -14.333893775939941, -13.133670806884766, -11.933446884155273, -10.733222961425781, -9.532999992370605, -8.33277702331543, -7.1325531005859375, -5.9323296546936035, -4.7321062088012695, -3.5318827629089355, -2.3316593170166016, -1.1314358711242676, 0.0687875747680664, 1.2690105438232422, 2.4692344665527344, 3.6694579124450684, 4.869681358337402, 6.069904804229736, 7.27012825012207, 8.470352172851562, 9.670575141906738, 10.870798110961914, 12.071022033691406, 13.271245956420898, 14.471468925476074, 15.67169189453125, 16.871915817260742, 18.072139739990234, 19.272361755371094, 20.472585678100586, 21.672809600830078, 22.87303352355957, 24.073257446289062, 25.273479461669922, 26.473703384399414, 27.673927307128906, 28.874149322509766, 30.074373245239258, 31.27459716796875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 13.0, 7.0, 16.0, 14.0, 22.0, 27.0, 29.0, 40.0, 32.0, 46.0, 48.0, 38.0, 41.0, 54.0, 54.0, 59.0, 48.0, 45.0, 40.0, 53.0, 49.0, 36.0, 28.0, 31.0, 22.0, 16.0, 17.0, 14.0, 10.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.5267333984375, -10.240966796875, -9.9552001953125, -9.66943359375, -9.3836669921875, -9.097900390625, -8.8121337890625, -8.5263671875, -8.2406005859375, -7.954833984375, -7.6690673828125, -7.38330078125, -7.0975341796875, -6.811767578125, -6.5260009765625, -6.240234375, -5.9544677734375, -5.668701171875, -5.3829345703125, -5.09716796875, -4.8114013671875, -4.525634765625, -4.2398681640625, -3.9541015625, -3.6683349609375, -3.382568359375, -3.0968017578125, -2.81103515625, -2.5252685546875, -2.239501953125, -1.9537353515625, -1.66796875, -1.3822021484375, -1.096435546875, -0.8106689453125, -0.52490234375, -0.2391357421875, 0.046630859375, 0.3323974609375, 0.6181640625, 0.9039306640625, 1.189697265625, 1.4754638671875, 1.76123046875, 2.0469970703125, 2.332763671875, 2.6185302734375, 2.904296875, 3.1900634765625, 3.475830078125, 3.7615966796875, 4.04736328125, 4.3331298828125, 4.618896484375, 4.9046630859375, 5.1904296875, 5.4761962890625, 5.761962890625, 6.0477294921875, 6.33349609375, 6.6192626953125, 6.905029296875, 7.1907958984375, 7.4765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 9.0, 13.0, 10.0, 21.0, 37.0, 39.0, 73.0, 101.0, 167.0, 250.0, 371.0, 553.0, 818.0, 1257.0, 1867.0, 2638.0, 3949.0, 5947.0, 8987.0, 13689.0, 21012.0, 33716.0, 56008.0, 99467.0, 190835.0, 254240.0, 147146.0, 78761.0, 45961.0, 27941.0, 17742.0, 11647.0, 7706.0, 5164.0, 3391.0, 2335.0, 1525.0, 1009.0, 738.0, 443.0, 337.0, 208.0, 155.0, 73.0, 78.0, 34.0, 24.0, 21.0, 14.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.080078125, -1.0466461181640625, -1.013214111328125, -0.9797821044921875, -0.94635009765625, -0.9129180908203125, -0.879486083984375, -0.8460540771484375, -0.8126220703125, -0.7791900634765625, -0.745758056640625, -0.7123260498046875, -0.67889404296875, -0.6454620361328125, -0.612030029296875, -0.5785980224609375, -0.545166015625, -0.5117340087890625, -0.478302001953125, -0.4448699951171875, -0.41143798828125, -0.3780059814453125, -0.344573974609375, -0.3111419677734375, -0.2777099609375, -0.2442779541015625, -0.210845947265625, -0.1774139404296875, -0.14398193359375, -0.1105499267578125, -0.077117919921875, -0.0436859130859375, -0.01025390625, 0.0231781005859375, 0.056610107421875, 0.0900421142578125, 0.12347412109375, 0.1569061279296875, 0.190338134765625, 0.2237701416015625, 0.2572021484375, 0.2906341552734375, 0.324066162109375, 0.3574981689453125, 0.39093017578125, 0.4243621826171875, 0.457794189453125, 0.4912261962890625, 0.524658203125, 0.5580902099609375, 0.591522216796875, 0.6249542236328125, 0.65838623046875, 0.6918182373046875, 0.725250244140625, 0.7586822509765625, 0.7921142578125, 0.8255462646484375, 0.858978271484375, 0.8924102783203125, 0.92584228515625, 0.9592742919921875, 0.992706298828125, 1.0261383056640625, 1.0595703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 8.0, 15.0, 14.0, 9.0, 12.0, 13.0, 26.0, 19.0, 23.0, 25.0, 26.0, 23.0, 33.0, 31.0, 30.0, 39.0, 39.0, 37.0, 1068.0, 42.0, 40.0, 48.0, 34.0, 26.0, 38.0, 32.0, 26.0, 31.0, 25.0, 25.0, 21.0, 18.0, 23.0, 14.0, 13.0, 10.0, 8.0, 9.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.328125, -4.19268798828125, -4.0572509765625, -3.92181396484375, -3.786376953125, -3.65093994140625, -3.5155029296875, -3.38006591796875, -3.24462890625, -3.10919189453125, -2.9737548828125, -2.83831787109375, -2.702880859375, -2.56744384765625, -2.4320068359375, -2.29656982421875, -2.1611328125, -2.02569580078125, -1.8902587890625, -1.75482177734375, -1.619384765625, -1.48394775390625, -1.3485107421875, -1.21307373046875, -1.07763671875, -0.94219970703125, -0.8067626953125, -0.67132568359375, -0.535888671875, -0.40045166015625, -0.2650146484375, -0.12957763671875, 0.005859375, 0.14129638671875, 0.2767333984375, 0.41217041015625, 0.547607421875, 0.68304443359375, 0.8184814453125, 0.95391845703125, 1.08935546875, 1.22479248046875, 1.3602294921875, 1.49566650390625, 1.631103515625, 1.76654052734375, 1.9019775390625, 2.03741455078125, 2.1728515625, 2.30828857421875, 2.4437255859375, 2.57916259765625, 2.714599609375, 2.85003662109375, 2.9854736328125, 3.12091064453125, 3.25634765625, 3.39178466796875, 3.5272216796875, 3.66265869140625, 3.798095703125, 3.93353271484375, 4.0689697265625, 4.20440673828125, 4.33984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 12.0, 10.0, 17.0, 18.0, 37.0, 49.0, 78.0, 109.0, 151.0, 237.0, 365.0, 512.0, 688.0, 1064.0, 1602.0, 2451.0, 3669.0, 5782.0, 9076.0, 14354.0, 23362.0, 38742.0, 66905.0, 123502.0, 1116143.0, 400208.0, 120991.0, 65709.0, 37963.0, 23285.0, 14474.0, 8903.0, 5747.0, 3576.0, 2461.0, 1595.0, 1068.0, 723.0, 501.0, 322.0, 246.0, 134.0, 113.0, 68.0, 36.0, 31.0, 18.0, 12.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.015625, -0.9857406616210938, -0.9558563232421875, -0.9259719848632812, -0.896087646484375, -0.8662033081054688, -0.8363189697265625, -0.8064346313476562, -0.77655029296875, -0.7466659545898438, -0.7167816162109375, -0.6868972778320312, -0.657012939453125, -0.6271286010742188, -0.5972442626953125, -0.5673599243164062, -0.5374755859375, -0.5075912475585938, -0.4777069091796875, -0.44782257080078125, -0.417938232421875, -0.38805389404296875, -0.3581695556640625, -0.32828521728515625, -0.29840087890625, -0.26851654052734375, -0.2386322021484375, -0.20874786376953125, -0.178863525390625, -0.14897918701171875, -0.1190948486328125, -0.08921051025390625, -0.059326171875, -0.02944183349609375, 0.0004425048828125, 0.03032684326171875, 0.060211181640625, 0.09009552001953125, 0.1199798583984375, 0.14986419677734375, 0.17974853515625, 0.20963287353515625, 0.2395172119140625, 0.26940155029296875, 0.299285888671875, 0.32917022705078125, 0.3590545654296875, 0.38893890380859375, 0.4188232421875, 0.44870758056640625, 0.4785919189453125, 0.5084762573242188, 0.538360595703125, 0.5682449340820312, 0.5981292724609375, 0.6280136108398438, 0.65789794921875, 0.6877822875976562, 0.7176666259765625, 0.7475509643554688, 0.777435302734375, 0.8073196411132812, 0.8372039794921875, 0.8670883178710938, 0.89697265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 7.0, 8.0, 7.0, 17.0, 16.0, 21.0, 28.0, 37.0, 54.0, 58.0, 75.0, 83.0, 74.0, 73.0, 78.0, 78.0, 71.0, 50.0, 31.0, 30.0, 23.0, 23.0, 13.0, 9.0, 7.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00327301025390625, -0.003156006336212158, -0.0030390024185180664, -0.0029219985008239746, -0.002804994583129883, -0.002687990665435791, -0.0025709867477416992, -0.0024539828300476074, -0.0023369789123535156, -0.002219974994659424, -0.002102971076965332, -0.0019859671592712402, -0.0018689632415771484, -0.0017519593238830566, -0.0016349554061889648, -0.001517951488494873, -0.0014009475708007812, -0.0012839436531066895, -0.0011669397354125977, -0.0010499358177185059, -0.0009329319000244141, -0.0008159279823303223, -0.0006989240646362305, -0.0005819201469421387, -0.0004649162292480469, -0.0003479123115539551, -0.00023090839385986328, -0.00011390447616577148, 3.0994415283203125e-06, 0.00012010335922241211, 0.0002371072769165039, 0.0003541111946105957, 0.0004711151123046875, 0.0005881190299987793, 0.0007051229476928711, 0.0008221268653869629, 0.0009391307830810547, 0.0010561347007751465, 0.0011731386184692383, 0.00129014253616333, 0.0014071464538574219, 0.0015241503715515137, 0.0016411542892456055, 0.0017581582069396973, 0.001875162124633789, 0.001992166042327881, 0.0021091699600219727, 0.0022261738777160645, 0.0023431777954101562, 0.002460181713104248, 0.00257718563079834, 0.0026941895484924316, 0.0028111934661865234, 0.0029281973838806152, 0.003045201301574707, 0.003162205219268799, 0.0032792091369628906, 0.0033962130546569824, 0.0035132169723510742, 0.003630220890045166, 0.003747224807739258, 0.0038642287254333496, 0.003981232643127441, 0.004098236560821533, 0.004215240478515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 12.0, 26.0, 22.0, 35.0, 35.0, 51.0, 80.0, 122.0, 195.0, 347.0, 1559.0, 1009222.0, 35349.0, 732.0, 245.0, 140.0, 98.0, 64.0, 43.0, 35.0, 24.0, 14.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08575439453125, -0.0833578109741211, -0.08096122741699219, -0.07856464385986328, -0.07616806030273438, -0.07377147674560547, -0.07137489318847656, -0.06897830963134766, -0.06658172607421875, -0.06418514251708984, -0.06178855895996094, -0.05939197540283203, -0.056995391845703125, -0.05459880828857422, -0.05220222473144531, -0.049805641174316406, -0.0474090576171875, -0.045012474060058594, -0.04261589050292969, -0.04021930694580078, -0.037822723388671875, -0.03542613983154297, -0.03302955627441406, -0.030632972717285156, -0.02823638916015625, -0.025839805603027344, -0.023443222045898438, -0.02104663848876953, -0.018650054931640625, -0.01625347137451172, -0.013856887817382812, -0.011460304260253906, -0.009063720703125, -0.006667137145996094, -0.0042705535888671875, -0.0018739700317382812, 0.000522613525390625, 0.0029191970825195312, 0.0053157806396484375, 0.007712364196777344, 0.01010894775390625, 0.012505531311035156, 0.014902114868164062, 0.01729869842529297, 0.019695281982421875, 0.02209186553955078, 0.024488449096679688, 0.026885032653808594, 0.0292816162109375, 0.031678199768066406, 0.03407478332519531, 0.03647136688232422, 0.038867950439453125, 0.04126453399658203, 0.04366111755371094, 0.046057701110839844, 0.04845428466796875, 0.050850868225097656, 0.05324745178222656, 0.05564403533935547, 0.058040618896484375, 0.06043720245361328, 0.06283378601074219, 0.0652303695678711, 0.067626953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 109.0, 636.0, 257.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014509019674733281, -0.0011387320701032877, -0.0008265621145255864, -0.000514392158947885, -0.00020222226157784462, 0.0001099476357921958, 0.00042211764957755804, 0.0007342874305322766, 0.0010464574443176389, 0.0013586273416876793, 0.0016707973554730415, 0.0019829673692584038, 0.0022951371502131224, 0.002607306931167841, 0.002919476944953203, 0.0032316469587385654, 0.0035438169725239277, 0.00385598698630929, 0.004168157000094652, 0.004480326548218727, 0.004792496562004089, 0.005104666575789452, 0.005416836589574814, 0.005729006603360176, 0.006041176151484251, 0.006353346165269613, 0.0066655161790549755, 0.0069776857271790504, 0.007289855740964413, 0.007602025754749775, 0.007914195768535137, 0.0082263657823205, 0.008538535796105862, 0.008850705809891224, 0.009162875823676586, 0.009475045837461948, 0.00978721585124731, 0.010099384933710098, 0.01041155494749546, 0.010723724961280823, 0.011035894975066185, 0.011348064988851547, 0.01166023500263691, 0.011972405016422272, 0.012284575030207634, 0.012596745043992996, 0.012908915057778358, 0.013221084140241146, 0.013533255085349083, 0.013845425099134445, 0.014157595112919807, 0.01446976512670517, 0.014781935140490532, 0.015094105154275894, 0.015406275168061256, 0.01571844518184662, 0.01603061333298683, 0.016342783346772194, 0.016654953360557556, 0.01696712337434292, 0.01727929338812828, 0.017591463401913643, 0.017903633415699005, 0.018215803429484367, 0.01852797344326973]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 4.0, 4.0, 6.0, 8.0, 13.0, 15.0, 22.0, 10.0, 22.0, 18.0, 38.0, 23.0, 38.0, 38.0, 40.0, 43.0, 40.0, 40.0, 34.0, 40.0, 45.0, 48.0, 37.0, 35.0, 37.0, 33.0, 34.0, 32.0, 33.0, 16.0, 27.0, 23.0, 21.0, 17.0, 14.0, 14.0, 11.0, 7.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001601576805114746, -0.0015521403402090073, -0.0015027038753032684, -0.0014532674103975296, -0.0014038309454917908, -0.001354394480586052, -0.0013049580156803131, -0.0012555215507745743, -0.0012060850858688354, -0.0011566486209630966, -0.0011072121560573578, -0.001057775691151619, -0.0010083392262458801, -0.0009589027613401413, -0.0009094662964344025, -0.0008600298315286636, -0.0008105933666229248, -0.000761156901717186, -0.0007117204368114471, -0.0006622839719057083, -0.0006128475069999695, -0.0005634110420942307, -0.0005139745771884918, -0.000464538112282753, -0.00041510164737701416, -0.00036566518247127533, -0.0003162287175655365, -0.00026679225265979767, -0.00021735578775405884, -0.00016791932284832, -0.00011848285794258118, -6.904639303684235e-05, -1.9609928131103516e-05, 2.9826536774635315e-05, 7.926300168037415e-05, 0.00012869946658611298, 0.0001781359314918518, 0.00022757239639759064, 0.00027700886130332947, 0.0003264453262090683, 0.00037588179111480713, 0.00042531825602054596, 0.0004747547209262848, 0.0005241911858320236, 0.0005736276507377625, 0.0006230641156435013, 0.0006725005805492401, 0.0007219370454549789, 0.0007713735103607178, 0.0008208099752664566, 0.0008702464401721954, 0.0009196829050779343, 0.0009691193699836731, 0.001018555834889412, 0.0010679922997951508, 0.0011174287647008896, 0.0011668652296066284, 0.0012163016945123672, 0.001265738159418106, 0.001315174624323845, 0.0013646110892295837, 0.0014140475541353226, 0.0014634840190410614, 0.0015129204839468002, 0.001562356948852539]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 13.0, 7.0, 16.0, 14.0, 22.0, 27.0, 29.0, 40.0, 32.0, 46.0, 48.0, 38.0, 41.0, 54.0, 54.0, 59.0, 48.0, 44.0, 41.0, 53.0, 49.0, 36.0, 28.0, 31.0, 22.0, 16.0, 17.0, 14.0, 10.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.5267333984375, -10.240966796875, -9.9552001953125, -9.66943359375, -9.3836669921875, -9.097900390625, -8.8121337890625, -8.5263671875, -8.2406005859375, -7.954833984375, -7.6690673828125, -7.38330078125, -7.0975341796875, -6.811767578125, -6.5260009765625, -6.240234375, -5.9544677734375, -5.668701171875, -5.3829345703125, -5.09716796875, -4.8114013671875, -4.525634765625, -4.2398681640625, -3.9541015625, -3.6683349609375, -3.382568359375, -3.0968017578125, -2.81103515625, -2.5252685546875, -2.239501953125, -1.9537353515625, -1.66796875, -1.3822021484375, -1.096435546875, -0.8106689453125, -0.52490234375, -0.2391357421875, 0.046630859375, 0.3323974609375, 0.6181640625, 0.9039306640625, 1.189697265625, 1.4754638671875, 1.76123046875, 2.0469970703125, 2.332763671875, 2.6185302734375, 2.904296875, 3.1900634765625, 3.475830078125, 3.7615966796875, 4.04736328125, 4.3331298828125, 4.618896484375, 4.9046630859375, 5.1904296875, 5.4761962890625, 5.761962890625, 6.0477294921875, 6.33349609375, 6.6192626953125, 6.905029296875, 7.1907958984375, 7.4765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 16.0, 18.0, 24.0, 31.0, 49.0, 73.0, 97.0, 172.0, 299.0, 505.0, 1006.0, 2305.0, 6779.0, 38595.0, 653938.0, 310631.0, 24822.0, 5251.0, 1894.0, 852.0, 462.0, 256.0, 127.0, 99.0, 62.0, 39.0, 34.0, 26.0, 15.0, 20.0, 9.0, 8.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.4417724609375, -18.914794921875, -18.3878173828125, -17.86083984375, -17.3338623046875, -16.806884765625, -16.2799072265625, -15.7529296875, -15.2259521484375, -14.698974609375, -14.1719970703125, -13.64501953125, -13.1180419921875, -12.591064453125, -12.0640869140625, -11.537109375, -11.0101318359375, -10.483154296875, -9.9561767578125, -9.42919921875, -8.9022216796875, -8.375244140625, -7.8482666015625, -7.3212890625, -6.7943115234375, -6.267333984375, -5.7403564453125, -5.21337890625, -4.6864013671875, -4.159423828125, -3.6324462890625, -3.10546875, -2.5784912109375, -2.051513671875, -1.5245361328125, -0.99755859375, -0.4705810546875, 0.056396484375, 0.5833740234375, 1.1103515625, 1.6373291015625, 2.164306640625, 2.6912841796875, 3.21826171875, 3.7452392578125, 4.272216796875, 4.7991943359375, 5.326171875, 5.8531494140625, 6.380126953125, 6.9071044921875, 7.43408203125, 7.9610595703125, 8.488037109375, 9.0150146484375, 9.5419921875, 10.0689697265625, 10.595947265625, 11.1229248046875, 11.64990234375, 12.1768798828125, 12.703857421875, 13.2308349609375, 13.7578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 11.0, 14.0, 17.0, 21.0, 26.0, 26.0, 38.0, 52.0, 50.0, 45.0, 58.0, 69.0, 163.0, 1827.0, 180.0, 58.0, 62.0, 49.0, 42.0, 47.0, 28.0, 30.0, 29.0, 13.0, 22.0, 10.0, 7.0, 5.0, 12.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.18310546875, -21.2412109375, -20.29931640625, -19.357421875, -18.41552734375, -17.4736328125, -16.53173828125, -15.58984375, -14.64794921875, -13.7060546875, -12.76416015625, -11.822265625, -10.88037109375, -9.9384765625, -8.99658203125, -8.0546875, -7.11279296875, -6.1708984375, -5.22900390625, -4.287109375, -3.34521484375, -2.4033203125, -1.46142578125, -0.51953125, 0.42236328125, 1.3642578125, 2.30615234375, 3.248046875, 4.18994140625, 5.1318359375, 6.07373046875, 7.015625, 7.95751953125, 8.8994140625, 9.84130859375, 10.783203125, 11.72509765625, 12.6669921875, 13.60888671875, 14.55078125, 15.49267578125, 16.4345703125, 17.37646484375, 18.318359375, 19.26025390625, 20.2021484375, 21.14404296875, 22.0859375, 23.02783203125, 23.9697265625, 24.91162109375, 25.853515625, 26.79541015625, 27.7373046875, 28.67919921875, 29.62109375, 30.56298828125, 31.5048828125, 32.44677734375, 33.388671875, 34.33056640625, 35.2724609375, 36.21435546875, 37.15625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 1.0, 10.0, 9.0, 11.0, 3.0, 7.0, 18.0, 20.0, 20.0, 29.0, 31.0, 54.0, 78.0, 102.0, 169.0, 393.0, 1769.0, 88620.0, 3049401.0, 3738.0, 565.0, 200.0, 106.0, 96.0, 59.0, 39.0, 35.0, 21.0, 28.0, 19.0, 12.0, 9.0, 7.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-110.6875, -107.8603515625, -105.033203125, -102.2060546875, -99.37890625, -96.5517578125, -93.724609375, -90.8974609375, -88.0703125, -85.2431640625, -82.416015625, -79.5888671875, -76.76171875, -73.9345703125, -71.107421875, -68.2802734375, -65.453125, -62.6259765625, -59.798828125, -56.9716796875, -54.14453125, -51.3173828125, -48.490234375, -45.6630859375, -42.8359375, -40.0087890625, -37.181640625, -34.3544921875, -31.52734375, -28.7001953125, -25.873046875, -23.0458984375, -20.21875, -17.3916015625, -14.564453125, -11.7373046875, -8.91015625, -6.0830078125, -3.255859375, -0.4287109375, 2.3984375, 5.2255859375, 8.052734375, 10.8798828125, 13.70703125, 16.5341796875, 19.361328125, 22.1884765625, 25.015625, 27.8427734375, 30.669921875, 33.4970703125, 36.32421875, 39.1513671875, 41.978515625, 44.8056640625, 47.6328125, 50.4599609375, 53.287109375, 56.1142578125, 58.94140625, 61.7685546875, 64.595703125, 67.4228515625, 70.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 178.0, 813.0, 25.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.71171569824219, -33.06572341918945, -25.41973114013672, -17.773738861083984, -10.12774658203125, -2.4817543029785156, 5.164237976074219, 12.810230255126953, 20.456222534179688, 28.102214813232422, 35.748207092285156, 43.39419937133789, 51.040191650390625, 58.68618392944336, 66.3321762084961, 73.97816467285156, 81.62416076660156, 89.27015686035156, 96.91614532470703, 104.5621337890625, 112.2081298828125, 119.8541259765625, 127.50011444091797, 135.14610290527344, 142.79209899902344, 150.43809509277344, 158.08407592773438, 165.73007202148438, 173.37606811523438, 181.02206420898438, 188.66806030273438, 196.3140411376953, 203.96002197265625, 211.60601806640625, 219.25201416015625, 226.8979949951172, 234.5439910888672, 242.1899871826172, 249.83596801757812, 257.4819641113281, 265.1279602050781, 272.7739562988281, 280.4199523925781, 288.0659484863281, 295.7119140625, 303.35791015625, 311.00390625, 318.64990234375, 326.2958984375, 333.94189453125, 341.587890625, 349.23388671875, 356.8798828125, 364.5258483886719, 372.1718444824219, 379.8178405761719, 387.4638366699219, 395.1098327636719, 402.7558288574219, 410.4018249511719, 418.04779052734375, 425.69378662109375, 433.33978271484375, 440.98577880859375, 448.63177490234375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 7.0, 4.0, 5.0, 6.0, 11.0, 9.0, 9.0, 17.0, 14.0, 22.0, 17.0, 26.0, 20.0, 34.0, 32.0, 36.0, 33.0, 34.0, 42.0, 32.0, 33.0, 43.0, 36.0, 47.0, 38.0, 49.0, 42.0, 32.0, 32.0, 35.0, 26.0, 20.0, 26.0, 27.0, 28.0, 12.0, 12.0, 11.0, 9.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-77.7824478149414, -75.5604019165039, -73.3383560180664, -71.1163101196289, -68.8942642211914, -66.67222595214844, -64.45018005371094, -62.22813034057617, -60.00608825683594, -57.78404235839844, -55.56199645996094, -53.33995056152344, -51.1179084777832, -48.8958625793457, -46.6738166809082, -44.4517707824707, -42.2297248840332, -40.0076789855957, -37.7856330871582, -35.56359100341797, -33.34154510498047, -31.11949920654297, -28.89745330810547, -26.67540740966797, -24.4533634185791, -22.2313175201416, -20.009273529052734, -17.787227630615234, -15.56518268585205, -13.343137741088867, -11.121091842651367, -8.899046897888184, -6.677001953125, -4.454957008361816, -2.2329115867614746, -0.010866165161132812, 2.211178779602051, 4.433223724365234, 6.655269622802734, 8.877314567565918, 11.099359512329102, 13.321404457092285, 15.543449401855469, 17.76549530029297, 19.98754119873047, 22.209585189819336, 24.431631088256836, 26.653675079345703, 28.875720977783203, 31.097766876220703, 33.3198127746582, 35.54185485839844, 37.76390075683594, 39.98594665527344, 42.20799255371094, 44.43003845214844, 46.65208435058594, 48.87413024902344, 51.09617614746094, 53.31822204589844, 55.54026412963867, 57.76231002807617, 59.98435592651367, 62.20640182495117, 64.4284439086914]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 10.0, 5.0, 10.0, 10.0, 14.0, 26.0, 30.0, 25.0, 31.0, 35.0, 29.0, 34.0, 51.0, 35.0, 39.0, 52.0, 50.0, 49.0, 47.0, 44.0, 49.0, 39.0, 46.0, 34.0, 31.0, 24.0, 15.0, 25.0, 17.0, 12.0, 9.0, 11.0, 8.0, 7.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-10.4765625, -10.19769287109375, -9.9188232421875, -9.63995361328125, -9.361083984375, -9.08221435546875, -8.8033447265625, -8.52447509765625, -8.24560546875, -7.96673583984375, -7.6878662109375, -7.40899658203125, -7.130126953125, -6.85125732421875, -6.5723876953125, -6.29351806640625, -6.0146484375, -5.73577880859375, -5.4569091796875, -5.17803955078125, -4.899169921875, -4.62030029296875, -4.3414306640625, -4.06256103515625, -3.78369140625, -3.50482177734375, -3.2259521484375, -2.94708251953125, -2.668212890625, -2.38934326171875, -2.1104736328125, -1.83160400390625, -1.552734375, -1.27386474609375, -0.9949951171875, -0.71612548828125, -0.437255859375, -0.15838623046875, 0.1204833984375, 0.39935302734375, 0.67822265625, 0.95709228515625, 1.2359619140625, 1.51483154296875, 1.793701171875, 2.07257080078125, 2.3514404296875, 2.63031005859375, 2.9091796875, 3.18804931640625, 3.4669189453125, 3.74578857421875, 4.024658203125, 4.30352783203125, 4.5823974609375, 4.86126708984375, 5.14013671875, 5.41900634765625, 5.6978759765625, 5.97674560546875, 6.255615234375, 6.53448486328125, 6.8133544921875, 7.09222412109375, 7.37109375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 13.0, 13.0, 8.0, 19.0, 17.0, 37.0, 38.0, 58.0, 84.0, 137.0, 223.0, 382.0, 760.0, 1401.0, 3346.0, 9849.0, 40141.0, 259545.0, 1313562.0, 1876633.0, 569429.0, 90945.0, 17820.0, 5489.0, 2171.0, 930.0, 486.0, 258.0, 167.0, 89.0, 54.0, 50.0, 32.0, 31.0, 18.0, 19.0, 9.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-15.0078125, -14.6251220703125, -14.242431640625, -13.8597412109375, -13.47705078125, -13.0943603515625, -12.711669921875, -12.3289794921875, -11.9462890625, -11.5635986328125, -11.180908203125, -10.7982177734375, -10.41552734375, -10.0328369140625, -9.650146484375, -9.2674560546875, -8.884765625, -8.5020751953125, -8.119384765625, -7.7366943359375, -7.35400390625, -6.9713134765625, -6.588623046875, -6.2059326171875, -5.8232421875, -5.4405517578125, -5.057861328125, -4.6751708984375, -4.29248046875, -3.9097900390625, -3.527099609375, -3.1444091796875, -2.76171875, -2.3790283203125, -1.996337890625, -1.6136474609375, -1.23095703125, -0.8482666015625, -0.465576171875, -0.0828857421875, 0.2998046875, 0.6824951171875, 1.065185546875, 1.4478759765625, 1.83056640625, 2.2132568359375, 2.595947265625, 2.9786376953125, 3.361328125, 3.7440185546875, 4.126708984375, 4.5093994140625, 4.89208984375, 5.2747802734375, 5.657470703125, 6.0401611328125, 6.4228515625, 6.8055419921875, 7.188232421875, 7.5709228515625, 7.95361328125, 8.3363037109375, 8.718994140625, 9.1016845703125, 9.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 7.0, 11.0, 19.0, 28.0, 34.0, 45.0, 64.0, 94.0, 106.0, 157.0, 200.0, 247.0, 356.0, 386.0, 399.0, 394.0, 348.0, 259.0, 210.0, 156.0, 128.0, 85.0, 81.0, 52.0, 52.0, 26.0, 23.0, 17.0, 13.0, 14.0, 12.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.7734375, -13.3623046875, -12.951171875, -12.5400390625, -12.12890625, -11.7177734375, -11.306640625, -10.8955078125, -10.484375, -10.0732421875, -9.662109375, -9.2509765625, -8.83984375, -8.4287109375, -8.017578125, -7.6064453125, -7.1953125, -6.7841796875, -6.373046875, -5.9619140625, -5.55078125, -5.1396484375, -4.728515625, -4.3173828125, -3.90625, -3.4951171875, -3.083984375, -2.6728515625, -2.26171875, -1.8505859375, -1.439453125, -1.0283203125, -0.6171875, -0.2060546875, 0.205078125, 0.6162109375, 1.02734375, 1.4384765625, 1.849609375, 2.2607421875, 2.671875, 3.0830078125, 3.494140625, 3.9052734375, 4.31640625, 4.7275390625, 5.138671875, 5.5498046875, 5.9609375, 6.3720703125, 6.783203125, 7.1943359375, 7.60546875, 8.0166015625, 8.427734375, 8.8388671875, 9.25, 9.6611328125, 10.072265625, 10.4833984375, 10.89453125, 11.3056640625, 11.716796875, 12.1279296875, 12.5390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 11.0, 8.0, 13.0, 18.0, 31.0, 33.0, 40.0, 62.0, 76.0, 97.0, 144.0, 161.0, 237.0, 271.0, 422.0, 780.0, 2752.0, 53353.0, 3910958.0, 217038.0, 5122.0, 975.0, 446.0, 300.0, 230.0, 174.0, 135.0, 111.0, 65.0, 38.0, 46.0, 23.0, 25.0, 16.0, 11.0, 12.0, 10.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0625, -45.41943359375, -43.7763671875, -42.13330078125, -40.490234375, -38.84716796875, -37.2041015625, -35.56103515625, -33.91796875, -32.27490234375, -30.6318359375, -28.98876953125, -27.345703125, -25.70263671875, -24.0595703125, -22.41650390625, -20.7734375, -19.13037109375, -17.4873046875, -15.84423828125, -14.201171875, -12.55810546875, -10.9150390625, -9.27197265625, -7.62890625, -5.98583984375, -4.3427734375, -2.69970703125, -1.056640625, 0.58642578125, 2.2294921875, 3.87255859375, 5.515625, 7.15869140625, 8.8017578125, 10.44482421875, 12.087890625, 13.73095703125, 15.3740234375, 17.01708984375, 18.66015625, 20.30322265625, 21.9462890625, 23.58935546875, 25.232421875, 26.87548828125, 28.5185546875, 30.16162109375, 31.8046875, 33.44775390625, 35.0908203125, 36.73388671875, 38.376953125, 40.02001953125, 41.6630859375, 43.30615234375, 44.94921875, 46.59228515625, 48.2353515625, 49.87841796875, 51.521484375, 53.16455078125, 54.8076171875, 56.45068359375, 58.09375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 173.0, 743.0, 92.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.823184967041016, -42.15327453613281, -29.483366012573242, -16.813457489013672, -4.143547058105469, 8.526363372802734, 21.196269989013672, 33.86618423461914, 46.53609085083008, 59.20600128173828, 71.87590789794922, 84.54582214355469, 97.21572875976562, 109.88563537597656, 122.5555419921875, 135.2254638671875, 147.89537048339844, 160.56527709960938, 173.2351837158203, 185.90509033203125, 198.57501220703125, 211.2449188232422, 223.91482543945312, 236.58474731445312, 249.254638671875, 261.924560546875, 274.5944519042969, 287.2643737792969, 299.93426513671875, 312.60418701171875, 325.27410888671875, 337.9440002441406, 350.6139221191406, 363.2838439941406, 375.9537353515625, 388.6236572265625, 401.2935485839844, 413.9634704589844, 426.63336181640625, 439.30328369140625, 451.97320556640625, 464.64312744140625, 477.3130187988281, 489.9829406738281, 502.65283203125, 515.32275390625, 527.99267578125, 540.66259765625, 553.3324584960938, 566.0023803710938, 578.6723022460938, 591.3421630859375, 604.0120849609375, 616.6820068359375, 629.3519287109375, 642.0218505859375, 654.6917724609375, 667.3616943359375, 680.0316162109375, 692.7014770507812, 705.3713989257812, 718.0413208007812, 730.7112426757812, 743.3811645507812, 756.051025390625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 15.0, 15.0, 11.0, 20.0, 21.0, 31.0, 30.0, 29.0, 32.0, 44.0, 42.0, 39.0, 51.0, 52.0, 47.0, 46.0, 40.0, 43.0, 41.0, 34.0, 45.0, 45.0, 25.0, 30.0, 30.0, 28.0, 24.0, 18.0, 16.0, 10.0, 10.0, 5.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.80809020996094, -57.991485595703125, -56.17488098144531, -54.358272552490234, -52.54166793823242, -50.72506332397461, -48.90845489501953, -47.09185028076172, -45.275245666503906, -43.458641052246094, -41.64203643798828, -39.8254280090332, -38.00882339477539, -36.19221878051758, -34.3756103515625, -32.55900573730469, -30.742401123046875, -28.925796508789062, -27.109189987182617, -25.292583465576172, -23.47597885131836, -21.659374237060547, -19.8427677154541, -18.026161193847656, -16.209556579589844, -14.392951011657715, -12.576345443725586, -10.759739875793457, -8.943134307861328, -7.126528739929199, -5.30992317199707, -3.4933176040649414, -1.6767120361328125, 0.1398935317993164, 1.9564990997314453, 3.773104667663574, 5.589710235595703, 7.406315803527832, 9.222921371459961, 11.03952693939209, 12.856132507324219, 14.672738075256348, 16.489343643188477, 18.305950164794922, 20.122554779052734, 21.939159393310547, 23.755765914916992, 25.572372436523438, 27.38897705078125, 29.205581665039062, 31.022188186645508, 32.83879470825195, 34.655399322509766, 36.47200393676758, 38.288612365722656, 40.10521697998047, 41.92182159423828, 43.738426208496094, 45.555030822753906, 47.371639251708984, 49.1882438659668, 51.00484848022461, 52.82145690917969, 54.6380615234375, 56.45466613769531]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 4.0, 7.0, 8.0, 13.0, 15.0, 13.0, 17.0, 11.0, 13.0, 17.0, 28.0, 24.0, 23.0, 44.0, 38.0, 36.0, 43.0, 41.0, 53.0, 38.0, 41.0, 44.0, 48.0, 34.0, 38.0, 39.0, 32.0, 36.0, 20.0, 28.0, 19.0, 26.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.75, -7.50860595703125, -7.2672119140625, -7.02581787109375, -6.784423828125, -6.54302978515625, -6.3016357421875, -6.06024169921875, -5.81884765625, -5.57745361328125, -5.3360595703125, -5.09466552734375, -4.853271484375, -4.61187744140625, -4.3704833984375, -4.12908935546875, -3.8876953125, -3.64630126953125, -3.4049072265625, -3.16351318359375, -2.922119140625, -2.68072509765625, -2.4393310546875, -2.19793701171875, -1.95654296875, -1.71514892578125, -1.4737548828125, -1.23236083984375, -0.990966796875, -0.74957275390625, -0.5081787109375, -0.26678466796875, -0.025390625, 0.21600341796875, 0.4573974609375, 0.69879150390625, 0.940185546875, 1.18157958984375, 1.4229736328125, 1.66436767578125, 1.90576171875, 2.14715576171875, 2.3885498046875, 2.62994384765625, 2.871337890625, 3.11273193359375, 3.3541259765625, 3.59552001953125, 3.8369140625, 4.07830810546875, 4.3197021484375, 4.56109619140625, 4.802490234375, 5.04388427734375, 5.2852783203125, 5.52667236328125, 5.76806640625, 6.00946044921875, 6.2508544921875, 6.49224853515625, 6.733642578125, 6.97503662109375, 7.2164306640625, 7.45782470703125, 7.69921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 13.0, 19.0, 21.0, 34.0, 50.0, 66.0, 118.0, 155.0, 233.0, 303.0, 464.0, 660.0, 994.0, 1384.0, 2069.0, 2956.0, 4322.0, 6688.0, 9994.0, 15887.0, 25265.0, 42016.0, 74125.0, 143426.0, 266784.0, 204476.0, 100892.0, 55069.0, 32116.0, 20008.0, 12687.0, 8279.0, 5274.0, 3687.0, 2475.0, 1726.0, 1169.0, 805.0, 588.0, 374.0, 269.0, 181.0, 144.0, 91.0, 70.0, 33.0, 30.0, 25.0, 16.0, 7.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.115234375, -1.080108642578125, -1.04498291015625, -1.009857177734375, -0.9747314453125, -0.939605712890625, -0.90447998046875, -0.869354248046875, -0.834228515625, -0.799102783203125, -0.76397705078125, -0.728851318359375, -0.6937255859375, -0.658599853515625, -0.62347412109375, -0.588348388671875, -0.55322265625, -0.518096923828125, -0.48297119140625, -0.447845458984375, -0.4127197265625, -0.377593994140625, -0.34246826171875, -0.307342529296875, -0.272216796875, -0.237091064453125, -0.20196533203125, -0.166839599609375, -0.1317138671875, -0.096588134765625, -0.06146240234375, -0.026336669921875, 0.0087890625, 0.043914794921875, 0.07904052734375, 0.114166259765625, 0.1492919921875, 0.184417724609375, 0.21954345703125, 0.254669189453125, 0.289794921875, 0.324920654296875, 0.36004638671875, 0.395172119140625, 0.4302978515625, 0.465423583984375, 0.50054931640625, 0.535675048828125, 0.57080078125, 0.605926513671875, 0.64105224609375, 0.676177978515625, 0.7113037109375, 0.746429443359375, 0.78155517578125, 0.816680908203125, 0.851806640625, 0.886932373046875, 0.92205810546875, 0.957183837890625, 0.9923095703125, 1.027435302734375, 1.06256103515625, 1.097686767578125, 1.1328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 10.0, 11.0, 16.0, 16.0, 15.0, 19.0, 21.0, 24.0, 18.0, 28.0, 31.0, 26.0, 50.0, 41.0, 35.0, 40.0, 39.0, 36.0, 1064.0, 31.0, 41.0, 48.0, 33.0, 39.0, 37.0, 41.0, 38.0, 27.0, 21.0, 15.0, 15.0, 17.0, 13.0, 11.0, 4.0, 11.0, 8.0, 4.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.97265625, -4.82275390625, -4.6728515625, -4.52294921875, -4.373046875, -4.22314453125, -4.0732421875, -3.92333984375, -3.7734375, -3.62353515625, -3.4736328125, -3.32373046875, -3.173828125, -3.02392578125, -2.8740234375, -2.72412109375, -2.57421875, -2.42431640625, -2.2744140625, -2.12451171875, -1.974609375, -1.82470703125, -1.6748046875, -1.52490234375, -1.375, -1.22509765625, -1.0751953125, -0.92529296875, -0.775390625, -0.62548828125, -0.4755859375, -0.32568359375, -0.17578125, -0.02587890625, 0.1240234375, 0.27392578125, 0.423828125, 0.57373046875, 0.7236328125, 0.87353515625, 1.0234375, 1.17333984375, 1.3232421875, 1.47314453125, 1.623046875, 1.77294921875, 1.9228515625, 2.07275390625, 2.22265625, 2.37255859375, 2.5224609375, 2.67236328125, 2.822265625, 2.97216796875, 3.1220703125, 3.27197265625, 3.421875, 3.57177734375, 3.7216796875, 3.87158203125, 4.021484375, 4.17138671875, 4.3212890625, 4.47119140625, 4.62109375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 18.0, 20.0, 36.0, 56.0, 68.0, 117.0, 138.0, 266.0, 379.0, 612.0, 1018.0, 1557.0, 2405.0, 3801.0, 6508.0, 10768.0, 18568.0, 32343.0, 59257.0, 118052.0, 277278.0, 1292873.0, 126337.0, 62376.0, 34104.0, 19453.0, 11096.0, 6625.0, 3967.0, 2539.0, 1615.0, 972.0, 662.0, 403.0, 292.0, 156.0, 98.0, 61.0, 67.0, 40.0, 27.0, 17.0, 16.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1728515625, -1.1362457275390625, -1.099639892578125, -1.0630340576171875, -1.02642822265625, -0.9898223876953125, -0.953216552734375, -0.9166107177734375, -0.8800048828125, -0.8433990478515625, -0.806793212890625, -0.7701873779296875, -0.73358154296875, -0.6969757080078125, -0.660369873046875, -0.6237640380859375, -0.587158203125, -0.5505523681640625, -0.513946533203125, -0.4773406982421875, -0.44073486328125, -0.4041290283203125, -0.367523193359375, -0.3309173583984375, -0.2943115234375, -0.2577056884765625, -0.221099853515625, -0.1844940185546875, -0.14788818359375, -0.1112823486328125, -0.074676513671875, -0.0380706787109375, -0.00146484375, 0.0351409912109375, 0.071746826171875, 0.1083526611328125, 0.14495849609375, 0.1815643310546875, 0.218170166015625, 0.2547760009765625, 0.2913818359375, 0.3279876708984375, 0.364593505859375, 0.4011993408203125, 0.43780517578125, 0.4744110107421875, 0.511016845703125, 0.5476226806640625, 0.584228515625, 0.6208343505859375, 0.657440185546875, 0.6940460205078125, 0.73065185546875, 0.7672576904296875, 0.803863525390625, 0.8404693603515625, 0.8770751953125, 0.9136810302734375, 0.950286865234375, 0.9868927001953125, 1.02349853515625, 1.0601043701171875, 1.096710205078125, 1.1333160400390625, 1.169921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 0.0, 1.0, 3.0, 5.0, 7.0, 10.0, 11.0, 10.0, 20.0, 20.0, 32.0, 43.0, 39.0, 45.0, 59.0, 55.0, 53.0, 69.0, 59.0, 65.0, 87.0, 56.0, 47.0, 40.0, 27.0, 30.0, 21.0, 15.0, 16.0, 13.0, 4.0, 6.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.003643035888671875, -0.0035384297370910645, -0.003433823585510254, -0.0033292174339294434, -0.003224611282348633, -0.0031200051307678223, -0.0030153989791870117, -0.002910792827606201, -0.0028061866760253906, -0.00270158052444458, -0.0025969743728637695, -0.002492368221282959, -0.0023877620697021484, -0.002283155918121338, -0.0021785497665405273, -0.002073943614959717, -0.0019693374633789062, -0.0018647313117980957, -0.0017601251602172852, -0.0016555190086364746, -0.001550912857055664, -0.0014463067054748535, -0.001341700553894043, -0.0012370944023132324, -0.0011324882507324219, -0.0010278820991516113, -0.0009232759475708008, -0.0008186697959899902, -0.0007140636444091797, -0.0006094574928283691, -0.0005048513412475586, -0.00040024518966674805, -0.0002956390380859375, -0.00019103288650512695, -8.64267349243164e-05, 1.817941665649414e-05, 0.0001227855682373047, 0.00022739171981811523, 0.0003319978713989258, 0.00043660402297973633, 0.0005412101745605469, 0.0006458163261413574, 0.000750422477722168, 0.0008550286293029785, 0.0009596347808837891, 0.0010642409324645996, 0.0011688470840454102, 0.0012734532356262207, 0.0013780593872070312, 0.0014826655387878418, 0.0015872716903686523, 0.0016918778419494629, 0.0017964839935302734, 0.001901090145111084, 0.0020056962966918945, 0.002110302448272705, 0.0022149085998535156, 0.002319514751434326, 0.0024241209030151367, 0.0025287270545959473, 0.002633333206176758, 0.0027379393577575684, 0.002842545509338379, 0.0029471516609191895, 0.0030517578125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 8.0, 11.0, 8.0, 21.0, 23.0, 37.0, 40.0, 62.0, 103.0, 143.0, 275.0, 794.0, 253642.0, 791733.0, 828.0, 308.0, 159.0, 84.0, 64.0, 59.0, 25.0, 35.0, 14.0, 18.0, 9.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07637882232666016, -0.07365608215332031, -0.07093334197998047, -0.06821060180664062, -0.06548786163330078, -0.06276512145996094, -0.060042381286621094, -0.05731964111328125, -0.054596900939941406, -0.05187416076660156, -0.04915142059326172, -0.046428680419921875, -0.04370594024658203, -0.04098320007324219, -0.038260459899902344, -0.0355377197265625, -0.032814979553222656, -0.030092239379882812, -0.02736949920654297, -0.024646759033203125, -0.02192401885986328, -0.019201278686523438, -0.016478538513183594, -0.01375579833984375, -0.011033058166503906, -0.008310317993164062, -0.005587577819824219, -0.002864837646484375, -0.00014209747314453125, 0.0025806427001953125, 0.005303382873535156, 0.008026123046875, 0.010748863220214844, 0.013471603393554688, 0.01619434356689453, 0.018917083740234375, 0.02163982391357422, 0.024362564086914062, 0.027085304260253906, 0.02980804443359375, 0.032530784606933594, 0.03525352478027344, 0.03797626495361328, 0.040699005126953125, 0.04342174530029297, 0.04614448547363281, 0.048867225646972656, 0.0515899658203125, 0.054312705993652344, 0.05703544616699219, 0.05975818634033203, 0.062480926513671875, 0.06520366668701172, 0.06792640686035156, 0.0706491470336914, 0.07337188720703125, 0.0760946273803711, 0.07881736755371094, 0.08154010772705078, 0.08426284790039062, 0.08698558807373047, 0.08970832824707031, 0.09243106842041016, 0.09515380859375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 27.0, 173.0, 510.0, 251.0, 42.0, 9.0, 0.0, 1.0], "bins": [-0.011518800631165504, -0.011322228237986565, -0.0111256567761302, -0.010929085314273834, -0.010732512921094894, -0.010535940527915955, -0.01033936906605959, -0.010142797604203224, -0.009946225211024284, -0.009749652817845345, -0.00955308135598898, -0.009356509894132614, -0.009159937500953674, -0.008963365107774734, -0.00876679364591837, -0.008570222184062004, -0.008373649790883064, -0.008177077397704124, -0.00798050593584776, -0.007783934008330107, -0.007587362080812454, -0.007390790153294802, -0.007194218225777149, -0.006997646298259497, -0.006801074370741844, -0.006604502443224192, -0.006407930515706539, -0.006211358588188887, -0.006014786660671234, -0.005818214733153582, -0.005621642805635929, -0.005425070878118277, -0.005228498950600624, -0.005031927023082972, -0.004835355095565319, -0.0046387831680476665, -0.004442211240530014, -0.0042456393130123615, -0.004049067385494709, -0.0038524954579770565, -0.0036559232976287603, -0.003459351370111108, -0.0032627794425934553, -0.003066207515075803, -0.0028696355875581503, -0.0026730636600404978, -0.0024764917325228453, -0.0022799198050051928, -0.0020833478774875402, -0.0018867759499698877, -0.0016902040224522352, -0.0014936320949345827, -0.0012970601674169302, -0.0011004882398992777, -0.0009039163123816252, -0.0007073443848639727, -0.0005107724573463202, -0.00031420052982866764, -0.00011762860231101513, 7.894332520663738e-05, 0.0002755152527242899, 0.0004720871802419424, 0.0006686591077595949, 0.0008652310352772474, 0.0010618029627949]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 6.0, 12.0, 15.0, 16.0, 16.0, 17.0, 18.0, 15.0, 19.0, 26.0, 27.0, 39.0, 47.0, 24.0, 37.0, 38.0, 44.0, 35.0, 45.0, 54.0, 47.0, 38.0, 38.0, 41.0, 29.0, 40.0, 25.0, 28.0, 22.0, 19.0, 18.0, 12.0, 12.0, 12.0, 8.0, 11.0, 4.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0017020702362060547, -0.001650598831474781, -0.0015991274267435074, -0.0015476560220122337, -0.00149618461728096, -0.0014447132125496864, -0.0013932418078184128, -0.0013417704030871391, -0.0012902989983558655, -0.0012388275936245918, -0.0011873561888933182, -0.0011358847841620445, -0.0010844133794307709, -0.0010329419746994972, -0.0009814705699682236, -0.0009299991652369499, -0.0008785277605056763, -0.0008270563557744026, -0.000775584951043129, -0.0007241135463118553, -0.0006726421415805817, -0.000621170736849308, -0.0005696993321180344, -0.0005182279273867607, -0.00046675652265548706, -0.0004152851179242134, -0.00036381371319293976, -0.0003123423084616661, -0.00026087090373039246, -0.0002093994989991188, -0.00015792809426784515, -0.0001064566895365715, -5.498528480529785e-05, -3.5138800740242004e-06, 4.795752465724945e-05, 9.94289293885231e-05, 0.00015090033411979675, 0.0002023717388510704, 0.00025384314358234406, 0.0003053145483136177, 0.00035678595304489136, 0.000408257357776165, 0.00045972876250743866, 0.0005112001672387123, 0.000562671571969986, 0.0006141429767012596, 0.0006656143814325333, 0.0007170857861638069, 0.0007685571908950806, 0.0008200285956263542, 0.0008715000003576279, 0.0009229714050889015, 0.0009744428098201752, 0.0010259142145514488, 0.0010773856192827225, 0.0011288570240139961, 0.0011803284287452698, 0.0012317998334765434, 0.001283271238207817, 0.0013347426429390907, 0.0013862140476703644, 0.001437685452401638, 0.0014891568571329117, 0.0015406282618641853, 0.001592099666595459]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 4.0, 7.0, 8.0, 13.0, 15.0, 14.0, 16.0, 11.0, 13.0, 17.0, 28.0, 24.0, 23.0, 44.0, 38.0, 36.0, 43.0, 41.0, 53.0, 39.0, 40.0, 44.0, 48.0, 34.0, 38.0, 39.0, 32.0, 36.0, 20.0, 28.0, 19.0, 26.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.75, -7.50860595703125, -7.2672119140625, -7.02581787109375, -6.784423828125, -6.54302978515625, -6.3016357421875, -6.06024169921875, -5.81884765625, -5.57745361328125, -5.3360595703125, -5.09466552734375, -4.853271484375, -4.61187744140625, -4.3704833984375, -4.12908935546875, -3.8876953125, -3.64630126953125, -3.4049072265625, -3.16351318359375, -2.922119140625, -2.68072509765625, -2.4393310546875, -2.19793701171875, -1.95654296875, -1.71514892578125, -1.4737548828125, -1.23236083984375, -0.990966796875, -0.74957275390625, -0.5081787109375, -0.26678466796875, -0.025390625, 0.21600341796875, 0.4573974609375, 0.69879150390625, 0.940185546875, 1.18157958984375, 1.4229736328125, 1.66436767578125, 1.90576171875, 2.14715576171875, 2.3885498046875, 2.62994384765625, 2.871337890625, 3.11273193359375, 3.3541259765625, 3.59552001953125, 3.8369140625, 4.07830810546875, 4.3197021484375, 4.56109619140625, 4.802490234375, 5.04388427734375, 5.2852783203125, 5.52667236328125, 5.76806640625, 6.00946044921875, 6.2508544921875, 6.49224853515625, 6.733642578125, 6.97503662109375, 7.2164306640625, 7.45782470703125, 7.69921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 6.0, 6.0, 9.0, 17.0, 22.0, 26.0, 33.0, 60.0, 64.0, 123.0, 207.0, 326.0, 563.0, 1064.0, 1966.0, 4034.0, 8334.0, 18161.0, 43248.0, 119212.0, 364917.0, 315935.0, 101540.0, 37663.0, 15746.0, 7390.0, 3626.0, 1848.0, 1048.0, 533.0, 315.0, 168.0, 105.0, 64.0, 49.0, 31.0, 26.0, 15.0, 9.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.57421875, -6.3682861328125, -6.162353515625, -5.9564208984375, -5.75048828125, -5.5445556640625, -5.338623046875, -5.1326904296875, -4.9267578125, -4.7208251953125, -4.514892578125, -4.3089599609375, -4.10302734375, -3.8970947265625, -3.691162109375, -3.4852294921875, -3.279296875, -3.0733642578125, -2.867431640625, -2.6614990234375, -2.45556640625, -2.2496337890625, -2.043701171875, -1.8377685546875, -1.6318359375, -1.4259033203125, -1.219970703125, -1.0140380859375, -0.80810546875, -0.6021728515625, -0.396240234375, -0.1903076171875, 0.015625, 0.2215576171875, 0.427490234375, 0.6334228515625, 0.83935546875, 1.0452880859375, 1.251220703125, 1.4571533203125, 1.6630859375, 1.8690185546875, 2.074951171875, 2.2808837890625, 2.48681640625, 2.6927490234375, 2.898681640625, 3.1046142578125, 3.310546875, 3.5164794921875, 3.722412109375, 3.9283447265625, 4.13427734375, 4.3402099609375, 4.546142578125, 4.7520751953125, 4.9580078125, 5.1639404296875, 5.369873046875, 5.5758056640625, 5.78173828125, 5.9876708984375, 6.193603515625, 6.3995361328125, 6.60546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 7.0, 25.0, 12.0, 12.0, 20.0, 27.0, 29.0, 25.0, 26.0, 24.0, 40.0, 36.0, 53.0, 90.0, 143.0, 1417.0, 408.0, 139.0, 62.0, 49.0, 45.0, 27.0, 24.0, 27.0, 33.0, 26.0, 26.0, 26.0, 17.0, 17.0, 21.0, 10.0, 9.0, 4.0, 10.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.215576171875, -17.54052734375, -16.865478515625, -16.1904296875, -15.515380859375, -14.84033203125, -14.165283203125, -13.490234375, -12.815185546875, -12.14013671875, -11.465087890625, -10.7900390625, -10.114990234375, -9.43994140625, -8.764892578125, -8.08984375, -7.414794921875, -6.73974609375, -6.064697265625, -5.3896484375, -4.714599609375, -4.03955078125, -3.364501953125, -2.689453125, -2.014404296875, -1.33935546875, -0.664306640625, 0.0107421875, 0.685791015625, 1.36083984375, 2.035888671875, 2.7109375, 3.385986328125, 4.06103515625, 4.736083984375, 5.4111328125, 6.086181640625, 6.76123046875, 7.436279296875, 8.111328125, 8.786376953125, 9.46142578125, 10.136474609375, 10.8115234375, 11.486572265625, 12.16162109375, 12.836669921875, 13.51171875, 14.186767578125, 14.86181640625, 15.536865234375, 16.2119140625, 16.886962890625, 17.56201171875, 18.237060546875, 18.912109375, 19.587158203125, 20.26220703125, 20.937255859375, 21.6123046875, 22.287353515625, 22.96240234375, 23.637451171875, 24.3125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 4.0, 8.0, 9.0, 11.0, 6.0, 10.0, 20.0, 34.0, 26.0, 34.0, 64.0, 64.0, 64.0, 98.0, 130.0, 177.0, 231.0, 374.0, 832.0, 5084.0, 469958.0, 2654442.0, 11340.0, 1145.0, 444.0, 237.0, 192.0, 153.0, 103.0, 69.0, 73.0, 47.0, 48.0, 32.0, 34.0, 22.0, 17.0, 12.0, 15.0, 9.0, 7.0, 6.0, 0.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.125, -39.9541015625, -38.783203125, -37.6123046875, -36.44140625, -35.2705078125, -34.099609375, -32.9287109375, -31.7578125, -30.5869140625, -29.416015625, -28.2451171875, -27.07421875, -25.9033203125, -24.732421875, -23.5615234375, -22.390625, -21.2197265625, -20.048828125, -18.8779296875, -17.70703125, -16.5361328125, -15.365234375, -14.1943359375, -13.0234375, -11.8525390625, -10.681640625, -9.5107421875, -8.33984375, -7.1689453125, -5.998046875, -4.8271484375, -3.65625, -2.4853515625, -1.314453125, -0.1435546875, 1.02734375, 2.1982421875, 3.369140625, 4.5400390625, 5.7109375, 6.8818359375, 8.052734375, 9.2236328125, 10.39453125, 11.5654296875, 12.736328125, 13.9072265625, 15.078125, 16.2490234375, 17.419921875, 18.5908203125, 19.76171875, 20.9326171875, 22.103515625, 23.2744140625, 24.4453125, 25.6162109375, 26.787109375, 27.9580078125, 29.12890625, 30.2998046875, 31.470703125, 32.6416015625, 33.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 24.0, 114.0, 304.0, 347.0, 165.0, 47.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.7906265258789, -66.8886947631836, -64.98677062988281, -63.0848388671875, -61.18291091918945, -59.280982971191406, -57.379051208496094, -55.47712326049805, -53.5751953125, -51.67326736450195, -49.77133560180664, -47.869407653808594, -45.96747970581055, -44.0655517578125, -42.16361999511719, -40.26169204711914, -38.35976028442383, -36.45783233642578, -34.55590057373047, -32.65397262573242, -30.752044677734375, -28.850114822387695, -26.948184967041016, -25.04625701904297, -23.14432716369629, -21.24239730834961, -19.340469360351562, -17.438539505004883, -15.53661060333252, -13.634681701660156, -11.732751846313477, -9.830822944641113, -7.928897857666016, -6.026968955993652, -4.125039577484131, -2.2231101989746094, -0.3211812973022461, 1.5807476043701172, 3.482677459716797, 5.38460636138916, 7.286535263061523, 9.188464164733887, 11.09039306640625, 12.99232292175293, 14.894251823425293, 16.796180725097656, 18.698110580444336, 20.600040435791016, 22.501968383789062, 24.403898239135742, 26.30582618713379, 28.20775604248047, 30.109683990478516, 32.01161193847656, 33.913543701171875, 35.81547164916992, 37.71739959716797, 39.619327545166016, 41.52125930786133, 43.423187255859375, 45.32511520385742, 47.22704315185547, 49.12897491455078, 51.03090286254883, 52.93283462524414]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 10.0, 11.0, 10.0, 15.0, 18.0, 19.0, 16.0, 18.0, 23.0, 24.0, 35.0, 20.0, 46.0, 49.0, 34.0, 40.0, 50.0, 39.0, 38.0, 43.0, 44.0, 36.0, 48.0, 28.0, 27.0, 30.0, 25.0, 30.0, 21.0, 20.0, 24.0, 15.0, 17.0, 10.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-52.45960998535156, -50.79045104980469, -49.12128829956055, -47.45212936401367, -45.78296661376953, -44.113807678222656, -42.444644927978516, -40.77548599243164, -39.1063232421875, -37.437164306640625, -35.768001556396484, -34.09884262084961, -32.42967987060547, -30.760520935058594, -29.091358184814453, -27.422199249267578, -25.75303840637207, -24.083877563476562, -22.414716720581055, -20.745555877685547, -19.07639503479004, -17.40723419189453, -15.73807430267334, -14.068913459777832, -12.399752616882324, -10.730591773986816, -9.061430931091309, -7.392270565032959, -5.723109722137451, -4.053949356079102, -2.3847885131835938, -0.7156276702880859, 0.9535331726074219, 2.6226940155029297, 4.2918548583984375, 5.961015224456787, 7.630176067352295, 9.299336433410645, 10.968497276306152, 12.63765811920166, 14.306818962097168, 15.975979804992676, 17.645139694213867, 19.314300537109375, 20.983461380004883, 22.65262222290039, 24.3217830657959, 25.990943908691406, 27.660104751586914, 29.329265594482422, 30.99842643737793, 32.66758728027344, 34.33674621582031, 36.00590896606445, 37.67506790161133, 39.34423065185547, 41.013389587402344, 42.68254852294922, 44.35171127319336, 46.020870208740234, 47.690032958984375, 49.35919189453125, 51.02835464477539, 52.697513580322266, 54.366676330566406]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 2.0, 2.0, 5.0, 7.0, 11.0, 5.0, 16.0, 15.0, 14.0, 12.0, 13.0, 18.0, 26.0, 25.0, 32.0, 37.0, 37.0, 41.0, 41.0, 37.0, 49.0, 37.0, 43.0, 49.0, 46.0, 39.0, 50.0, 31.0, 26.0, 41.0, 26.0, 24.0, 19.0, 23.0, 18.0, 18.0, 12.0, 15.0, 7.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.140625, -7.888916015625, -7.63720703125, -7.385498046875, -7.1337890625, -6.882080078125, -6.63037109375, -6.378662109375, -6.126953125, -5.875244140625, -5.62353515625, -5.371826171875, -5.1201171875, -4.868408203125, -4.61669921875, -4.364990234375, -4.11328125, -3.861572265625, -3.60986328125, -3.358154296875, -3.1064453125, -2.854736328125, -2.60302734375, -2.351318359375, -2.099609375, -1.847900390625, -1.59619140625, -1.344482421875, -1.0927734375, -0.841064453125, -0.58935546875, -0.337646484375, -0.0859375, 0.165771484375, 0.41748046875, 0.669189453125, 0.9208984375, 1.172607421875, 1.42431640625, 1.676025390625, 1.927734375, 2.179443359375, 2.43115234375, 2.682861328125, 2.9345703125, 3.186279296875, 3.43798828125, 3.689697265625, 3.94140625, 4.193115234375, 4.44482421875, 4.696533203125, 4.9482421875, 5.199951171875, 5.45166015625, 5.703369140625, 5.955078125, 6.206787109375, 6.45849609375, 6.710205078125, 6.9619140625, 7.213623046875, 7.46533203125, 7.717041015625, 7.96875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 10.0, 11.0, 11.0, 15.0, 22.0, 19.0, 25.0, 35.0, 45.0, 55.0, 78.0, 114.0, 205.0, 397.0, 1302.0, 7260.0, 119773.0, 3114780.0, 920951.0, 24663.0, 3005.0, 664.0, 244.0, 146.0, 114.0, 72.0, 53.0, 29.0, 30.0, 26.0, 22.0, 13.0, 21.0, 11.0, 17.0, 3.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.515625, -28.690185546875, -27.86474609375, -27.039306640625, -26.2138671875, -25.388427734375, -24.56298828125, -23.737548828125, -22.912109375, -22.086669921875, -21.26123046875, -20.435791015625, -19.6103515625, -18.784912109375, -17.95947265625, -17.134033203125, -16.30859375, -15.483154296875, -14.65771484375, -13.832275390625, -13.0068359375, -12.181396484375, -11.35595703125, -10.530517578125, -9.705078125, -8.879638671875, -8.05419921875, -7.228759765625, -6.4033203125, -5.577880859375, -4.75244140625, -3.927001953125, -3.1015625, -2.276123046875, -1.45068359375, -0.625244140625, 0.2001953125, 1.025634765625, 1.85107421875, 2.676513671875, 3.501953125, 4.327392578125, 5.15283203125, 5.978271484375, 6.8037109375, 7.629150390625, 8.45458984375, 9.280029296875, 10.10546875, 10.930908203125, 11.75634765625, 12.581787109375, 13.4072265625, 14.232666015625, 15.05810546875, 15.883544921875, 16.708984375, 17.534423828125, 18.35986328125, 19.185302734375, 20.0107421875, 20.836181640625, 21.66162109375, 22.487060546875, 23.3125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 12.0, 10.0, 5.0, 12.0, 19.0, 26.0, 34.0, 43.0, 64.0, 59.0, 114.0, 123.0, 162.0, 204.0, 301.0, 359.0, 422.0, 469.0, 388.0, 313.0, 232.0, 160.0, 133.0, 93.0, 82.0, 63.0, 42.0, 40.0, 24.0, 18.0, 17.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.606201171875, -13.22021484375, -12.834228515625, -12.4482421875, -12.062255859375, -11.67626953125, -11.290283203125, -10.904296875, -10.518310546875, -10.13232421875, -9.746337890625, -9.3603515625, -8.974365234375, -8.58837890625, -8.202392578125, -7.81640625, -7.430419921875, -7.04443359375, -6.658447265625, -6.2724609375, -5.886474609375, -5.50048828125, -5.114501953125, -4.728515625, -4.342529296875, -3.95654296875, -3.570556640625, -3.1845703125, -2.798583984375, -2.41259765625, -2.026611328125, -1.640625, -1.254638671875, -0.86865234375, -0.482666015625, -0.0966796875, 0.289306640625, 0.67529296875, 1.061279296875, 1.447265625, 1.833251953125, 2.21923828125, 2.605224609375, 2.9912109375, 3.377197265625, 3.76318359375, 4.149169921875, 4.53515625, 4.921142578125, 5.30712890625, 5.693115234375, 6.0791015625, 6.465087890625, 6.85107421875, 7.237060546875, 7.623046875, 8.009033203125, 8.39501953125, 8.781005859375, 9.1669921875, 9.552978515625, 9.93896484375, 10.324951171875, 10.7109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 10.0, 8.0, 6.0, 8.0, 11.0, 17.0, 26.0, 26.0, 36.0, 41.0, 49.0, 71.0, 92.0, 138.0, 138.0, 173.0, 242.0, 385.0, 1000.0, 7441.0, 393235.0, 3746969.0, 39697.0, 2419.0, 645.0, 341.0, 218.0, 209.0, 130.0, 113.0, 78.0, 60.0, 55.0, 47.0, 35.0, 32.0, 24.0, 13.0, 8.0, 11.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-55.6875, -54.06201171875, -52.4365234375, -50.81103515625, -49.185546875, -47.56005859375, -45.9345703125, -44.30908203125, -42.68359375, -41.05810546875, -39.4326171875, -37.80712890625, -36.181640625, -34.55615234375, -32.9306640625, -31.30517578125, -29.6796875, -28.05419921875, -26.4287109375, -24.80322265625, -23.177734375, -21.55224609375, -19.9267578125, -18.30126953125, -16.67578125, -15.05029296875, -13.4248046875, -11.79931640625, -10.173828125, -8.54833984375, -6.9228515625, -5.29736328125, -3.671875, -2.04638671875, -0.4208984375, 1.20458984375, 2.830078125, 4.45556640625, 6.0810546875, 7.70654296875, 9.33203125, 10.95751953125, 12.5830078125, 14.20849609375, 15.833984375, 17.45947265625, 19.0849609375, 20.71044921875, 22.3359375, 23.96142578125, 25.5869140625, 27.21240234375, 28.837890625, 30.46337890625, 32.0888671875, 33.71435546875, 35.33984375, 36.96533203125, 38.5908203125, 40.21630859375, 41.841796875, 43.46728515625, 45.0927734375, 46.71826171875, 48.34375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 17.0, 241.0, 518.0, 201.0, 39.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.95737838745117, -31.95941734313965, -24.961456298828125, -17.9634952545166, -10.965534210205078, -3.967571258544922, 3.0303878784179688, 10.02834701538086, 17.026309967041016, 24.02427101135254, 31.022232055664062, 38.02019500732422, 45.01815414428711, 52.016117095947266, 59.014076232910156, 66.01203918457031, 73.00999450683594, 80.0079574584961, 87.00592041015625, 94.00387573242188, 101.00183868408203, 107.99980163574219, 114.99775695800781, 121.99571990966797, 128.99368286132812, 135.99163818359375, 142.98960876464844, 149.98756408691406, 156.98553466796875, 163.98348999023438, 170.9814453125, 177.97940063476562, 184.97738647460938, 191.975341796875, 198.9733123779297, 205.9712677001953, 212.96923828125, 219.96719360351562, 226.96514892578125, 233.96310424804688, 240.96107482910156, 247.9590301513672, 254.95700073242188, 261.9549560546875, 268.9529113769531, 275.95086669921875, 282.9488525390625, 289.9468078613281, 296.94476318359375, 303.9427185058594, 310.940673828125, 317.93865966796875, 324.9366149902344, 331.9345703125, 338.9325256347656, 345.93048095703125, 352.928466796875, 359.9264221191406, 366.92437744140625, 373.92236328125, 380.9203186035156, 387.91827392578125, 394.9162292480469, 401.9141845703125, 408.9121398925781]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 8.0, 6.0, 6.0, 12.0, 15.0, 17.0, 23.0, 22.0, 23.0, 22.0, 22.0, 30.0, 32.0, 43.0, 33.0, 35.0, 36.0, 37.0, 41.0, 40.0, 51.0, 48.0, 37.0, 49.0, 47.0, 31.0, 38.0, 17.0, 31.0, 16.0, 23.0, 17.0, 19.0, 13.0, 9.0, 11.0, 4.0, 5.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.64849853515625, -44.292381286621094, -42.9362678527832, -41.58015060424805, -40.224037170410156, -38.867919921875, -37.511802673339844, -36.15568542480469, -34.7995719909668, -33.44345474243164, -32.08734130859375, -30.731224060058594, -29.37510871887207, -28.018993377685547, -26.66287612915039, -25.306760787963867, -23.950645446777344, -22.59453010559082, -21.238414764404297, -19.88229751586914, -18.526182174682617, -17.170066833496094, -15.813950538635254, -14.457834243774414, -13.10171890258789, -11.745603561401367, -10.389487266540527, -9.033370971679688, -7.677255630493164, -6.321139812469482, -4.965023994445801, -3.608907699584961, -2.2527923583984375, -0.8966765403747559, 0.4594392776489258, 1.8155550956726074, 3.171670913696289, 4.527786731719971, 5.883902549743652, 7.240018844604492, 8.596134185791016, 9.952249526977539, 11.308365821838379, 12.664482116699219, 14.020597457885742, 15.376712799072266, 16.732830047607422, 18.088945388793945, 19.44506072998047, 20.801176071166992, 22.157291412353516, 23.513408660888672, 24.869524002075195, 26.22563934326172, 27.581756591796875, 28.9378719329834, 30.293987274169922, 31.650102615356445, 33.00621795654297, 34.362335205078125, 35.71845245361328, 37.07456588745117, 38.43068313598633, 39.78679656982422, 41.142913818359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 10.0, 11.0, 17.0, 15.0, 17.0, 19.0, 27.0, 20.0, 28.0, 26.0, 35.0, 37.0, 29.0, 30.0, 39.0, 40.0, 40.0, 43.0, 35.0, 35.0, 39.0, 36.0, 32.0, 24.0, 26.0, 29.0, 32.0, 27.0, 23.0, 17.0, 23.0, 17.0, 16.0, 12.0, 13.0, 9.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.48828125, -7.265625, -7.04296875, -6.8203125, -6.59765625, -6.375, -6.15234375, -5.9296875, -5.70703125, -5.484375, -5.26171875, -5.0390625, -4.81640625, -4.59375, -4.37109375, -4.1484375, -3.92578125, -3.703125, -3.48046875, -3.2578125, -3.03515625, -2.8125, -2.58984375, -2.3671875, -2.14453125, -1.921875, -1.69921875, -1.4765625, -1.25390625, -1.03125, -0.80859375, -0.5859375, -0.36328125, -0.140625, 0.08203125, 0.3046875, 0.52734375, 0.75, 0.97265625, 1.1953125, 1.41796875, 1.640625, 1.86328125, 2.0859375, 2.30859375, 2.53125, 2.75390625, 2.9765625, 3.19921875, 3.421875, 3.64453125, 3.8671875, 4.08984375, 4.3125, 4.53515625, 4.7578125, 4.98046875, 5.203125, 5.42578125, 5.6484375, 5.87109375, 6.09375, 6.31640625, 6.5390625, 6.76171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 4.0, 22.0, 22.0, 39.0, 53.0, 64.0, 100.0, 139.0, 213.0, 279.0, 470.0, 655.0, 934.0, 1448.0, 2078.0, 3140.0, 4640.0, 7079.0, 10848.0, 16367.0, 25154.0, 40267.0, 67113.0, 121059.0, 218376.0, 220528.0, 123285.0, 68822.0, 41265.0, 25469.0, 16273.0, 10518.0, 7197.0, 4701.0, 3142.0, 2158.0, 1495.0, 975.0, 699.0, 459.0, 322.0, 216.0, 152.0, 101.0, 67.0, 48.0, 35.0, 25.0, 11.0, 10.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0595703125, -1.0264739990234375, -0.993377685546875, -0.9602813720703125, -0.92718505859375, -0.8940887451171875, -0.860992431640625, -0.8278961181640625, -0.7947998046875, -0.7617034912109375, -0.728607177734375, -0.6955108642578125, -0.66241455078125, -0.6293182373046875, -0.596221923828125, -0.5631256103515625, -0.530029296875, -0.4969329833984375, -0.463836669921875, -0.4307403564453125, -0.39764404296875, -0.3645477294921875, -0.331451416015625, -0.2983551025390625, -0.2652587890625, -0.2321624755859375, -0.199066162109375, -0.1659698486328125, -0.13287353515625, -0.0997772216796875, -0.066680908203125, -0.0335845947265625, -0.00048828125, 0.0326080322265625, 0.065704345703125, 0.0988006591796875, 0.13189697265625, 0.1649932861328125, 0.198089599609375, 0.2311859130859375, 0.2642822265625, 0.2973785400390625, 0.330474853515625, 0.3635711669921875, 0.39666748046875, 0.4297637939453125, 0.462860107421875, 0.4959564208984375, 0.529052734375, 0.5621490478515625, 0.595245361328125, 0.6283416748046875, 0.66143798828125, 0.6945343017578125, 0.727630615234375, 0.7607269287109375, 0.7938232421875, 0.8269195556640625, 0.860015869140625, 0.8931121826171875, 0.92620849609375, 0.9593048095703125, 0.992401123046875, 1.0254974365234375, 1.05859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 12.0, 11.0, 7.0, 15.0, 17.0, 16.0, 23.0, 24.0, 29.0, 33.0, 26.0, 25.0, 27.0, 31.0, 43.0, 26.0, 47.0, 45.0, 1059.0, 42.0, 41.0, 35.0, 40.0, 36.0, 38.0, 31.0, 37.0, 34.0, 25.0, 24.0, 12.0, 21.0, 20.0, 13.0, 9.0, 11.0, 5.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.20703125, -5.0574951171875, -4.907958984375, -4.7584228515625, -4.60888671875, -4.4593505859375, -4.309814453125, -4.1602783203125, -4.0107421875, -3.8612060546875, -3.711669921875, -3.5621337890625, -3.41259765625, -3.2630615234375, -3.113525390625, -2.9639892578125, -2.814453125, -2.6649169921875, -2.515380859375, -2.3658447265625, -2.21630859375, -2.0667724609375, -1.917236328125, -1.7677001953125, -1.6181640625, -1.4686279296875, -1.319091796875, -1.1695556640625, -1.02001953125, -0.8704833984375, -0.720947265625, -0.5714111328125, -0.421875, -0.2723388671875, -0.122802734375, 0.0267333984375, 0.17626953125, 0.3258056640625, 0.475341796875, 0.6248779296875, 0.7744140625, 0.9239501953125, 1.073486328125, 1.2230224609375, 1.37255859375, 1.5220947265625, 1.671630859375, 1.8211669921875, 1.970703125, 2.1202392578125, 2.269775390625, 2.4193115234375, 2.56884765625, 2.7183837890625, 2.867919921875, 3.0174560546875, 3.1669921875, 3.3165283203125, 3.466064453125, 3.6156005859375, 3.76513671875, 3.9146728515625, 4.064208984375, 4.2137451171875, 4.36328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 14.0, 18.0, 18.0, 28.0, 63.0, 78.0, 110.0, 153.0, 238.0, 375.0, 539.0, 840.0, 1162.0, 1762.0, 2630.0, 4138.0, 6182.0, 9691.0, 15456.0, 24786.0, 41155.0, 72118.0, 138765.0, 1307602.0, 213869.0, 106261.0, 57805.0, 33924.0, 20650.0, 12897.0, 8320.0, 5128.0, 3441.0, 2279.0, 1510.0, 1024.0, 692.0, 459.0, 310.0, 212.0, 130.0, 101.0, 65.0, 50.0, 29.0, 18.0, 15.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9501953125, -0.9183197021484375, -0.886444091796875, -0.8545684814453125, -0.82269287109375, -0.7908172607421875, -0.758941650390625, -0.7270660400390625, -0.6951904296875, -0.6633148193359375, -0.631439208984375, -0.5995635986328125, -0.56768798828125, -0.5358123779296875, -0.503936767578125, -0.4720611572265625, -0.440185546875, -0.4083099365234375, -0.376434326171875, -0.3445587158203125, -0.31268310546875, -0.2808074951171875, -0.248931884765625, -0.2170562744140625, -0.1851806640625, -0.1533050537109375, -0.121429443359375, -0.0895538330078125, -0.05767822265625, -0.0258026123046875, 0.006072998046875, 0.0379486083984375, 0.06982421875, 0.1016998291015625, 0.133575439453125, 0.1654510498046875, 0.19732666015625, 0.2292022705078125, 0.261077880859375, 0.2929534912109375, 0.3248291015625, 0.3567047119140625, 0.388580322265625, 0.4204559326171875, 0.45233154296875, 0.4842071533203125, 0.516082763671875, 0.5479583740234375, 0.579833984375, 0.6117095947265625, 0.643585205078125, 0.6754608154296875, 0.70733642578125, 0.7392120361328125, 0.771087646484375, 0.8029632568359375, 0.8348388671875, 0.8667144775390625, 0.898590087890625, 0.9304656982421875, 0.96234130859375, 0.9942169189453125, 1.026092529296875, 1.0579681396484375, 1.08984375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 18.0, 17.0, 13.0, 21.0, 23.0, 25.0, 31.0, 36.0, 51.0, 59.0, 51.0, 58.0, 53.0, 59.0, 47.0, 67.0, 58.0, 48.0, 40.0, 29.0, 38.0, 34.0, 20.0, 22.0, 13.0, 10.0, 7.0, 4.0, 9.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0022430419921875, -0.0021635890007019043, -0.0020841360092163086, -0.002004683017730713, -0.0019252300262451172, -0.0018457770347595215, -0.0017663240432739258, -0.00168687105178833, -0.0016074180603027344, -0.0015279650688171387, -0.001448512077331543, -0.0013690590858459473, -0.0012896060943603516, -0.0012101531028747559, -0.0011307001113891602, -0.0010512471199035645, -0.0009717941284179688, -0.000892341136932373, -0.0008128881454467773, -0.0007334351539611816, -0.0006539821624755859, -0.0005745291709899902, -0.0004950761795043945, -0.00041562318801879883, -0.0003361701965332031, -0.0002567172050476074, -0.00017726421356201172, -9.781122207641602e-05, -1.8358230590820312e-05, 6.109476089477539e-05, 0.0001405477523803711, 0.0002200007438659668, 0.0002994537353515625, 0.0003789067268371582, 0.0004583597183227539, 0.0005378127098083496, 0.0006172657012939453, 0.000696718692779541, 0.0007761716842651367, 0.0008556246757507324, 0.0009350776672363281, 0.0010145306587219238, 0.0010939836502075195, 0.0011734366416931152, 0.001252889633178711, 0.0013323426246643066, 0.0014117956161499023, 0.001491248607635498, 0.0015707015991210938, 0.0016501545906066895, 0.0017296075820922852, 0.0018090605735778809, 0.0018885135650634766, 0.0019679665565490723, 0.002047419548034668, 0.0021268725395202637, 0.0022063255310058594, 0.002285778522491455, 0.0023652315139770508, 0.0024446845054626465, 0.002524137496948242, 0.002603590488433838, 0.0026830434799194336, 0.0027624964714050293, 0.002841949462890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 4.0, 11.0, 10.0, 10.0, 27.0, 14.0, 35.0, 50.0, 63.0, 105.0, 107.0, 177.0, 391.0, 1124.0, 664490.0, 379934.0, 1029.0, 354.0, 188.0, 113.0, 62.0, 54.0, 38.0, 38.0, 32.0, 24.0, 12.0, 13.0, 11.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06878662109375, -0.06676149368286133, -0.06473636627197266, -0.06271123886108398, -0.06068611145019531, -0.05866098403930664, -0.05663585662841797, -0.0546107292175293, -0.052585601806640625, -0.05056047439575195, -0.04853534698486328, -0.04651021957397461, -0.04448509216308594, -0.042459964752197266, -0.040434837341308594, -0.03840970993041992, -0.03638458251953125, -0.03435945510864258, -0.032334327697753906, -0.030309200286865234, -0.028284072875976562, -0.02625894546508789, -0.02423381805419922, -0.022208690643310547, -0.020183563232421875, -0.018158435821533203, -0.01613330841064453, -0.01410818099975586, -0.012083053588867188, -0.010057926177978516, -0.008032798767089844, -0.006007671356201172, -0.0039825439453125, -0.001957416534423828, 6.771087646484375e-05, 0.0020928382873535156, 0.0041179656982421875, 0.006143093109130859, 0.008168220520019531, 0.010193347930908203, 0.012218475341796875, 0.014243602752685547, 0.01626873016357422, 0.01829385757446289, 0.020318984985351562, 0.022344112396240234, 0.024369239807128906, 0.026394367218017578, 0.02841949462890625, 0.030444622039794922, 0.032469749450683594, 0.034494876861572266, 0.03652000427246094, 0.03854513168334961, 0.04057025909423828, 0.04259538650512695, 0.044620513916015625, 0.0466456413269043, 0.04867076873779297, 0.05069589614868164, 0.05272102355957031, 0.054746150970458984, 0.056771278381347656, 0.05879640579223633, 0.060821533203125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 304.0, 654.0, 46.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01918666996061802, -0.018812132999300957, -0.018437596037983894, -0.018063057214021683, -0.01768852025270462, -0.017313983291387558, -0.016939446330070496, -0.016564909368753433, -0.01619037240743637, -0.01581583544611931, -0.015441297553479671, -0.015066760592162609, -0.014692222699522972, -0.01431768573820591, -0.013943148776888847, -0.013568611815571785, -0.013194072991609573, -0.012819536030292511, -0.012444998137652874, -0.012070461176335812, -0.011695923283696175, -0.011321386322379112, -0.01094684936106205, -0.010572312399744987, -0.01019777450710535, -0.009823237545788288, -0.009448699653148651, -0.009074162691831589, -0.008699625730514526, -0.00832508783787489, -0.007950550876557827, -0.007576013449579477, -0.007201475091278553, -0.006826937664300203, -0.006452400237321854, -0.006077863276004791, -0.005703325849026442, -0.005328788422048092, -0.0049542514607310295, -0.00457971403375268, -0.00420517660677433, -0.0038306391797959805, -0.0034561019856482744, -0.0030815647915005684, -0.0027070273645222187, -0.002332489937543869, -0.001957952743396163, -0.001583415549248457, -0.0012088781222701073, -0.0008343408117070794, -0.00045980350114405155, -8.526619058102369e-05, 0.00028927111998200417, 0.000663808430545032, 0.0010383457411080599, 0.001412882935255766, 0.0017874203622341156, 0.0021619577892124653, 0.0025364949833601713, 0.0029110321775078773, 0.003285569604486227, 0.0036601070314645767, 0.004034643992781639, 0.004409181419759989, 0.0047837188467383385]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 8.0, 13.0, 16.0, 15.0, 16.0, 27.0, 30.0, 28.0, 43.0, 34.0, 34.0, 37.0, 33.0, 41.0, 52.0, 51.0, 46.0, 37.0, 41.0, 42.0, 31.0, 33.0, 33.0, 30.0, 33.0, 27.0, 22.0, 17.0, 16.0, 17.0, 15.0, 12.0, 14.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0014487504959106445, -0.0014047836884856224, -0.0013608168810606003, -0.0013168500736355782, -0.001272883266210556, -0.001228916458785534, -0.0011849496513605118, -0.0011409828439354897, -0.0010970160365104675, -0.0010530492290854454, -0.0010090824216604233, -0.0009651156142354012, -0.000921148806810379, -0.0008771819993853569, -0.0008332151919603348, -0.0007892483845353127, -0.0007452815771102905, -0.0007013147696852684, -0.0006573479622602463, -0.0006133811548352242, -0.000569414347410202, -0.0005254475399851799, -0.0004814807325601578, -0.00043751392513513565, -0.0003935471177101135, -0.0003495803102850914, -0.0003056135028600693, -0.00026164669543504715, -0.00021767988801002502, -0.0001737130805850029, -0.00012974627315998077, -8.577946573495865e-05, -4.1812658309936523e-05, 2.154149115085602e-06, 4.612095654010773e-05, 9.008776396512985e-05, 0.00013405457139015198, 0.0001780213788151741, 0.00022198818624019623, 0.00026595499366521835, 0.0003099218010902405, 0.0003538886085152626, 0.00039785541594028473, 0.00044182222336530685, 0.000485789030790329, 0.0005297558382153511, 0.0005737226456403732, 0.0006176894530653954, 0.0006616562604904175, 0.0007056230679154396, 0.0007495898753404617, 0.0007935566827654839, 0.000837523490190506, 0.0008814902976155281, 0.0009254571050405502, 0.0009694239124655724, 0.0010133907198905945, 0.0010573575273156166, 0.0011013243347406387, 0.0011452911421656609, 0.001189257949590683, 0.0012332247570157051, 0.0012771915644407272, 0.0013211583718657494, 0.0013651251792907715]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 10.0, 11.0, 17.0, 15.0, 17.0, 19.0, 27.0, 20.0, 28.0, 26.0, 35.0, 37.0, 29.0, 30.0, 39.0, 40.0, 40.0, 43.0, 35.0, 35.0, 39.0, 36.0, 32.0, 24.0, 26.0, 29.0, 32.0, 27.0, 23.0, 17.0, 23.0, 17.0, 16.0, 12.0, 13.0, 9.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.48828125, -7.265625, -7.04296875, -6.8203125, -6.59765625, -6.375, -6.15234375, -5.9296875, -5.70703125, -5.484375, -5.26171875, -5.0390625, -4.81640625, -4.59375, -4.37109375, -4.1484375, -3.92578125, -3.703125, -3.48046875, -3.2578125, -3.03515625, -2.8125, -2.58984375, -2.3671875, -2.14453125, -1.921875, -1.69921875, -1.4765625, -1.25390625, -1.03125, -0.80859375, -0.5859375, -0.36328125, -0.140625, 0.08203125, 0.3046875, 0.52734375, 0.75, 0.97265625, 1.1953125, 1.41796875, 1.640625, 1.86328125, 2.0859375, 2.30859375, 2.53125, 2.75390625, 2.9765625, 3.19921875, 3.421875, 3.64453125, 3.8671875, 4.08984375, 4.3125, 4.53515625, 4.7578125, 4.98046875, 5.203125, 5.42578125, 5.6484375, 5.87109375, 6.09375, 6.31640625, 6.5390625, 6.76171875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 7.0, 10.0, 15.0, 16.0, 13.0, 26.0, 22.0, 30.0, 34.0, 53.0, 63.0, 91.0, 112.0, 166.0, 241.0, 420.0, 732.0, 2259.0, 9646.0, 61834.0, 677497.0, 260001.0, 27134.0, 5059.0, 1371.0, 592.0, 287.0, 203.0, 148.0, 108.0, 72.0, 54.0, 46.0, 42.0, 37.0, 24.0, 12.0, 11.0, 14.0, 10.0, 6.0, 6.0, 8.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-14.859375, -14.419677734375, -13.97998046875, -13.540283203125, -13.1005859375, -12.660888671875, -12.22119140625, -11.781494140625, -11.341796875, -10.902099609375, -10.46240234375, -10.022705078125, -9.5830078125, -9.143310546875, -8.70361328125, -8.263916015625, -7.82421875, -7.384521484375, -6.94482421875, -6.505126953125, -6.0654296875, -5.625732421875, -5.18603515625, -4.746337890625, -4.306640625, -3.866943359375, -3.42724609375, -2.987548828125, -2.5478515625, -2.108154296875, -1.66845703125, -1.228759765625, -0.7890625, -0.349365234375, 0.09033203125, 0.530029296875, 0.9697265625, 1.409423828125, 1.84912109375, 2.288818359375, 2.728515625, 3.168212890625, 3.60791015625, 4.047607421875, 4.4873046875, 4.927001953125, 5.36669921875, 5.806396484375, 6.24609375, 6.685791015625, 7.12548828125, 7.565185546875, 8.0048828125, 8.444580078125, 8.88427734375, 9.323974609375, 9.763671875, 10.203369140625, 10.64306640625, 11.082763671875, 11.5224609375, 11.962158203125, 12.40185546875, 12.841552734375, 13.28125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 13.0, 15.0, 16.0, 26.0, 17.0, 24.0, 26.0, 36.0, 33.0, 48.0, 42.0, 45.0, 52.0, 67.0, 195.0, 1653.0, 224.0, 76.0, 43.0, 51.0, 33.0, 40.0, 39.0, 30.0, 34.0, 15.0, 14.0, 13.0, 15.0, 17.0, 18.0, 9.0, 11.0, 5.0, 11.0, 7.0, 1.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.65625, -22.92919921875, -22.2021484375, -21.47509765625, -20.748046875, -20.02099609375, -19.2939453125, -18.56689453125, -17.83984375, -17.11279296875, -16.3857421875, -15.65869140625, -14.931640625, -14.20458984375, -13.4775390625, -12.75048828125, -12.0234375, -11.29638671875, -10.5693359375, -9.84228515625, -9.115234375, -8.38818359375, -7.6611328125, -6.93408203125, -6.20703125, -5.47998046875, -4.7529296875, -4.02587890625, -3.298828125, -2.57177734375, -1.8447265625, -1.11767578125, -0.390625, 0.33642578125, 1.0634765625, 1.79052734375, 2.517578125, 3.24462890625, 3.9716796875, 4.69873046875, 5.42578125, 6.15283203125, 6.8798828125, 7.60693359375, 8.333984375, 9.06103515625, 9.7880859375, 10.51513671875, 11.2421875, 11.96923828125, 12.6962890625, 13.42333984375, 14.150390625, 14.87744140625, 15.6044921875, 16.33154296875, 17.05859375, 17.78564453125, 18.5126953125, 19.23974609375, 19.966796875, 20.69384765625, 21.4208984375, 22.14794921875, 22.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 6.0, 12.0, 11.0, 21.0, 16.0, 18.0, 19.0, 22.0, 35.0, 44.0, 45.0, 77.0, 92.0, 147.0, 258.0, 482.0, 1621.0, 53352.0, 3078260.0, 8973.0, 1042.0, 416.0, 189.0, 132.0, 83.0, 61.0, 52.0, 36.0, 26.0, 19.0, 31.0, 22.0, 18.0, 10.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84375, -51.208984375, -49.57421875, -47.939453125, -46.3046875, -44.669921875, -43.03515625, -41.400390625, -39.765625, -38.130859375, -36.49609375, -34.861328125, -33.2265625, -31.591796875, -29.95703125, -28.322265625, -26.6875, -25.052734375, -23.41796875, -21.783203125, -20.1484375, -18.513671875, -16.87890625, -15.244140625, -13.609375, -11.974609375, -10.33984375, -8.705078125, -7.0703125, -5.435546875, -3.80078125, -2.166015625, -0.53125, 1.103515625, 2.73828125, 4.373046875, 6.0078125, 7.642578125, 9.27734375, 10.912109375, 12.546875, 14.181640625, 15.81640625, 17.451171875, 19.0859375, 20.720703125, 22.35546875, 23.990234375, 25.625, 27.259765625, 28.89453125, 30.529296875, 32.1640625, 33.798828125, 35.43359375, 37.068359375, 38.703125, 40.337890625, 41.97265625, 43.607421875, 45.2421875, 46.876953125, 48.51171875, 50.146484375, 51.78125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 178.0, 632.0, 184.0, 17.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.809925079345703, -27.198936462402344, -23.58794593811035, -19.97695541381836, -16.365966796875, -12.75497817993164, -9.143987655639648, -5.532997131347656, -1.9220085144042969, 1.688981056213379, 5.299970626831055, 8.91096019744873, 12.521949768066406, 16.132938385009766, 19.743928909301758, 23.35491943359375, 26.96590805053711, 30.57689666748047, 34.187889099121094, 37.79887771606445, 41.40986633300781, 45.02085494995117, 48.63184356689453, 52.242835998535156, 55.853824615478516, 59.464813232421875, 63.0758056640625, 66.6867904663086, 70.29778289794922, 73.90876770019531, 77.51976013183594, 81.13075256347656, 84.74174499511719, 88.35273742675781, 91.9637222290039, 95.57471466064453, 99.18569946289062, 102.79669189453125, 106.40768432617188, 110.0186767578125, 113.6296615600586, 117.24065399169922, 120.85163879394531, 124.46263122558594, 128.07362365722656, 131.68460083007812, 135.29559326171875, 138.90658569335938, 142.517578125, 146.12857055664062, 149.73956298828125, 153.3505401611328, 156.96153259277344, 160.57252502441406, 164.1835174560547, 167.7945098876953, 171.40548706054688, 175.0164794921875, 178.62747192382812, 182.2384490966797, 185.8494415283203, 189.46043395996094, 193.07142639160156, 196.6824188232422, 200.2934112548828]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 4.0, 12.0, 16.0, 16.0, 12.0, 19.0, 20.0, 25.0, 26.0, 27.0, 34.0, 35.0, 49.0, 36.0, 39.0, 51.0, 40.0, 36.0, 48.0, 53.0, 42.0, 37.0, 41.0, 31.0, 25.0, 33.0, 28.0, 19.0, 14.0, 14.0, 14.0, 11.0, 17.0, 10.0, 10.0, 9.0, 3.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.43195343017578, -51.59483337402344, -49.75771713256836, -47.920597076416016, -46.08348083496094, -44.246360778808594, -42.409244537353516, -40.57212448120117, -38.735008239746094, -36.89788818359375, -35.06077194213867, -33.22365188598633, -31.38653564453125, -29.549415588378906, -27.712299346923828, -25.875179290771484, -24.038061141967773, -22.200942993164062, -20.36382484436035, -18.52670669555664, -16.68958854675293, -14.852469444274902, -13.015351295471191, -11.17823314666748, -9.34111499786377, -7.503996849060059, -5.666878700256348, -3.8297600746154785, -1.9926419258117676, -0.15552330017089844, 1.6815948486328125, 3.5187129974365234, 5.355831146240234, 7.192949295043945, 9.030067443847656, 10.867185592651367, 12.704303741455078, 14.541422843933105, 16.3785400390625, 18.215660095214844, 20.052776336669922, 21.889894485473633, 23.727012634277344, 25.564130783081055, 27.401248931884766, 29.23836898803711, 31.075485229492188, 32.91260528564453, 34.749725341796875, 36.58684539794922, 38.4239616394043, 40.26108169555664, 42.09819793701172, 43.93531799316406, 45.77243423461914, 47.609554290771484, 49.44667053222656, 51.283790588378906, 53.120906829833984, 54.95802688598633, 56.795143127441406, 58.63226318359375, 60.46937942504883, 62.30649948120117, 64.14361572265625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 15.0, 10.0, 14.0, 20.0, 17.0, 31.0, 24.0, 15.0, 24.0, 27.0, 25.0, 39.0, 35.0, 31.0, 38.0, 41.0, 34.0, 42.0, 34.0, 42.0, 37.0, 27.0, 39.0, 25.0, 36.0, 27.0, 33.0, 23.0, 27.0, 21.0, 23.0, 11.0, 8.0, 21.0, 9.0, 6.0, 14.0, 7.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 3.0], "bins": [-8.1484375, -7.9193115234375, -7.690185546875, -7.4610595703125, -7.23193359375, -7.0028076171875, -6.773681640625, -6.5445556640625, -6.3154296875, -6.0863037109375, -5.857177734375, -5.6280517578125, -5.39892578125, -5.1697998046875, -4.940673828125, -4.7115478515625, -4.482421875, -4.2532958984375, -4.024169921875, -3.7950439453125, -3.56591796875, -3.3367919921875, -3.107666015625, -2.8785400390625, -2.6494140625, -2.4202880859375, -2.191162109375, -1.9620361328125, -1.73291015625, -1.5037841796875, -1.274658203125, -1.0455322265625, -0.81640625, -0.5872802734375, -0.358154296875, -0.1290283203125, 0.10009765625, 0.3292236328125, 0.558349609375, 0.7874755859375, 1.0166015625, 1.2457275390625, 1.474853515625, 1.7039794921875, 1.93310546875, 2.1622314453125, 2.391357421875, 2.6204833984375, 2.849609375, 3.0787353515625, 3.307861328125, 3.5369873046875, 3.76611328125, 3.9952392578125, 4.224365234375, 4.4534912109375, 4.6826171875, 4.9117431640625, 5.140869140625, 5.3699951171875, 5.59912109375, 5.8282470703125, 6.057373046875, 6.2864990234375, 6.515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 8.0, 9.0, 9.0, 11.0, 15.0, 18.0, 16.0, 30.0, 35.0, 44.0, 54.0, 106.0, 159.0, 241.0, 466.0, 915.0, 2124.0, 6318.0, 31852.0, 413168.0, 2847187.0, 823137.0, 53755.0, 9335.0, 2747.0, 1118.0, 558.0, 282.0, 169.0, 97.0, 77.0, 45.0, 36.0, 19.0, 18.0, 12.0, 16.0, 10.0, 10.0, 8.0, 13.0, 1.0, 4.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0], "bins": [-21.125, -20.531982421875, -19.93896484375, -19.345947265625, -18.7529296875, -18.159912109375, -17.56689453125, -16.973876953125, -16.380859375, -15.787841796875, -15.19482421875, -14.601806640625, -14.0087890625, -13.415771484375, -12.82275390625, -12.229736328125, -11.63671875, -11.043701171875, -10.45068359375, -9.857666015625, -9.2646484375, -8.671630859375, -8.07861328125, -7.485595703125, -6.892578125, -6.299560546875, -5.70654296875, -5.113525390625, -4.5205078125, -3.927490234375, -3.33447265625, -2.741455078125, -2.1484375, -1.555419921875, -0.96240234375, -0.369384765625, 0.2236328125, 0.816650390625, 1.40966796875, 2.002685546875, 2.595703125, 3.188720703125, 3.78173828125, 4.374755859375, 4.9677734375, 5.560791015625, 6.15380859375, 6.746826171875, 7.33984375, 7.932861328125, 8.52587890625, 9.118896484375, 9.7119140625, 10.304931640625, 10.89794921875, 11.490966796875, 12.083984375, 12.677001953125, 13.27001953125, 13.863037109375, 14.4560546875, 15.049072265625, 15.64208984375, 16.235107421875, 16.828125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 19.0, 23.0, 19.0, 37.0, 43.0, 59.0, 85.0, 104.0, 141.0, 230.0, 273.0, 323.0, 374.0, 437.0, 419.0, 358.0, 247.0, 193.0, 142.0, 133.0, 110.0, 67.0, 46.0, 45.0, 29.0, 19.0, 17.0, 10.0, 6.0, 8.0, 8.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.4310302734375, -11.057373046875, -10.6837158203125, -10.31005859375, -9.9364013671875, -9.562744140625, -9.1890869140625, -8.8154296875, -8.4417724609375, -8.068115234375, -7.6944580078125, -7.32080078125, -6.9471435546875, -6.573486328125, -6.1998291015625, -5.826171875, -5.4525146484375, -5.078857421875, -4.7052001953125, -4.33154296875, -3.9578857421875, -3.584228515625, -3.2105712890625, -2.8369140625, -2.4632568359375, -2.089599609375, -1.7159423828125, -1.34228515625, -0.9686279296875, -0.594970703125, -0.2213134765625, 0.15234375, 0.5260009765625, 0.899658203125, 1.2733154296875, 1.64697265625, 2.0206298828125, 2.394287109375, 2.7679443359375, 3.1416015625, 3.5152587890625, 3.888916015625, 4.2625732421875, 4.63623046875, 5.0098876953125, 5.383544921875, 5.7572021484375, 6.130859375, 6.5045166015625, 6.878173828125, 7.2518310546875, 7.62548828125, 7.9991455078125, 8.372802734375, 8.7464599609375, 9.1201171875, 9.4937744140625, 9.867431640625, 10.2410888671875, 10.61474609375, 10.9884033203125, 11.362060546875, 11.7357177734375, 12.109375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 11.0, 17.0, 16.0, 16.0, 23.0, 37.0, 35.0, 48.0, 74.0, 82.0, 99.0, 149.0, 183.0, 264.0, 453.0, 1050.0, 4801.0, 81145.0, 3731613.0, 359883.0, 10873.0, 1620.0, 595.0, 318.0, 205.0, 147.0, 108.0, 77.0, 73.0, 48.0, 43.0, 30.0, 30.0, 21.0, 10.0, 9.0, 8.0, 15.0, 12.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.03125, -41.71435546875, -40.3974609375, -39.08056640625, -37.763671875, -36.44677734375, -35.1298828125, -33.81298828125, -32.49609375, -31.17919921875, -29.8623046875, -28.54541015625, -27.228515625, -25.91162109375, -24.5947265625, -23.27783203125, -21.9609375, -20.64404296875, -19.3271484375, -18.01025390625, -16.693359375, -15.37646484375, -14.0595703125, -12.74267578125, -11.42578125, -10.10888671875, -8.7919921875, -7.47509765625, -6.158203125, -4.84130859375, -3.5244140625, -2.20751953125, -0.890625, 0.42626953125, 1.7431640625, 3.06005859375, 4.376953125, 5.69384765625, 7.0107421875, 8.32763671875, 9.64453125, 10.96142578125, 12.2783203125, 13.59521484375, 14.912109375, 16.22900390625, 17.5458984375, 18.86279296875, 20.1796875, 21.49658203125, 22.8134765625, 24.13037109375, 25.447265625, 26.76416015625, 28.0810546875, 29.39794921875, 30.71484375, 32.03173828125, 33.3486328125, 34.66552734375, 35.982421875, 37.29931640625, 38.6162109375, 39.93310546875, 41.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 133.0, 491.0, 328.0, 53.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.1344299316406, -259.8751220703125, -252.6157989501953, -245.35647583007812, -238.09716796875, -230.8378448486328, -223.57852172851562, -216.3192138671875, -209.05990600585938, -201.8005828857422, -194.54127502441406, -187.28195190429688, -180.02264404296875, -172.76332092285156, -165.50399780273438, -158.24468994140625, -150.98536682128906, -143.72604370117188, -136.46673583984375, -129.20741271972656, -121.94810485839844, -114.68878173828125, -107.4294662475586, -100.17015075683594, -92.91083526611328, -85.65151977539062, -78.39220428466797, -71.13288879394531, -63.87356948852539, -56.614253997802734, -49.35493469238281, -42.095619201660156, -34.83628845214844, -27.57697296142578, -20.317655563354492, -13.058338165283203, -5.799022674560547, 1.4602928161621094, 8.719612121582031, 15.978927612304688, 23.238243103027344, 30.49755859375, 37.756874084472656, 45.01619338989258, 52.275508880615234, 59.53482437133789, 66.79414367675781, 74.05345916748047, 81.31277465820312, 88.57209014892578, 95.83140563964844, 103.09072875976562, 110.35003662109375, 117.60935974121094, 124.8686752319336, 132.12799072265625, 139.38729858398438, 146.64662170410156, 153.9059295654297, 161.16525268554688, 168.424560546875, 175.6838836669922, 182.94320678710938, 190.2025146484375, 197.4618377685547]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 5.0, 14.0, 17.0, 8.0, 18.0, 22.0, 15.0, 28.0, 31.0, 28.0, 21.0, 36.0, 44.0, 43.0, 43.0, 40.0, 41.0, 39.0, 52.0, 31.0, 41.0, 38.0, 40.0, 41.0, 40.0, 32.0, 35.0, 23.0, 21.0, 21.0, 16.0, 10.0, 9.0, 11.0, 10.0, 6.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.59698486328125, -52.17804718017578, -50.75910949707031, -49.340171813964844, -47.921234130859375, -46.502296447753906, -45.08335876464844, -43.66442108154297, -42.2454833984375, -40.82654571533203, -39.40760803222656, -37.988670349121094, -36.569732666015625, -35.150794982910156, -33.73185729980469, -32.31291961669922, -30.893978118896484, -29.475040435791016, -28.056102752685547, -26.637165069580078, -25.21822738647461, -23.79928970336914, -22.38035011291504, -20.96141242980957, -19.5424747467041, -18.123537063598633, -16.704599380493164, -15.285660743713379, -13.86672306060791, -12.447785377502441, -11.028846740722656, -9.609909057617188, -8.190971374511719, -6.77203369140625, -5.353095531463623, -3.934157371520996, -2.5152196884155273, -1.0962820053100586, 0.32265663146972656, 1.7415943145751953, 3.160531997680664, 4.579469680786133, 5.99840784072876, 7.417346000671387, 8.836283683776855, 10.255221366882324, 11.67416000366211, 13.093097686767578, 14.512035369873047, 15.930973052978516, 17.349910736083984, 18.768848419189453, 20.187786102294922, 21.60672378540039, 23.025663375854492, 24.44460105895996, 25.86353874206543, 27.2824764251709, 28.701414108276367, 30.12035369873047, 31.539291381835938, 32.958229064941406, 34.377166748046875, 35.796104431152344, 37.21504211425781]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 11.0, 6.0, 7.0, 7.0, 13.0, 13.0, 20.0, 15.0, 20.0, 27.0, 34.0, 36.0, 24.0, 31.0, 43.0, 32.0, 29.0, 46.0, 59.0, 41.0, 48.0, 53.0, 45.0, 30.0, 34.0, 26.0, 30.0, 32.0, 32.0, 32.0, 26.0, 19.0, 23.0, 17.0, 8.0, 13.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2679443359375, -7.996826171875, -7.7257080078125, -7.45458984375, -7.1834716796875, -6.912353515625, -6.6412353515625, -6.3701171875, -6.0989990234375, -5.827880859375, -5.5567626953125, -5.28564453125, -5.0145263671875, -4.743408203125, -4.4722900390625, -4.201171875, -3.9300537109375, -3.658935546875, -3.3878173828125, -3.11669921875, -2.8455810546875, -2.574462890625, -2.3033447265625, -2.0322265625, -1.7611083984375, -1.489990234375, -1.2188720703125, -0.94775390625, -0.6766357421875, -0.405517578125, -0.1343994140625, 0.13671875, 0.4078369140625, 0.678955078125, 0.9500732421875, 1.22119140625, 1.4923095703125, 1.763427734375, 2.0345458984375, 2.3056640625, 2.5767822265625, 2.847900390625, 3.1190185546875, 3.39013671875, 3.6612548828125, 3.932373046875, 4.2034912109375, 4.474609375, 4.7457275390625, 5.016845703125, 5.2879638671875, 5.55908203125, 5.8302001953125, 6.101318359375, 6.3724365234375, 6.6435546875, 6.9146728515625, 7.185791015625, 7.4569091796875, 7.72802734375, 7.9991455078125, 8.270263671875, 8.5413818359375, 8.8125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 8.0, 10.0, 11.0, 17.0, 23.0, 46.0, 68.0, 93.0, 128.0, 158.0, 266.0, 362.0, 565.0, 814.0, 1091.0, 1594.0, 2275.0, 3397.0, 5022.0, 7316.0, 11071.0, 17275.0, 27345.0, 45287.0, 79192.0, 145956.0, 243247.0, 194178.0, 105052.0, 58945.0, 34750.0, 21565.0, 13718.0, 8839.0, 5930.0, 4031.0, 2720.0, 1948.0, 1304.0, 877.0, 633.0, 438.0, 317.0, 216.0, 138.0, 101.0, 65.0, 56.0, 31.0, 17.0, 22.0, 13.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.033203125, -0.9984588623046875, -0.963714599609375, -0.9289703369140625, -0.89422607421875, -0.8594818115234375, -0.824737548828125, -0.7899932861328125, -0.7552490234375, -0.7205047607421875, -0.685760498046875, -0.6510162353515625, -0.61627197265625, -0.5815277099609375, -0.546783447265625, -0.5120391845703125, -0.477294921875, -0.4425506591796875, -0.407806396484375, -0.3730621337890625, -0.33831787109375, -0.3035736083984375, -0.268829345703125, -0.2340850830078125, -0.1993408203125, -0.1645965576171875, -0.129852294921875, -0.0951080322265625, -0.06036376953125, -0.0256195068359375, 0.009124755859375, 0.0438690185546875, 0.07861328125, 0.1133575439453125, 0.148101806640625, 0.1828460693359375, 0.21759033203125, 0.2523345947265625, 0.287078857421875, 0.3218231201171875, 0.3565673828125, 0.3913116455078125, 0.426055908203125, 0.4608001708984375, 0.49554443359375, 0.5302886962890625, 0.565032958984375, 0.5997772216796875, 0.634521484375, 0.6692657470703125, 0.704010009765625, 0.7387542724609375, 0.77349853515625, 0.8082427978515625, 0.842987060546875, 0.8777313232421875, 0.9124755859375, 0.9472198486328125, 0.981964111328125, 1.0167083740234375, 1.05145263671875, 1.0861968994140625, 1.120941162109375, 1.1556854248046875, 1.1904296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 9.0, 7.0, 7.0, 10.0, 16.0, 15.0, 16.0, 12.0, 16.0, 22.0, 25.0, 34.0, 34.0, 48.0, 38.0, 34.0, 30.0, 37.0, 30.0, 1065.0, 46.0, 36.0, 42.0, 24.0, 38.0, 44.0, 33.0, 28.0, 26.0, 25.0, 19.0, 16.0, 8.0, 21.0, 10.0, 12.0, 18.0, 8.0, 9.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48480224609375, -4.3328857421875, -4.18096923828125, -4.029052734375, -3.87713623046875, -3.7252197265625, -3.57330322265625, -3.42138671875, -3.26947021484375, -3.1175537109375, -2.96563720703125, -2.813720703125, -2.66180419921875, -2.5098876953125, -2.35797119140625, -2.2060546875, -2.05413818359375, -1.9022216796875, -1.75030517578125, -1.598388671875, -1.44647216796875, -1.2945556640625, -1.14263916015625, -0.99072265625, -0.83880615234375, -0.6868896484375, -0.53497314453125, -0.383056640625, -0.23114013671875, -0.0792236328125, 0.07269287109375, 0.224609375, 0.37652587890625, 0.5284423828125, 0.68035888671875, 0.832275390625, 0.98419189453125, 1.1361083984375, 1.28802490234375, 1.43994140625, 1.59185791015625, 1.7437744140625, 1.89569091796875, 2.047607421875, 2.19952392578125, 2.3514404296875, 2.50335693359375, 2.6552734375, 2.80718994140625, 2.9591064453125, 3.11102294921875, 3.262939453125, 3.41485595703125, 3.5667724609375, 3.71868896484375, 3.87060546875, 4.02252197265625, 4.1744384765625, 4.32635498046875, 4.478271484375, 4.63018798828125, 4.7821044921875, 4.93402099609375, 5.0859375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 13.0, 26.0, 54.0, 48.0, 81.0, 107.0, 175.0, 234.0, 350.0, 470.0, 645.0, 888.0, 1347.0, 1895.0, 2671.0, 3910.0, 5987.0, 8723.0, 13303.0, 20176.0, 31836.0, 52224.0, 90860.0, 166791.0, 1290177.0, 167932.0, 91098.0, 52323.0, 31567.0, 20274.0, 13278.0, 8627.0, 5946.0, 3941.0, 2712.0, 1917.0, 1340.0, 893.0, 681.0, 459.0, 334.0, 246.0, 165.0, 144.0, 80.0, 53.0, 35.0, 29.0, 15.0, 13.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.95556640625, -0.92523193359375, -0.8948974609375, -0.86456298828125, -0.834228515625, -0.80389404296875, -0.7735595703125, -0.74322509765625, -0.712890625, -0.68255615234375, -0.6522216796875, -0.62188720703125, -0.591552734375, -0.56121826171875, -0.5308837890625, -0.50054931640625, -0.47021484375, -0.43988037109375, -0.4095458984375, -0.37921142578125, -0.348876953125, -0.31854248046875, -0.2882080078125, -0.25787353515625, -0.2275390625, -0.19720458984375, -0.1668701171875, -0.13653564453125, -0.106201171875, -0.07586669921875, -0.0455322265625, -0.01519775390625, 0.01513671875, 0.04547119140625, 0.0758056640625, 0.10614013671875, 0.136474609375, 0.16680908203125, 0.1971435546875, 0.22747802734375, 0.2578125, 0.28814697265625, 0.3184814453125, 0.34881591796875, 0.379150390625, 0.40948486328125, 0.4398193359375, 0.47015380859375, 0.50048828125, 0.53082275390625, 0.5611572265625, 0.59149169921875, 0.621826171875, 0.65216064453125, 0.6824951171875, 0.71282958984375, 0.7431640625, 0.77349853515625, 0.8038330078125, 0.83416748046875, 0.864501953125, 0.89483642578125, 0.9251708984375, 0.95550537109375, 0.98583984375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 14.0, 8.0, 18.0, 20.0, 30.0, 36.0, 75.0, 74.0, 90.0, 100.0, 110.0, 97.0, 72.0, 54.0, 54.0, 31.0, 29.0, 13.0, 11.0, 11.0, 13.0, 4.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00342559814453125, -0.0032994747161865234, -0.003173351287841797, -0.0030472278594970703, -0.0029211044311523438, -0.002794981002807617, -0.0026688575744628906, -0.002542734146118164, -0.0024166107177734375, -0.002290487289428711, -0.0021643638610839844, -0.002038240432739258, -0.0019121170043945312, -0.0017859935760498047, -0.0016598701477050781, -0.0015337467193603516, -0.001407623291015625, -0.0012814998626708984, -0.0011553764343261719, -0.0010292530059814453, -0.0009031295776367188, -0.0007770061492919922, -0.0006508827209472656, -0.0005247592926025391, -0.0003986358642578125, -0.00027251243591308594, -0.00014638900756835938, -2.0265579223632812e-05, 0.00010585784912109375, 0.0002319812774658203, 0.0003581047058105469, 0.00048422813415527344, 0.0006103515625, 0.0007364749908447266, 0.0008625984191894531, 0.0009887218475341797, 0.0011148452758789062, 0.0012409687042236328, 0.0013670921325683594, 0.001493215560913086, 0.0016193389892578125, 0.001745462417602539, 0.0018715858459472656, 0.001997709274291992, 0.0021238327026367188, 0.0022499561309814453, 0.002376079559326172, 0.0025022029876708984, 0.002628326416015625, 0.0027544498443603516, 0.002880573272705078, 0.0030066967010498047, 0.0031328201293945312, 0.003258943557739258, 0.0033850669860839844, 0.003511190414428711, 0.0036373138427734375, 0.003763437271118164, 0.0038895606994628906, 0.004015684127807617, 0.004141807556152344, 0.00426793098449707, 0.004394054412841797, 0.0045201778411865234, 0.00464630126953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 12.0, 6.0, 16.0, 16.0, 30.0, 33.0, 47.0, 70.0, 113.0, 218.0, 383.0, 1673.0, 1040619.0, 4163.0, 511.0, 260.0, 133.0, 80.0, 45.0, 30.0, 33.0, 18.0, 18.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10382080078125, -0.10098457336425781, -0.09814834594726562, -0.09531211853027344, -0.09247589111328125, -0.08963966369628906, -0.08680343627929688, -0.08396720886230469, -0.0811309814453125, -0.07829475402832031, -0.07545852661132812, -0.07262229919433594, -0.06978607177734375, -0.06694984436035156, -0.06411361694335938, -0.06127738952636719, -0.058441162109375, -0.05560493469238281, -0.052768707275390625, -0.04993247985839844, -0.04709625244140625, -0.04426002502441406, -0.041423797607421875, -0.03858757019042969, -0.0357513427734375, -0.03291511535644531, -0.030078887939453125, -0.027242660522460938, -0.02440643310546875, -0.021570205688476562, -0.018733978271484375, -0.015897750854492188, -0.0130615234375, -0.010225296020507812, -0.007389068603515625, -0.0045528411865234375, -0.00171661376953125, 0.0011196136474609375, 0.003955841064453125, 0.0067920684814453125, 0.0096282958984375, 0.012464523315429688, 0.015300750732421875, 0.018136978149414062, 0.02097320556640625, 0.023809432983398438, 0.026645660400390625, 0.029481887817382812, 0.032318115234375, 0.03515434265136719, 0.037990570068359375, 0.04082679748535156, 0.04366302490234375, 0.04649925231933594, 0.049335479736328125, 0.05217170715332031, 0.0550079345703125, 0.05784416198730469, 0.060680389404296875, 0.06351661682128906, 0.06635284423828125, 0.06918907165527344, 0.07202529907226562, 0.07486152648925781, 0.07769775390625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 51.0, 223.0, 441.0, 243.0, 41.0, 11.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008096171543002129, -0.007922104559838772, -0.007748038042336702, -0.007573971524834633, -0.007399904541671276, -0.007225838024169207, -0.007051771506667137, -0.00687770452350378, -0.006703637540340424, -0.006529571022838354, -0.006355504039674997, -0.006181437522172928, -0.006007370539009571, -0.005833304021507502, -0.005659237504005432, -0.005485170520842075, -0.005311104003340006, -0.005137037485837936, -0.00496297050267458, -0.00478890398517251, -0.004614837002009153, -0.004440770484507084, -0.004266703501343727, -0.004092636983841658, -0.003918570466339588, -0.003744503716006875, -0.003570436965674162, -0.0033963704481720924, -0.0032223034650087357, -0.003048236947506666, -0.002874170197173953, -0.00270010344684124, -0.0025260369293391705, -0.0023519701790064573, -0.002177903428673744, -0.0020038369111716747, -0.0018297700444236398, -0.0016557032940909266, -0.0014816366601735353, -0.0013075699098408222, -0.001133503159508109, -0.000959436409175396, -0.0007853697170503438, -0.0006113030249252915, -0.0004372362745925784, -0.0002631695242598653, -8.910289034247398e-05, 8.496385999023914e-05, 0.00025903061032295227, 0.00043309733155183494, 0.0006071640527807176, 0.0007812307449057698, 0.000955297495238483, 0.001129364245571196, 0.0013034308794885874, 0.0014774976298213005, 0.0016515643801540136, 0.0018256311304867268, 0.00199969788081944, 0.002173764631152153, 0.0023478311486542225, 0.0025218981318175793, 0.0026959646493196487, 0.002870031399652362, 0.003044098149985075]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 11.0, 12.0, 9.0, 13.0, 16.0, 19.0, 14.0, 16.0, 21.0, 24.0, 24.0, 25.0, 19.0, 27.0, 39.0, 36.0, 32.0, 42.0, 49.0, 33.0, 36.0, 37.0, 33.0, 31.0, 36.0, 39.0, 35.0, 32.0, 31.0, 28.0, 24.0, 25.0, 12.0, 17.0, 16.0, 13.0, 16.0, 8.0, 9.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.001431584358215332, -0.0013898732140660286, -0.0013481620699167252, -0.0013064509257674217, -0.0012647397816181183, -0.0012230286374688148, -0.0011813174933195114, -0.001139606349170208, -0.0010978952050209045, -0.001056184060871601, -0.0010144729167222977, -0.0009727617725729942, -0.0009310506284236908, -0.0008893394842743874, -0.0008476283401250839, -0.0008059171959757805, -0.000764206051826477, -0.0007224949076771736, -0.0006807837635278702, -0.0006390726193785667, -0.0005973614752292633, -0.0005556503310799599, -0.0005139391869306564, -0.000472228042781353, -0.00043051689863204956, -0.0003888057544827461, -0.0003470946103334427, -0.00030538346618413925, -0.0002636723220348358, -0.00022196117788553238, -0.00018025003373622894, -0.0001385388895869255, -9.682774543762207e-05, -5.5116601288318634e-05, -1.3405457139015198e-05, 2.830568701028824e-05, 7.001683115959167e-05, 0.00011172797530889511, 0.00015343911945819855, 0.00019515026360750198, 0.00023686140775680542, 0.00027857255190610886, 0.0003202836960554123, 0.00036199484020471573, 0.00040370598435401917, 0.0004454171285033226, 0.00048712827265262604, 0.0005288394168019295, 0.0005705505609512329, 0.0006122617051005363, 0.0006539728492498398, 0.0006956839933991432, 0.0007373951375484467, 0.0007791062816977501, 0.0008208174258470535, 0.000862528569996357, 0.0009042397141456604, 0.0009459508582949638, 0.0009876620024442673, 0.0010293731465935707, 0.0010710842907428741, 0.0011127954348921776, 0.001154506579041481, 0.0011962177231907845, 0.0012379288673400879]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 11.0, 6.0, 7.0, 7.0, 13.0, 13.0, 20.0, 16.0, 19.0, 27.0, 34.0, 36.0, 24.0, 31.0, 44.0, 31.0, 30.0, 48.0, 56.0, 42.0, 47.0, 54.0, 45.0, 29.0, 36.0, 24.0, 31.0, 33.0, 31.0, 32.0, 25.0, 20.0, 22.0, 17.0, 8.0, 13.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.267822265625, -7.99658203125, -7.725341796875, -7.4541015625, -7.182861328125, -6.91162109375, -6.640380859375, -6.369140625, -6.097900390625, -5.82666015625, -5.555419921875, -5.2841796875, -5.012939453125, -4.74169921875, -4.470458984375, -4.19921875, -3.927978515625, -3.65673828125, -3.385498046875, -3.1142578125, -2.843017578125, -2.57177734375, -2.300537109375, -2.029296875, -1.758056640625, -1.48681640625, -1.215576171875, -0.9443359375, -0.673095703125, -0.40185546875, -0.130615234375, 0.140625, 0.411865234375, 0.68310546875, 0.954345703125, 1.2255859375, 1.496826171875, 1.76806640625, 2.039306640625, 2.310546875, 2.581787109375, 2.85302734375, 3.124267578125, 3.3955078125, 3.666748046875, 3.93798828125, 4.209228515625, 4.48046875, 4.751708984375, 5.02294921875, 5.294189453125, 5.5654296875, 5.836669921875, 6.10791015625, 6.379150390625, 6.650390625, 6.921630859375, 7.19287109375, 7.464111328125, 7.7353515625, 8.006591796875, 8.27783203125, 8.549072265625, 8.8203125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 13.0, 10.0, 18.0, 21.0, 30.0, 32.0, 45.0, 59.0, 81.0, 104.0, 164.0, 234.0, 304.0, 431.0, 732.0, 1267.0, 2774.0, 10845.0, 82197.0, 865043.0, 68351.0, 9696.0, 2695.0, 1185.0, 689.0, 406.0, 311.0, 209.0, 153.0, 121.0, 91.0, 68.0, 40.0, 40.0, 20.0, 22.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.5625, -20.877197265625, -20.19189453125, -19.506591796875, -18.8212890625, -18.135986328125, -17.45068359375, -16.765380859375, -16.080078125, -15.394775390625, -14.70947265625, -14.024169921875, -13.3388671875, -12.653564453125, -11.96826171875, -11.282958984375, -10.59765625, -9.912353515625, -9.22705078125, -8.541748046875, -7.8564453125, -7.171142578125, -6.48583984375, -5.800537109375, -5.115234375, -4.429931640625, -3.74462890625, -3.059326171875, -2.3740234375, -1.688720703125, -1.00341796875, -0.318115234375, 0.3671875, 1.052490234375, 1.73779296875, 2.423095703125, 3.1083984375, 3.793701171875, 4.47900390625, 5.164306640625, 5.849609375, 6.534912109375, 7.22021484375, 7.905517578125, 8.5908203125, 9.276123046875, 9.96142578125, 10.646728515625, 11.33203125, 12.017333984375, 12.70263671875, 13.387939453125, 14.0732421875, 14.758544921875, 15.44384765625, 16.129150390625, 16.814453125, 17.499755859375, 18.18505859375, 18.870361328125, 19.5556640625, 20.240966796875, 20.92626953125, 21.611572265625, 22.296875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 3.0, 7.0, 15.0, 9.0, 14.0, 10.0, 22.0, 24.0, 28.0, 27.0, 25.0, 35.0, 32.0, 30.0, 50.0, 54.0, 98.0, 258.0, 1675.0, 115.0, 67.0, 52.0, 48.0, 39.0, 37.0, 37.0, 31.0, 25.0, 27.0, 25.0, 29.0, 15.0, 8.0, 17.0, 10.0, 8.0, 6.0, 9.0, 4.0, 2.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-26.671875, -25.935791015625, -25.19970703125, -24.463623046875, -23.7275390625, -22.991455078125, -22.25537109375, -21.519287109375, -20.783203125, -20.047119140625, -19.31103515625, -18.574951171875, -17.8388671875, -17.102783203125, -16.36669921875, -15.630615234375, -14.89453125, -14.158447265625, -13.42236328125, -12.686279296875, -11.9501953125, -11.214111328125, -10.47802734375, -9.741943359375, -9.005859375, -8.269775390625, -7.53369140625, -6.797607421875, -6.0615234375, -5.325439453125, -4.58935546875, -3.853271484375, -3.1171875, -2.381103515625, -1.64501953125, -0.908935546875, -0.1728515625, 0.563232421875, 1.29931640625, 2.035400390625, 2.771484375, 3.507568359375, 4.24365234375, 4.979736328125, 5.7158203125, 6.451904296875, 7.18798828125, 7.924072265625, 8.66015625, 9.396240234375, 10.13232421875, 10.868408203125, 11.6044921875, 12.340576171875, 13.07666015625, 13.812744140625, 14.548828125, 15.284912109375, 16.02099609375, 16.757080078125, 17.4931640625, 18.229248046875, 18.96533203125, 19.701416015625, 20.4375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 9.0, 13.0, 17.0, 20.0, 40.0, 30.0, 43.0, 55.0, 85.0, 94.0, 125.0, 234.0, 666.0, 5265.0, 3099452.0, 37421.0, 1196.0, 358.0, 137.0, 90.0, 73.0, 55.0, 45.0, 32.0, 31.0, 25.0, 17.0, 17.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.6875, -73.1396484375, -70.591796875, -68.0439453125, -65.49609375, -62.9482421875, -60.400390625, -57.8525390625, -55.3046875, -52.7568359375, -50.208984375, -47.6611328125, -45.11328125, -42.5654296875, -40.017578125, -37.4697265625, -34.921875, -32.3740234375, -29.826171875, -27.2783203125, -24.73046875, -22.1826171875, -19.634765625, -17.0869140625, -14.5390625, -11.9912109375, -9.443359375, -6.8955078125, -4.34765625, -1.7998046875, 0.748046875, 3.2958984375, 5.84375, 8.3916015625, 10.939453125, 13.4873046875, 16.03515625, 18.5830078125, 21.130859375, 23.6787109375, 26.2265625, 28.7744140625, 31.322265625, 33.8701171875, 36.41796875, 38.9658203125, 41.513671875, 44.0615234375, 46.609375, 49.1572265625, 51.705078125, 54.2529296875, 56.80078125, 59.3486328125, 61.896484375, 64.4443359375, 66.9921875, 69.5400390625, 72.087890625, 74.6357421875, 77.18359375, 79.7314453125, 82.279296875, 84.8271484375, 87.375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 43.0, 128.0, 330.0, 317.0, 148.0, 42.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.324283599853516, -19.54854965209961, -17.772815704345703, -15.997082710266113, -14.221348762512207, -12.4456148147583, -10.669881820678711, -8.894147872924805, -7.118413925170898, -5.342679977416992, -3.566946506500244, -1.791213035583496, -0.015479087829589844, 1.7602548599243164, 3.5359878540039062, 5.3117218017578125, 7.087455749511719, 8.863189697265625, 10.638923645019531, 12.414656639099121, 14.190390586853027, 15.966124534606934, 17.741857528686523, 19.51759147644043, 21.293325424194336, 23.069059371948242, 24.84479331970215, 26.620525360107422, 28.396259307861328, 30.171993255615234, 31.94772720336914, 33.72346115112305, 35.49919891357422, 37.274932861328125, 39.05066680908203, 40.82640075683594, 42.602134704589844, 44.37786865234375, 46.153602600097656, 47.92933654785156, 49.70507049560547, 51.480804443359375, 53.25653839111328, 55.03227233886719, 56.808006286621094, 58.583740234375, 60.359474182128906, 62.13520812988281, 63.91093826293945, 65.6866683959961, 67.46240234375, 69.2381362915039, 71.01387023925781, 72.78960418701172, 74.56533813476562, 76.34107208251953, 78.11680603027344, 79.89253997802734, 81.66827392578125, 83.44400787353516, 85.21974182128906, 86.99547576904297, 88.77120971679688, 90.54694366455078, 92.32267761230469]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 10.0, 8.0, 14.0, 10.0, 15.0, 23.0, 27.0, 21.0, 32.0, 31.0, 34.0, 36.0, 53.0, 43.0, 53.0, 44.0, 49.0, 38.0, 45.0, 46.0, 33.0, 29.0, 35.0, 37.0, 34.0, 20.0, 28.0, 29.0, 17.0, 19.0, 8.0, 12.0, 10.0, 7.0, 5.0, 8.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.32886505126953, -66.34992980957031, -64.37098693847656, -62.39204788208008, -60.413108825683594, -58.434173583984375, -56.45523452758789, -54.476295471191406, -52.49735641479492, -50.51841735839844, -48.53947830200195, -46.56053924560547, -44.58160400390625, -42.6026611328125, -40.62372589111328, -38.6447868347168, -36.66584777832031, -34.68690872192383, -32.707969665527344, -30.729032516479492, -28.750093460083008, -26.771154403686523, -24.792217254638672, -22.813278198242188, -20.834339141845703, -18.85540008544922, -16.876461029052734, -14.897523880004883, -12.918584823608398, -10.939645767211914, -8.960707664489746, -6.981769561767578, -5.002830505371094, -3.0238919258117676, -1.0449533462524414, 0.9339852333068848, 2.912923812866211, 4.891862869262695, 6.870800971984863, 8.849739074707031, 10.828678131103516, 12.8076171875, 14.786555290222168, 16.765493392944336, 18.74443244934082, 20.723371505737305, 22.702308654785156, 24.68124771118164, 26.660186767578125, 28.63912582397461, 30.618064880371094, 32.59700393676758, 34.57594299316406, 36.55487823486328, 38.533817291259766, 40.51275634765625, 42.491695404052734, 44.47063446044922, 46.4495735168457, 48.42851257324219, 50.407447814941406, 52.386390686035156, 54.365325927734375, 56.34426498413086, 58.323204040527344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 10.0, 12.0, 8.0, 13.0, 13.0, 14.0, 12.0, 25.0, 29.0, 23.0, 27.0, 29.0, 34.0, 29.0, 38.0, 38.0, 39.0, 39.0, 55.0, 50.0, 41.0, 48.0, 42.0, 26.0, 43.0, 33.0, 26.0, 36.0, 31.0, 27.0, 19.0, 22.0, 22.0, 13.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.248291015625, -7.97314453125, -7.697998046875, -7.4228515625, -7.147705078125, -6.87255859375, -6.597412109375, -6.322265625, -6.047119140625, -5.77197265625, -5.496826171875, -5.2216796875, -4.946533203125, -4.67138671875, -4.396240234375, -4.12109375, -3.845947265625, -3.57080078125, -3.295654296875, -3.0205078125, -2.745361328125, -2.47021484375, -2.195068359375, -1.919921875, -1.644775390625, -1.36962890625, -1.094482421875, -0.8193359375, -0.544189453125, -0.26904296875, 0.006103515625, 0.28125, 0.556396484375, 0.83154296875, 1.106689453125, 1.3818359375, 1.656982421875, 1.93212890625, 2.207275390625, 2.482421875, 2.757568359375, 3.03271484375, 3.307861328125, 3.5830078125, 3.858154296875, 4.13330078125, 4.408447265625, 4.68359375, 4.958740234375, 5.23388671875, 5.509033203125, 5.7841796875, 6.059326171875, 6.33447265625, 6.609619140625, 6.884765625, 7.159912109375, 7.43505859375, 7.710205078125, 7.9853515625, 8.260498046875, 8.53564453125, 8.810791015625, 9.0859375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 13.0, 18.0, 11.0, 20.0, 31.0, 39.0, 53.0, 60.0, 104.0, 113.0, 184.0, 248.0, 417.0, 882.0, 1782.0, 4617.0, 16554.0, 131659.0, 1760096.0, 2061407.0, 186129.0, 20219.0, 5286.0, 1994.0, 937.0, 480.0, 276.0, 155.0, 141.0, 84.0, 61.0, 53.0, 42.0, 32.0, 20.0, 10.0, 10.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.28125, -17.7109375, -17.140625, -16.5703125, -16.0, -15.4296875, -14.859375, -14.2890625, -13.71875, -13.1484375, -12.578125, -12.0078125, -11.4375, -10.8671875, -10.296875, -9.7265625, -9.15625, -8.5859375, -8.015625, -7.4453125, -6.875, -6.3046875, -5.734375, -5.1640625, -4.59375, -4.0234375, -3.453125, -2.8828125, -2.3125, -1.7421875, -1.171875, -0.6015625, -0.03125, 0.5390625, 1.109375, 1.6796875, 2.25, 2.8203125, 3.390625, 3.9609375, 4.53125, 5.1015625, 5.671875, 6.2421875, 6.8125, 7.3828125, 7.953125, 8.5234375, 9.09375, 9.6640625, 10.234375, 10.8046875, 11.375, 11.9453125, 12.515625, 13.0859375, 13.65625, 14.2265625, 14.796875, 15.3671875, 15.9375, 16.5078125, 17.078125, 17.6484375, 18.21875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 11.0, 12.0, 18.0, 35.0, 45.0, 66.0, 91.0, 147.0, 251.0, 370.0, 508.0, 627.0, 565.0, 447.0, 286.0, 167.0, 145.0, 82.0, 49.0, 41.0, 24.0, 20.0, 14.0, 10.0, 12.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.5263671875, -15.037109375, -14.5478515625, -14.05859375, -13.5693359375, -13.080078125, -12.5908203125, -12.1015625, -11.6123046875, -11.123046875, -10.6337890625, -10.14453125, -9.6552734375, -9.166015625, -8.6767578125, -8.1875, -7.6982421875, -7.208984375, -6.7197265625, -6.23046875, -5.7412109375, -5.251953125, -4.7626953125, -4.2734375, -3.7841796875, -3.294921875, -2.8056640625, -2.31640625, -1.8271484375, -1.337890625, -0.8486328125, -0.359375, 0.1298828125, 0.619140625, 1.1083984375, 1.59765625, 2.0869140625, 2.576171875, 3.0654296875, 3.5546875, 4.0439453125, 4.533203125, 5.0224609375, 5.51171875, 6.0009765625, 6.490234375, 6.9794921875, 7.46875, 7.9580078125, 8.447265625, 8.9365234375, 9.42578125, 9.9150390625, 10.404296875, 10.8935546875, 11.3828125, 11.8720703125, 12.361328125, 12.8505859375, 13.33984375, 13.8291015625, 14.318359375, 14.8076171875, 15.296875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 14.0, 13.0, 26.0, 18.0, 30.0, 31.0, 45.0, 47.0, 76.0, 109.0, 106.0, 189.0, 276.0, 536.0, 1224.0, 4531.0, 41123.0, 2481571.0, 1626001.0, 31676.0, 4043.0, 1138.0, 479.0, 254.0, 183.0, 133.0, 89.0, 65.0, 56.0, 40.0, 35.0, 21.0, 20.0, 15.0, 12.0, 6.0, 4.0, 8.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.9375, -35.744140625, -34.55078125, -33.357421875, -32.1640625, -30.970703125, -29.77734375, -28.583984375, -27.390625, -26.197265625, -25.00390625, -23.810546875, -22.6171875, -21.423828125, -20.23046875, -19.037109375, -17.84375, -16.650390625, -15.45703125, -14.263671875, -13.0703125, -11.876953125, -10.68359375, -9.490234375, -8.296875, -7.103515625, -5.91015625, -4.716796875, -3.5234375, -2.330078125, -1.13671875, 0.056640625, 1.25, 2.443359375, 3.63671875, 4.830078125, 6.0234375, 7.216796875, 8.41015625, 9.603515625, 10.796875, 11.990234375, 13.18359375, 14.376953125, 15.5703125, 16.763671875, 17.95703125, 19.150390625, 20.34375, 21.537109375, 22.73046875, 23.923828125, 25.1171875, 26.310546875, 27.50390625, 28.697265625, 29.890625, 31.083984375, 32.27734375, 33.470703125, 34.6640625, 35.857421875, 37.05078125, 38.244140625, 39.4375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [37.0, 434.0, 498.0, 41.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.64754295349121, -9.361690521240234, -0.07583808898925781, 9.210014343261719, 18.495866775512695, 27.78171730041504, 37.06757354736328, 46.353424072265625, 55.63927459716797, 64.92512512207031, 74.21098327636719, 83.49683380126953, 92.78268432617188, 102.06853485107422, 111.35438537597656, 120.64024353027344, 129.9261016845703, 139.2119598388672, 148.497802734375, 157.78366088867188, 167.06951904296875, 176.35536193847656, 185.64122009277344, 194.92706298828125, 204.21292114257812, 213.498779296875, 222.7846221923828, 232.0704803466797, 241.3563232421875, 250.64218139648438, 259.92803955078125, 269.2138977050781, 278.499755859375, 287.7856140136719, 297.07147216796875, 306.3572998046875, 315.6431579589844, 324.92901611328125, 334.2148742675781, 343.500732421875, 352.78656005859375, 362.0724182128906, 371.3582763671875, 380.64410400390625, 389.9299621582031, 399.2158203125, 408.5016784667969, 417.78753662109375, 427.0733947753906, 436.3592529296875, 445.6451110839844, 454.9309387207031, 464.216796875, 473.5026550292969, 482.78851318359375, 492.0743713378906, 501.3602294921875, 510.6460876464844, 519.9319458007812, 529.2177734375, 538.503662109375, 547.7894897460938, 557.0753173828125, 566.3612060546875, 575.6470336914062]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 7.0, 6.0, 12.0, 14.0, 22.0, 22.0, 21.0, 27.0, 13.0, 31.0, 21.0, 32.0, 37.0, 46.0, 31.0, 39.0, 40.0, 39.0, 30.0, 42.0, 43.0, 39.0, 36.0, 31.0, 30.0, 35.0, 35.0, 21.0, 27.0, 24.0, 23.0, 17.0, 18.0, 8.0, 15.0, 11.0, 9.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.665008544921875, -37.35017395019531, -36.03533935546875, -34.72050476074219, -33.405670166015625, -32.0908317565918, -30.775997161865234, -29.461162567138672, -28.14632797241211, -26.831493377685547, -25.516658782958984, -24.20182228088379, -22.886987686157227, -21.572153091430664, -20.25731658935547, -18.942481994628906, -17.627647399902344, -16.31281280517578, -14.997977256774902, -13.683141708374023, -12.368307113647461, -11.053472518920898, -9.73863697052002, -8.42380142211914, -7.108966827392578, -5.794131755828857, -4.479296684265137, -3.164461612701416, -1.8496265411376953, -0.5347914695739746, 0.7800436019897461, 2.094879150390625, 3.4097137451171875, 4.724548816680908, 6.039383888244629, 7.35421895980835, 8.66905403137207, 9.983888626098633, 11.298724174499512, 12.61355972290039, 13.928394317626953, 15.243228912353516, 16.558063507080078, 17.872900009155273, 19.187734603881836, 20.5025691986084, 21.817405700683594, 23.132240295410156, 24.44707489013672, 25.76190948486328, 27.076744079589844, 28.39158058166504, 29.7064151763916, 31.021249771118164, 32.33608627319336, 33.65092086791992, 34.965755462646484, 36.28059005737305, 37.59542465209961, 38.91025924682617, 40.22509765625, 41.53993225097656, 42.854766845703125, 44.16960144042969, 45.48443603515625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 8.0, 15.0, 12.0, 7.0, 17.0, 10.0, 11.0, 17.0, 13.0, 31.0, 30.0, 22.0, 24.0, 22.0, 39.0, 19.0, 35.0, 37.0, 47.0, 39.0, 35.0, 41.0, 42.0, 32.0, 38.0, 42.0, 25.0, 41.0, 30.0, 25.0, 24.0, 29.0, 17.0, 16.0, 12.0, 21.0, 10.0, 9.0, 11.0, 5.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.21649169921875, -6.9798583984375, -6.74322509765625, -6.506591796875, -6.26995849609375, -6.0333251953125, -5.79669189453125, -5.56005859375, -5.32342529296875, -5.0867919921875, -4.85015869140625, -4.613525390625, -4.37689208984375, -4.1402587890625, -3.90362548828125, -3.6669921875, -3.43035888671875, -3.1937255859375, -2.95709228515625, -2.720458984375, -2.48382568359375, -2.2471923828125, -2.01055908203125, -1.77392578125, -1.53729248046875, -1.3006591796875, -1.06402587890625, -0.827392578125, -0.59075927734375, -0.3541259765625, -0.11749267578125, 0.119140625, 0.35577392578125, 0.5924072265625, 0.82904052734375, 1.065673828125, 1.30230712890625, 1.5389404296875, 1.77557373046875, 2.01220703125, 2.24884033203125, 2.4854736328125, 2.72210693359375, 2.958740234375, 3.19537353515625, 3.4320068359375, 3.66864013671875, 3.9052734375, 4.14190673828125, 4.3785400390625, 4.61517333984375, 4.851806640625, 5.08843994140625, 5.3250732421875, 5.56170654296875, 5.79833984375, 6.03497314453125, 6.2716064453125, 6.50823974609375, 6.744873046875, 6.98150634765625, 7.2181396484375, 7.45477294921875, 7.69140625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 10.0, 19.0, 19.0, 20.0, 36.0, 38.0, 68.0, 83.0, 176.0, 259.0, 450.0, 727.0, 1142.0, 1956.0, 3390.0, 5477.0, 9222.0, 15784.0, 27758.0, 49857.0, 94321.0, 196988.0, 293682.0, 164762.0, 80805.0, 42707.0, 24358.0, 13981.0, 8289.0, 4738.0, 2896.0, 1729.0, 1084.0, 650.0, 359.0, 267.0, 157.0, 110.0, 59.0, 47.0, 19.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0], "bins": [-1.5224609375, -1.478179931640625, -1.43389892578125, -1.389617919921875, -1.3453369140625, -1.301055908203125, -1.25677490234375, -1.212493896484375, -1.168212890625, -1.123931884765625, -1.07965087890625, -1.035369873046875, -0.9910888671875, -0.946807861328125, -0.90252685546875, -0.858245849609375, -0.81396484375, -0.769683837890625, -0.72540283203125, -0.681121826171875, -0.6368408203125, -0.592559814453125, -0.54827880859375, -0.503997802734375, -0.459716796875, -0.415435791015625, -0.37115478515625, -0.326873779296875, -0.2825927734375, -0.238311767578125, -0.19403076171875, -0.149749755859375, -0.10546875, -0.061187744140625, -0.01690673828125, 0.027374267578125, 0.0716552734375, 0.115936279296875, 0.16021728515625, 0.204498291015625, 0.248779296875, 0.293060302734375, 0.33734130859375, 0.381622314453125, 0.4259033203125, 0.470184326171875, 0.51446533203125, 0.558746337890625, 0.60302734375, 0.647308349609375, 0.69158935546875, 0.735870361328125, 0.7801513671875, 0.824432373046875, 0.86871337890625, 0.912994384765625, 0.957275390625, 1.001556396484375, 1.04583740234375, 1.090118408203125, 1.1343994140625, 1.178680419921875, 1.22296142578125, 1.267242431640625, 1.3115234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 4.0, 11.0, 8.0, 11.0, 12.0, 13.0, 9.0, 13.0, 26.0, 29.0, 24.0, 32.0, 27.0, 34.0, 32.0, 30.0, 43.0, 45.0, 35.0, 1065.0, 38.0, 41.0, 44.0, 32.0, 44.0, 34.0, 42.0, 33.0, 25.0, 25.0, 21.0, 24.0, 8.0, 14.0, 9.0, 13.0, 10.0, 7.0, 13.0, 10.0, 9.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.92578125, -4.77520751953125, -4.6246337890625, -4.47406005859375, -4.323486328125, -4.17291259765625, -4.0223388671875, -3.87176513671875, -3.72119140625, -3.57061767578125, -3.4200439453125, -3.26947021484375, -3.118896484375, -2.96832275390625, -2.8177490234375, -2.66717529296875, -2.5166015625, -2.36602783203125, -2.2154541015625, -2.06488037109375, -1.914306640625, -1.76373291015625, -1.6131591796875, -1.46258544921875, -1.31201171875, -1.16143798828125, -1.0108642578125, -0.86029052734375, -0.709716796875, -0.55914306640625, -0.4085693359375, -0.25799560546875, -0.107421875, 0.04315185546875, 0.1937255859375, 0.34429931640625, 0.494873046875, 0.64544677734375, 0.7960205078125, 0.94659423828125, 1.09716796875, 1.24774169921875, 1.3983154296875, 1.54888916015625, 1.699462890625, 1.85003662109375, 2.0006103515625, 2.15118408203125, 2.3017578125, 2.45233154296875, 2.6029052734375, 2.75347900390625, 2.904052734375, 3.05462646484375, 3.2052001953125, 3.35577392578125, 3.50634765625, 3.65692138671875, 3.8074951171875, 3.95806884765625, 4.108642578125, 4.25921630859375, 4.4097900390625, 4.56036376953125, 4.7109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 9.0, 13.0, 6.0, 14.0, 34.0, 33.0, 50.0, 76.0, 139.0, 145.0, 205.0, 333.0, 448.0, 655.0, 932.0, 1399.0, 2048.0, 3031.0, 4672.0, 6726.0, 10723.0, 16768.0, 26835.0, 44671.0, 78257.0, 149590.0, 1302719.0, 196691.0, 101638.0, 56251.0, 33494.0, 20561.0, 12984.0, 8388.0, 5397.0, 3550.0, 2402.0, 1667.0, 1113.0, 736.0, 555.0, 362.0, 245.0, 168.0, 125.0, 90.0, 63.0, 36.0, 36.0, 22.0, 13.0, 13.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-1.10546875, -1.0726776123046875, -1.039886474609375, -1.0070953369140625, -0.97430419921875, -0.9415130615234375, -0.908721923828125, -0.8759307861328125, -0.8431396484375, -0.8103485107421875, -0.777557373046875, -0.7447662353515625, -0.71197509765625, -0.6791839599609375, -0.646392822265625, -0.6136016845703125, -0.580810546875, -0.5480194091796875, -0.515228271484375, -0.4824371337890625, -0.44964599609375, -0.4168548583984375, -0.384063720703125, -0.3512725830078125, -0.3184814453125, -0.2856903076171875, -0.252899169921875, -0.2201080322265625, -0.18731689453125, -0.1545257568359375, -0.121734619140625, -0.0889434814453125, -0.05615234375, -0.0233612060546875, 0.009429931640625, 0.0422210693359375, 0.07501220703125, 0.1078033447265625, 0.140594482421875, 0.1733856201171875, 0.2061767578125, 0.2389678955078125, 0.271759033203125, 0.3045501708984375, 0.33734130859375, 0.3701324462890625, 0.402923583984375, 0.4357147216796875, 0.468505859375, 0.5012969970703125, 0.534088134765625, 0.5668792724609375, 0.59967041015625, 0.6324615478515625, 0.665252685546875, 0.6980438232421875, 0.7308349609375, 0.7636260986328125, 0.796417236328125, 0.8292083740234375, 0.86199951171875, 0.8947906494140625, 0.927581787109375, 0.9603729248046875, 0.9931640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 7.0, 7.0, 9.0, 4.0, 8.0, 15.0, 13.0, 13.0, 15.0, 30.0, 24.0, 35.0, 29.0, 38.0, 52.0, 37.0, 55.0, 56.0, 65.0, 44.0, 41.0, 49.0, 40.0, 51.0, 39.0, 37.0, 24.0, 24.0, 32.0, 20.0, 22.0, 13.0, 5.0, 8.0, 9.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019683837890625, -0.001899033784866333, -0.001829683780670166, -0.001760333776473999, -0.001690983772277832, -0.001621633768081665, -0.001552283763885498, -0.001482933759689331, -0.001413583755493164, -0.001344233751296997, -0.00127488374710083, -0.001205533742904663, -0.001136183738708496, -0.001066833734512329, -0.0009974837303161621, -0.0009281337261199951, -0.0008587837219238281, -0.0007894337177276611, -0.0007200837135314941, -0.0006507337093353271, -0.0005813837051391602, -0.0005120337009429932, -0.00044268369674682617, -0.0003733336925506592, -0.0003039836883544922, -0.0002346336841583252, -0.0001652836799621582, -9.593367576599121e-05, -2.658367156982422e-05, 4.2766332626342773e-05, 0.00011211633682250977, 0.00018146634101867676, 0.00025081634521484375, 0.00032016634941101074, 0.00038951635360717773, 0.0004588663578033447, 0.0005282163619995117, 0.0005975663661956787, 0.0006669163703918457, 0.0007362663745880127, 0.0008056163787841797, 0.0008749663829803467, 0.0009443163871765137, 0.0010136663913726807, 0.0010830163955688477, 0.0011523663997650146, 0.0012217164039611816, 0.0012910664081573486, 0.0013604164123535156, 0.0014297664165496826, 0.0014991164207458496, 0.0015684664249420166, 0.0016378164291381836, 0.0017071664333343506, 0.0017765164375305176, 0.0018458664417266846, 0.0019152164459228516, 0.0019845664501190186, 0.0020539164543151855, 0.0021232664585113525, 0.0021926164627075195, 0.0022619664669036865, 0.0023313164710998535, 0.0024006664752960205, 0.0024700164794921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 6.0, 12.0, 20.0, 16.0, 22.0, 32.0, 44.0, 54.0, 59.0, 72.0, 111.0, 167.0, 279.0, 573.0, 2321.0, 966870.0, 75853.0, 944.0, 402.0, 180.0, 128.0, 77.0, 68.0, 41.0, 43.0, 34.0, 15.0, 28.0, 16.0, 8.0, 5.0, 8.0, 9.0, 7.0, 5.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.057708740234375, -0.056049346923828125, -0.05438995361328125, -0.052730560302734375, -0.0510711669921875, -0.049411773681640625, -0.04775238037109375, -0.046092987060546875, -0.04443359375, -0.042774200439453125, -0.04111480712890625, -0.039455413818359375, -0.0377960205078125, -0.036136627197265625, -0.03447723388671875, -0.032817840576171875, -0.031158447265625, -0.029499053955078125, -0.02783966064453125, -0.026180267333984375, -0.0245208740234375, -0.022861480712890625, -0.02120208740234375, -0.019542694091796875, -0.01788330078125, -0.016223907470703125, -0.01456451416015625, -0.012905120849609375, -0.0112457275390625, -0.009586334228515625, -0.00792694091796875, -0.006267547607421875, -0.004608154296875, -0.002948760986328125, -0.00128936767578125, 0.000370025634765625, 0.0020294189453125, 0.003688812255859375, 0.00534820556640625, 0.007007598876953125, 0.0086669921875, 0.010326385498046875, 0.01198577880859375, 0.013645172119140625, 0.0153045654296875, 0.016963958740234375, 0.01862335205078125, 0.020282745361328125, 0.021942138671875, 0.023601531982421875, 0.02526092529296875, 0.026920318603515625, 0.0285797119140625, 0.030239105224609375, 0.03189849853515625, 0.033557891845703125, 0.03521728515625, 0.036876678466796875, 0.03853607177734375, 0.040195465087890625, 0.0418548583984375, 0.043514251708984375, 0.04517364501953125, 0.046833038330078125, 0.048492431640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 15.0, 428.0, 556.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02301296591758728, -0.02260955236852169, -0.0222061388194561, -0.02180272527039051, -0.02139931358397007, -0.02099590003490448, -0.02059248648583889, -0.0201890729367733, -0.01978565938770771, -0.01938224583864212, -0.01897883228957653, -0.01857541874051094, -0.0181720070540905, -0.01776859350502491, -0.01736517995595932, -0.01696176640689373, -0.01655835285782814, -0.01615493930876255, -0.01575152575969696, -0.015348113141953945, -0.014944699592888355, -0.01454128697514534, -0.01413787342607975, -0.01373445987701416, -0.013331047259271145, -0.012927633710205555, -0.01252422109246254, -0.01212080754339695, -0.01171739399433136, -0.01131398044526577, -0.010910567827522755, -0.010507154278457165, -0.01010374166071415, -0.00970032811164856, -0.009296915493905544, -0.008893501944839954, -0.008490088395774364, -0.00808667577803135, -0.007683262228965759, -0.007279848679900169, -0.0068764351308345795, -0.006473022047430277, -0.006069608498364687, -0.005666195414960384, -0.0052627818658947945, -0.004859368782490492, -0.004455955699086189, -0.004052542150020599, -0.0036491286009550095, -0.003245715284720063, -0.002842301968485117, -0.0024388888850808144, -0.0020354753360152245, -0.0016320622526109219, -0.0012286489363759756, -0.0008252356201410294, -0.0004218223039060831, -1.8409016774967313e-05, 0.0003850042703561485, 0.0007884175283834338, 0.00119183084461838, 0.0015952440444380045, 0.0019986573606729507, 0.002402070676907897, 0.0028054839931428432]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 11.0, 15.0, 19.0, 14.0, 21.0, 25.0, 33.0, 36.0, 38.0, 26.0, 51.0, 42.0, 45.0, 42.0, 38.0, 50.0, 58.0, 40.0, 48.0, 42.0, 27.0, 32.0, 30.0, 28.0, 25.0, 25.0, 19.0, 24.0, 15.0, 11.0, 10.0, 12.0, 10.0, 4.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011220574378967285, -0.001079595647752285, -0.0010371338576078415, -0.000994672067463398, -0.0009522102773189545, -0.000909748487174511, -0.0008672866970300674, -0.0008248249068856239, -0.0007823631167411804, -0.0007399013265967369, -0.0006974395364522934, -0.0006549777463078499, -0.0006125159561634064, -0.0005700541660189629, -0.0005275923758745193, -0.00048513058573007584, -0.0004426687955856323, -0.0004002070054411888, -0.0003577452152967453, -0.0003152834251523018, -0.0002728216350078583, -0.00023035984486341476, -0.00018789805471897125, -0.00014543626457452774, -0.00010297447443008423, -6.0512684285640717e-05, -1.8050894141197205e-05, 2.4410896003246307e-05, 6.687268614768982e-05, 0.00010933447629213333, 0.00015179626643657684, 0.00019425805658102036, 0.00023671984672546387, 0.0002791816368699074, 0.0003216434270143509, 0.0003641052171587944, 0.0004065670073032379, 0.0004490287974476814, 0.0004914905875921249, 0.0005339523777365685, 0.000576414167881012, 0.0006188759580254555, 0.000661337748169899, 0.0007037995383143425, 0.000746261328458786, 0.0007887231186032295, 0.000831184908747673, 0.0008736466988921165, 0.0009161084890365601, 0.0009585702791810036, 0.001001032069325447, 0.0010434938594698906, 0.001085955649614334, 0.0011284174397587776, 0.0011708792299032211, 0.0012133410200476646, 0.0012558028101921082, 0.0012982646003365517, 0.0013407263904809952, 0.0013831881806254387, 0.0014256499707698822, 0.0014681117609143257, 0.0015105735510587692, 0.0015530353412032127, 0.0015954971313476562]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 8.0, 15.0, 12.0, 7.0, 17.0, 10.0, 11.0, 17.0, 13.0, 31.0, 30.0, 22.0, 24.0, 22.0, 39.0, 19.0, 35.0, 37.0, 47.0, 39.0, 35.0, 41.0, 42.0, 32.0, 38.0, 42.0, 25.0, 41.0, 30.0, 25.0, 24.0, 29.0, 17.0, 16.0, 12.0, 21.0, 10.0, 9.0, 11.0, 5.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.21649169921875, -6.9798583984375, -6.74322509765625, -6.506591796875, -6.26995849609375, -6.0333251953125, -5.79669189453125, -5.56005859375, -5.32342529296875, -5.0867919921875, -4.85015869140625, -4.613525390625, -4.37689208984375, -4.1402587890625, -3.90362548828125, -3.6669921875, -3.43035888671875, -3.1937255859375, -2.95709228515625, -2.720458984375, -2.48382568359375, -2.2471923828125, -2.01055908203125, -1.77392578125, -1.53729248046875, -1.3006591796875, -1.06402587890625, -0.827392578125, -0.59075927734375, -0.3541259765625, -0.11749267578125, 0.119140625, 0.35577392578125, 0.5924072265625, 0.82904052734375, 1.065673828125, 1.30230712890625, 1.5389404296875, 1.77557373046875, 2.01220703125, 2.24884033203125, 2.4854736328125, 2.72210693359375, 2.958740234375, 3.19537353515625, 3.4320068359375, 3.66864013671875, 3.9052734375, 4.14190673828125, 4.3785400390625, 4.61517333984375, 4.851806640625, 5.08843994140625, 5.3250732421875, 5.56170654296875, 5.79833984375, 6.03497314453125, 6.2716064453125, 6.50823974609375, 6.744873046875, 6.98150634765625, 7.2181396484375, 7.45477294921875, 7.69140625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 8.0, 18.0, 26.0, 22.0, 33.0, 44.0, 56.0, 59.0, 89.0, 105.0, 159.0, 185.0, 295.0, 461.0, 859.0, 1561.0, 2860.0, 6062.0, 13895.0, 35847.0, 102981.0, 358826.0, 358114.0, 103382.0, 35623.0, 13920.0, 6124.0, 2902.0, 1511.0, 855.0, 525.0, 322.0, 214.0, 142.0, 99.0, 67.0, 84.0, 45.0, 46.0, 28.0, 21.0, 18.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.634521484375, -9.32373046875, -9.012939453125, -8.7021484375, -8.391357421875, -8.08056640625, -7.769775390625, -7.458984375, -7.148193359375, -6.83740234375, -6.526611328125, -6.2158203125, -5.905029296875, -5.59423828125, -5.283447265625, -4.97265625, -4.661865234375, -4.35107421875, -4.040283203125, -3.7294921875, -3.418701171875, -3.10791015625, -2.797119140625, -2.486328125, -2.175537109375, -1.86474609375, -1.553955078125, -1.2431640625, -0.932373046875, -0.62158203125, -0.310791015625, 0.0, 0.310791015625, 0.62158203125, 0.932373046875, 1.2431640625, 1.553955078125, 1.86474609375, 2.175537109375, 2.486328125, 2.797119140625, 3.10791015625, 3.418701171875, 3.7294921875, 4.040283203125, 4.35107421875, 4.661865234375, 4.97265625, 5.283447265625, 5.59423828125, 5.905029296875, 6.2158203125, 6.526611328125, 6.83740234375, 7.148193359375, 7.458984375, 7.769775390625, 8.08056640625, 8.391357421875, 8.7021484375, 9.012939453125, 9.32373046875, 9.634521484375, 9.9453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 12.0, 19.0, 22.0, 20.0, 26.0, 29.0, 26.0, 43.0, 36.0, 49.0, 58.0, 71.0, 83.0, 112.0, 1523.0, 296.0, 113.0, 93.0, 54.0, 48.0, 44.0, 39.0, 28.0, 25.0, 27.0, 18.0, 24.0, 14.0, 17.0, 6.0, 11.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.515625, -22.777587890625, -22.03955078125, -21.301513671875, -20.5634765625, -19.825439453125, -19.08740234375, -18.349365234375, -17.611328125, -16.873291015625, -16.13525390625, -15.397216796875, -14.6591796875, -13.921142578125, -13.18310546875, -12.445068359375, -11.70703125, -10.968994140625, -10.23095703125, -9.492919921875, -8.7548828125, -8.016845703125, -7.27880859375, -6.540771484375, -5.802734375, -5.064697265625, -4.32666015625, -3.588623046875, -2.8505859375, -2.112548828125, -1.37451171875, -0.636474609375, 0.1015625, 0.839599609375, 1.57763671875, 2.315673828125, 3.0537109375, 3.791748046875, 4.52978515625, 5.267822265625, 6.005859375, 6.743896484375, 7.48193359375, 8.219970703125, 8.9580078125, 9.696044921875, 10.43408203125, 11.172119140625, 11.91015625, 12.648193359375, 13.38623046875, 14.124267578125, 14.8623046875, 15.600341796875, 16.33837890625, 17.076416015625, 17.814453125, 18.552490234375, 19.29052734375, 20.028564453125, 20.7666015625, 21.504638671875, 22.24267578125, 22.980712890625, 23.71875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 7.0, 9.0, 9.0, 17.0, 24.0, 21.0, 31.0, 31.0, 41.0, 62.0, 73.0, 107.0, 111.0, 176.0, 234.0, 401.0, 870.0, 4010.0, 49684.0, 2580293.0, 487445.0, 18118.0, 2074.0, 643.0, 299.0, 225.0, 145.0, 122.0, 90.0, 61.0, 56.0, 53.0, 37.0, 28.0, 13.0, 12.0, 9.0, 8.0, 6.0, 11.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.921875, -29.979736328125, -29.03759765625, -28.095458984375, -27.1533203125, -26.211181640625, -25.26904296875, -24.326904296875, -23.384765625, -22.442626953125, -21.50048828125, -20.558349609375, -19.6162109375, -18.674072265625, -17.73193359375, -16.789794921875, -15.84765625, -14.905517578125, -13.96337890625, -13.021240234375, -12.0791015625, -11.136962890625, -10.19482421875, -9.252685546875, -8.310546875, -7.368408203125, -6.42626953125, -5.484130859375, -4.5419921875, -3.599853515625, -2.65771484375, -1.715576171875, -0.7734375, 0.168701171875, 1.11083984375, 2.052978515625, 2.9951171875, 3.937255859375, 4.87939453125, 5.821533203125, 6.763671875, 7.705810546875, 8.64794921875, 9.590087890625, 10.5322265625, 11.474365234375, 12.41650390625, 13.358642578125, 14.30078125, 15.242919921875, 16.18505859375, 17.127197265625, 18.0693359375, 19.011474609375, 19.95361328125, 20.895751953125, 21.837890625, 22.780029296875, 23.72216796875, 24.664306640625, 25.6064453125, 26.548583984375, 27.49072265625, 28.432861328125, 29.375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 109.0, 499.0, 340.0, 52.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.66531372070312, -65.9568862915039, -62.24845504760742, -58.54002380371094, -54.83159637451172, -51.123165130615234, -47.41473388671875, -43.70630645751953, -39.99787521362305, -36.28944396972656, -32.581016540527344, -28.87258529663086, -25.164155960083008, -21.455726623535156, -17.747295379638672, -14.03886604309082, -10.330436706542969, -6.622006893157959, -2.913577079772949, 0.7948532104492188, 4.50328254699707, 8.211711883544922, 11.920143127441406, 15.628572463989258, 19.33700180053711, 23.04543113708496, 26.753860473632812, 30.462291717529297, 34.17072296142578, 37.879150390625, 41.587581634521484, 45.29601287841797, 49.00444030761719, 52.71287155151367, 56.42129898071289, 60.129730224609375, 63.838157653808594, 67.54658508300781, 71.25502014160156, 74.96344757080078, 78.671875, 82.38030242919922, 86.08873748779297, 89.79716491699219, 93.5055923461914, 97.21401977539062, 100.92245483398438, 104.6308822631836, 108.33931732177734, 112.04774475097656, 115.75617980957031, 119.46460723876953, 123.17303466796875, 126.8814697265625, 130.58990478515625, 134.29832458496094, 138.0067596435547, 141.71519470214844, 145.42361450195312, 149.13204956054688, 152.84048461914062, 156.5489044189453, 160.25733947753906, 163.9657745361328, 167.6741943359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 8.0, 5.0, 11.0, 11.0, 10.0, 12.0, 19.0, 9.0, 23.0, 17.0, 18.0, 20.0, 26.0, 30.0, 29.0, 30.0, 41.0, 40.0, 44.0, 28.0, 30.0, 31.0, 28.0, 29.0, 40.0, 41.0, 47.0, 34.0, 36.0, 22.0, 30.0, 26.0, 30.0, 23.0, 19.0, 18.0, 14.0, 11.0, 10.0, 11.0, 6.0, 9.0, 5.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-51.13078308105469, -49.60908889770508, -48.087398529052734, -46.565704345703125, -45.04401397705078, -43.52231979370117, -42.00062561035156, -40.47893524169922, -38.95724105834961, -37.435546875, -35.913856506347656, -34.39216232299805, -32.87046813964844, -31.348777770996094, -29.827083587646484, -28.305391311645508, -26.78369903564453, -25.262006759643555, -23.740314483642578, -22.21862030029297, -20.696928024291992, -19.175235748291016, -17.653541564941406, -16.13184928894043, -14.610157012939453, -13.088464736938477, -11.566771507263184, -10.04507827758789, -8.523386001586914, -7.001693248748779, -5.4800004959106445, -3.9583072662353516, -2.436614990234375, -0.9149222373962402, 0.6067705154418945, 2.1284632682800293, 3.650156021118164, 5.171848773956299, 6.693541526794434, 8.215234756469727, 9.736927032470703, 11.25861930847168, 12.780312538146973, 14.302005767822266, 15.823698043823242, 17.34539031982422, 18.867084503173828, 20.388776779174805, 21.91046905517578, 23.432161331176758, 24.953853607177734, 26.475547790527344, 27.99724006652832, 29.518932342529297, 31.040626525878906, 32.56231689453125, 34.08401107788086, 35.60570526123047, 37.12739562988281, 38.64908981323242, 40.17078399658203, 41.692474365234375, 43.214168548583984, 44.735862731933594, 46.25755310058594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 3.0, 8.0, 6.0, 7.0, 9.0, 13.0, 9.0, 14.0, 20.0, 14.0, 23.0, 28.0, 30.0, 34.0, 20.0, 21.0, 48.0, 31.0, 40.0, 43.0, 38.0, 52.0, 38.0, 36.0, 49.0, 41.0, 34.0, 44.0, 42.0, 30.0, 25.0, 26.0, 24.0, 22.0, 9.0, 7.0, 22.0, 11.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7109375, -8.443603515625, -8.17626953125, -7.908935546875, -7.6416015625, -7.374267578125, -7.10693359375, -6.839599609375, -6.572265625, -6.304931640625, -6.03759765625, -5.770263671875, -5.5029296875, -5.235595703125, -4.96826171875, -4.700927734375, -4.43359375, -4.166259765625, -3.89892578125, -3.631591796875, -3.3642578125, -3.096923828125, -2.82958984375, -2.562255859375, -2.294921875, -2.027587890625, -1.76025390625, -1.492919921875, -1.2255859375, -0.958251953125, -0.69091796875, -0.423583984375, -0.15625, 0.111083984375, 0.37841796875, 0.645751953125, 0.9130859375, 1.180419921875, 1.44775390625, 1.715087890625, 1.982421875, 2.249755859375, 2.51708984375, 2.784423828125, 3.0517578125, 3.319091796875, 3.58642578125, 3.853759765625, 4.12109375, 4.388427734375, 4.65576171875, 4.923095703125, 5.1904296875, 5.457763671875, 5.72509765625, 5.992431640625, 6.259765625, 6.527099609375, 6.79443359375, 7.061767578125, 7.3291015625, 7.596435546875, 7.86376953125, 8.131103515625, 8.3984375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 13.0, 13.0, 12.0, 20.0, 15.0, 28.0, 17.0, 41.0, 39.0, 73.0, 159.0, 348.0, 1107.0, 5046.0, 50681.0, 1739928.0, 2310008.0, 77750.0, 6686.0, 1387.0, 417.0, 183.0, 79.0, 46.0, 25.0, 29.0, 16.0, 12.0, 13.0, 20.0, 9.0, 10.0, 12.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.5927734375, -20.794921875, -19.9970703125, -19.19921875, -18.4013671875, -17.603515625, -16.8056640625, -16.0078125, -15.2099609375, -14.412109375, -13.6142578125, -12.81640625, -12.0185546875, -11.220703125, -10.4228515625, -9.625, -8.8271484375, -8.029296875, -7.2314453125, -6.43359375, -5.6357421875, -4.837890625, -4.0400390625, -3.2421875, -2.4443359375, -1.646484375, -0.8486328125, -0.05078125, 0.7470703125, 1.544921875, 2.3427734375, 3.140625, 3.9384765625, 4.736328125, 5.5341796875, 6.33203125, 7.1298828125, 7.927734375, 8.7255859375, 9.5234375, 10.3212890625, 11.119140625, 11.9169921875, 12.71484375, 13.5126953125, 14.310546875, 15.1083984375, 15.90625, 16.7041015625, 17.501953125, 18.2998046875, 19.09765625, 19.8955078125, 20.693359375, 21.4912109375, 22.2890625, 23.0869140625, 23.884765625, 24.6826171875, 25.48046875, 26.2783203125, 27.076171875, 27.8740234375, 28.671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 2.0, 13.0, 23.0, 30.0, 28.0, 47.0, 79.0, 100.0, 147.0, 228.0, 334.0, 502.0, 663.0, 560.0, 437.0, 295.0, 194.0, 112.0, 88.0, 61.0, 42.0, 23.0, 16.0, 11.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3734130859375, -11.926513671875, -11.4796142578125, -11.03271484375, -10.5858154296875, -10.138916015625, -9.6920166015625, -9.2451171875, -8.7982177734375, -8.351318359375, -7.9044189453125, -7.45751953125, -7.0106201171875, -6.563720703125, -6.1168212890625, -5.669921875, -5.2230224609375, -4.776123046875, -4.3292236328125, -3.88232421875, -3.4354248046875, -2.988525390625, -2.5416259765625, -2.0947265625, -1.6478271484375, -1.200927734375, -0.7540283203125, -0.30712890625, 0.1397705078125, 0.586669921875, 1.0335693359375, 1.48046875, 1.9273681640625, 2.374267578125, 2.8211669921875, 3.26806640625, 3.7149658203125, 4.161865234375, 4.6087646484375, 5.0556640625, 5.5025634765625, 5.949462890625, 6.3963623046875, 6.84326171875, 7.2901611328125, 7.737060546875, 8.1839599609375, 8.630859375, 9.0777587890625, 9.524658203125, 9.9715576171875, 10.41845703125, 10.8653564453125, 11.312255859375, 11.7591552734375, 12.2060546875, 12.6529541015625, 13.099853515625, 13.5467529296875, 13.99365234375, 14.4405517578125, 14.887451171875, 15.3343505859375, 15.78125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 12.0, 15.0, 15.0, 26.0, 34.0, 55.0, 106.0, 195.0, 512.0, 1304.0, 5183.0, 41418.0, 1027099.0, 3013372.0, 92669.0, 9083.0, 1839.0, 710.0, 271.0, 135.0, 69.0, 40.0, 28.0, 31.0, 15.0, 16.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.539794921875, -26.59521484375, -25.650634765625, -24.7060546875, -23.761474609375, -22.81689453125, -21.872314453125, -20.927734375, -19.983154296875, -19.03857421875, -18.093994140625, -17.1494140625, -16.204833984375, -15.26025390625, -14.315673828125, -13.37109375, -12.426513671875, -11.48193359375, -10.537353515625, -9.5927734375, -8.648193359375, -7.70361328125, -6.759033203125, -5.814453125, -4.869873046875, -3.92529296875, -2.980712890625, -2.0361328125, -1.091552734375, -0.14697265625, 0.797607421875, 1.7421875, 2.686767578125, 3.63134765625, 4.575927734375, 5.5205078125, 6.465087890625, 7.40966796875, 8.354248046875, 9.298828125, 10.243408203125, 11.18798828125, 12.132568359375, 13.0771484375, 14.021728515625, 14.96630859375, 15.910888671875, 16.85546875, 17.800048828125, 18.74462890625, 19.689208984375, 20.6337890625, 21.578369140625, 22.52294921875, 23.467529296875, 24.412109375, 25.356689453125, 26.30126953125, 27.245849609375, 28.1904296875, 29.135009765625, 30.07958984375, 31.024169921875, 31.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 12.0, 41.0, 81.0, 145.0, 173.0, 210.0, 157.0, 81.0, 67.0, 26.0, 12.0, 3.0, 1.0], "bins": [-129.12672424316406, -126.8286361694336, -124.53054809570312, -122.23246002197266, -119.93437194824219, -117.63627624511719, -115.33818817138672, -113.04010009765625, -110.74201202392578, -108.44392395019531, -106.14583587646484, -103.84774780273438, -101.54965209960938, -99.2515640258789, -96.95347595214844, -94.65538787841797, -92.3572998046875, -90.05921173095703, -87.76112365722656, -85.4630355834961, -83.16494750976562, -80.86685180664062, -78.56876373291016, -76.27067565917969, -73.97258758544922, -71.67449951171875, -69.37641143798828, -67.07832336425781, -64.78022766113281, -62.48214340209961, -60.184051513671875, -57.885963439941406, -55.58788299560547, -53.289794921875, -50.99170684814453, -48.6936149597168, -46.39552688598633, -44.09743881225586, -41.799346923828125, -39.501258850097656, -37.20317077636719, -34.90508270263672, -32.60699462890625, -30.308902740478516, -28.010814666748047, -25.712726593017578, -23.414636611938477, -21.116546630859375, -18.818456649780273, -16.520366668701172, -14.222278594970703, -11.924189567565918, -9.626100540161133, -7.328011512756348, -5.0299224853515625, -2.731832504272461, -0.4337444305419922, 1.864344596862793, 4.162433624267578, 6.460522651672363, 8.758611679077148, 11.056700706481934, 13.354789733886719, 15.65287971496582, 17.95096778869629]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 6.0, 11.0, 7.0, 16.0, 21.0, 23.0, 26.0, 25.0, 23.0, 30.0, 29.0, 43.0, 29.0, 37.0, 40.0, 50.0, 42.0, 42.0, 42.0, 37.0, 53.0, 47.0, 43.0, 40.0, 35.0, 33.0, 26.0, 29.0, 25.0, 22.0, 9.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.24957275390625, -42.88689422607422, -41.52421569824219, -40.161537170410156, -38.798858642578125, -37.436180114746094, -36.07350158691406, -34.71082305908203, -33.34814453125, -31.98546600341797, -30.622787475585938, -29.260108947753906, -27.897430419921875, -26.534751892089844, -25.172073364257812, -23.80939483642578, -22.44671630859375, -21.08403778076172, -19.721359252929688, -18.358680725097656, -16.996002197265625, -15.633323669433594, -14.270645141601562, -12.907966613769531, -11.5452880859375, -10.182609558105469, -8.819931030273438, -7.457252502441406, -6.094573974609375, -4.731895446777344, -3.3692169189453125, -2.0065383911132812, -0.64385986328125, 0.7188186645507812, 2.0814971923828125, 3.4441757202148438, 4.806854248046875, 6.169532775878906, 7.5322113037109375, 8.894889831542969, 10.257568359375, 11.620246887207031, 12.982925415039062, 14.345603942871094, 15.708282470703125, 17.070960998535156, 18.433639526367188, 19.79631805419922, 21.15899658203125, 22.52167510986328, 23.884353637695312, 25.247032165527344, 26.609710693359375, 27.972389221191406, 29.335067749023438, 30.69774627685547, 32.0604248046875, 33.42310333251953, 34.78578186035156, 36.148460388183594, 37.511138916015625, 38.873817443847656, 40.23649597167969, 41.59917449951172, 42.96185302734375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 10.0, 9.0, 9.0, 13.0, 15.0, 19.0, 17.0, 27.0, 27.0, 32.0, 30.0, 31.0, 17.0, 25.0, 43.0, 30.0, 32.0, 37.0, 31.0, 39.0, 49.0, 33.0, 36.0, 37.0, 37.0, 31.0, 25.0, 31.0, 23.0, 20.0, 24.0, 17.0, 7.0, 18.0, 19.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.71875, -7.47515869140625, -7.2315673828125, -6.98797607421875, -6.744384765625, -6.50079345703125, -6.2572021484375, -6.01361083984375, -5.77001953125, -5.52642822265625, -5.2828369140625, -5.03924560546875, -4.795654296875, -4.55206298828125, -4.3084716796875, -4.06488037109375, -3.8212890625, -3.57769775390625, -3.3341064453125, -3.09051513671875, -2.846923828125, -2.60333251953125, -2.3597412109375, -2.11614990234375, -1.87255859375, -1.62896728515625, -1.3853759765625, -1.14178466796875, -0.898193359375, -0.65460205078125, -0.4110107421875, -0.16741943359375, 0.076171875, 0.31976318359375, 0.5633544921875, 0.80694580078125, 1.050537109375, 1.29412841796875, 1.5377197265625, 1.78131103515625, 2.02490234375, 2.26849365234375, 2.5120849609375, 2.75567626953125, 2.999267578125, 3.24285888671875, 3.4864501953125, 3.73004150390625, 3.9736328125, 4.21722412109375, 4.4608154296875, 4.70440673828125, 4.947998046875, 5.19158935546875, 5.4351806640625, 5.67877197265625, 5.92236328125, 6.16595458984375, 6.4095458984375, 6.65313720703125, 6.896728515625, 7.14031982421875, 7.3839111328125, 7.62750244140625, 7.87109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 16.0, 19.0, 30.0, 46.0, 57.0, 92.0, 130.0, 194.0, 267.0, 452.0, 596.0, 937.0, 1408.0, 2177.0, 3265.0, 4907.0, 7937.0, 11961.0, 19186.0, 30842.0, 50988.0, 87215.0, 158544.0, 244665.0, 176868.0, 97483.0, 56293.0, 33767.0, 20802.0, 12924.0, 8560.0, 5399.0, 3536.0, 2364.0, 1508.0, 1010.0, 694.0, 426.0, 340.0, 216.0, 138.0, 99.0, 63.0, 47.0, 21.0, 19.0, 13.0, 12.0, 9.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2119140625, -1.173553466796875, -1.13519287109375, -1.096832275390625, -1.0584716796875, -1.020111083984375, -0.98175048828125, -0.943389892578125, -0.905029296875, -0.866668701171875, -0.82830810546875, -0.789947509765625, -0.7515869140625, -0.713226318359375, -0.67486572265625, -0.636505126953125, -0.59814453125, -0.559783935546875, -0.52142333984375, -0.483062744140625, -0.4447021484375, -0.406341552734375, -0.36798095703125, -0.329620361328125, -0.291259765625, -0.252899169921875, -0.21453857421875, -0.176177978515625, -0.1378173828125, -0.099456787109375, -0.06109619140625, -0.022735595703125, 0.015625, 0.053985595703125, 0.09234619140625, 0.130706787109375, 0.1690673828125, 0.207427978515625, 0.24578857421875, 0.284149169921875, 0.322509765625, 0.360870361328125, 0.39923095703125, 0.437591552734375, 0.4759521484375, 0.514312744140625, 0.55267333984375, 0.591033935546875, 0.62939453125, 0.667755126953125, 0.70611572265625, 0.744476318359375, 0.7828369140625, 0.821197509765625, 0.85955810546875, 0.897918701171875, 0.936279296875, 0.974639892578125, 1.01300048828125, 1.051361083984375, 1.0897216796875, 1.128082275390625, 1.16644287109375, 1.204803466796875, 1.2431640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 4.0, 11.0, 11.0, 13.0, 11.0, 16.0, 18.0, 19.0, 20.0, 33.0, 20.0, 29.0, 26.0, 29.0, 36.0, 33.0, 42.0, 47.0, 28.0, 45.0, 1069.0, 42.0, 40.0, 32.0, 34.0, 39.0, 32.0, 23.0, 26.0, 31.0, 24.0, 17.0, 18.0, 11.0, 11.0, 13.0, 11.0, 7.0, 8.0, 8.0, 4.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.2998046875, -5.134765625, -4.9697265625, -4.8046875, -4.6396484375, -4.474609375, -4.3095703125, -4.14453125, -3.9794921875, -3.814453125, -3.6494140625, -3.484375, -3.3193359375, -3.154296875, -2.9892578125, -2.82421875, -2.6591796875, -2.494140625, -2.3291015625, -2.1640625, -1.9990234375, -1.833984375, -1.6689453125, -1.50390625, -1.3388671875, -1.173828125, -1.0087890625, -0.84375, -0.6787109375, -0.513671875, -0.3486328125, -0.18359375, -0.0185546875, 0.146484375, 0.3115234375, 0.4765625, 0.6416015625, 0.806640625, 0.9716796875, 1.13671875, 1.3017578125, 1.466796875, 1.6318359375, 1.796875, 1.9619140625, 2.126953125, 2.2919921875, 2.45703125, 2.6220703125, 2.787109375, 2.9521484375, 3.1171875, 3.2822265625, 3.447265625, 3.6123046875, 3.77734375, 3.9423828125, 4.107421875, 4.2724609375, 4.4375, 4.6025390625, 4.767578125, 4.9326171875, 5.09765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 11.0, 12.0, 18.0, 28.0, 40.0, 61.0, 102.0, 111.0, 185.0, 276.0, 393.0, 546.0, 801.0, 1161.0, 1651.0, 2425.0, 3586.0, 5315.0, 8161.0, 12355.0, 19315.0, 30482.0, 48677.0, 82923.0, 149568.0, 1282846.0, 183908.0, 101744.0, 58508.0, 36091.0, 22511.0, 14618.0, 9505.0, 6218.0, 4129.0, 2769.0, 1925.0, 1308.0, 908.0, 577.0, 417.0, 291.0, 216.0, 144.0, 98.0, 66.0, 41.0, 28.0, 29.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0078125, -0.9759979248046875, -0.944183349609375, -0.9123687744140625, -0.88055419921875, -0.8487396240234375, -0.816925048828125, -0.7851104736328125, -0.7532958984375, -0.7214813232421875, -0.689666748046875, -0.6578521728515625, -0.62603759765625, -0.5942230224609375, -0.562408447265625, -0.5305938720703125, -0.498779296875, -0.4669647216796875, -0.435150146484375, -0.4033355712890625, -0.37152099609375, -0.3397064208984375, -0.307891845703125, -0.2760772705078125, -0.2442626953125, -0.2124481201171875, -0.180633544921875, -0.1488189697265625, -0.11700439453125, -0.0851898193359375, -0.053375244140625, -0.0215606689453125, 0.01025390625, 0.0420684814453125, 0.073883056640625, 0.1056976318359375, 0.13751220703125, 0.1693267822265625, 0.201141357421875, 0.2329559326171875, 0.2647705078125, 0.2965850830078125, 0.328399658203125, 0.3602142333984375, 0.39202880859375, 0.4238433837890625, 0.455657958984375, 0.4874725341796875, 0.519287109375, 0.5511016845703125, 0.582916259765625, 0.6147308349609375, 0.64654541015625, 0.6783599853515625, 0.710174560546875, 0.7419891357421875, 0.7738037109375, 0.8056182861328125, 0.837432861328125, 0.8692474365234375, 0.90106201171875, 0.9328765869140625, 0.964691162109375, 0.9965057373046875, 1.0283203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 4.0, 8.0, 13.0, 9.0, 10.0, 11.0, 19.0, 24.0, 34.0, 30.0, 44.0, 54.0, 62.0, 73.0, 75.0, 65.0, 68.0, 60.0, 58.0, 34.0, 48.0, 45.0, 24.0, 35.0, 17.0, 28.0, 12.0, 13.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.00455474853515625, -0.004450559616088867, -0.004346370697021484, -0.0042421817779541016, -0.004137992858886719, -0.004033803939819336, -0.003929615020751953, -0.0038254261016845703, -0.0037212371826171875, -0.0036170482635498047, -0.003512859344482422, -0.003408670425415039, -0.0033044815063476562, -0.0032002925872802734, -0.0030961036682128906, -0.002991914749145508, -0.002887725830078125, -0.002783536911010742, -0.0026793479919433594, -0.0025751590728759766, -0.0024709701538085938, -0.002366781234741211, -0.002262592315673828, -0.0021584033966064453, -0.0020542144775390625, -0.0019500255584716797, -0.0018458366394042969, -0.001741647720336914, -0.0016374588012695312, -0.0015332698822021484, -0.0014290809631347656, -0.0013248920440673828, -0.001220703125, -0.0011165142059326172, -0.0010123252868652344, -0.0009081363677978516, -0.0008039474487304688, -0.0006997585296630859, -0.0005955696105957031, -0.0004913806915283203, -0.0003871917724609375, -0.0002830028533935547, -0.00017881393432617188, -7.462501525878906e-05, 2.956390380859375e-05, 0.00013375282287597656, 0.00023794174194335938, 0.0003421306610107422, 0.000446319580078125, 0.0005505084991455078, 0.0006546974182128906, 0.0007588863372802734, 0.0008630752563476562, 0.0009672641754150391, 0.0010714530944824219, 0.0011756420135498047, 0.0012798309326171875, 0.0013840198516845703, 0.0014882087707519531, 0.001592397689819336, 0.0016965866088867188, 0.0018007755279541016, 0.0019049644470214844, 0.002009153366088867, 0.00211334228515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 14.0, 10.0, 17.0, 19.0, 26.0, 46.0, 50.0, 63.0, 103.0, 124.0, 212.0, 480.0, 1345.0, 986902.0, 57281.0, 834.0, 364.0, 219.0, 104.0, 83.0, 60.0, 51.0, 32.0, 28.0, 17.0, 17.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04730224609375, -0.04503059387207031, -0.042758941650390625, -0.04048728942871094, -0.03821563720703125, -0.03594398498535156, -0.033672332763671875, -0.03140068054199219, -0.0291290283203125, -0.026857376098632812, -0.024585723876953125, -0.022314071655273438, -0.02004241943359375, -0.017770767211914062, -0.015499114990234375, -0.013227462768554688, -0.010955810546875, -0.008684158325195312, -0.006412506103515625, -0.0041408538818359375, -0.00186920166015625, 0.0004024505615234375, 0.002674102783203125, 0.0049457550048828125, 0.0072174072265625, 0.009489059448242188, 0.011760711669921875, 0.014032363891601562, 0.01630401611328125, 0.018575668334960938, 0.020847320556640625, 0.023118972778320312, 0.025390625, 0.027662277221679688, 0.029933929443359375, 0.03220558166503906, 0.03447723388671875, 0.03674888610839844, 0.039020538330078125, 0.04129219055175781, 0.0435638427734375, 0.04583549499511719, 0.048107147216796875, 0.05037879943847656, 0.05265045166015625, 0.05492210388183594, 0.057193756103515625, 0.05946540832519531, 0.061737060546875, 0.06400871276855469, 0.06628036499023438, 0.06855201721191406, 0.07082366943359375, 0.07309532165527344, 0.07536697387695312, 0.07763862609863281, 0.0799102783203125, 0.08218193054199219, 0.08445358276367188, 0.08672523498535156, 0.08899688720703125, 0.09126853942871094, 0.09354019165039062, 0.09581184387207031, 0.09808349609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 838.0, 159.0, 2.0, 1.0, 1.0], "bins": [-0.03422731161117554, -0.033654142171144485, -0.033080969005823135, -0.032507799565792084, -0.031934626400470734, -0.03136145696043968, -0.03078828565776348, -0.03021511435508728, -0.02964194305241108, -0.02906877174973488, -0.028495600447058678, -0.027922429144382477, -0.027349259704351425, -0.026776088401675224, -0.026202917098999023, -0.025629745796322823, -0.02505657449364662, -0.02448340319097042, -0.02391023188829422, -0.02333706244826317, -0.022763891145586967, -0.022190719842910767, -0.021617548540234566, -0.021044377237558365, -0.020471207797527313, -0.019898036494851112, -0.01932486519217491, -0.01875169575214386, -0.01817852444946766, -0.017605353146791458, -0.017032181844115257, -0.016459010541439056, -0.015885837376117706, -0.015312666073441505, -0.01473949570208788, -0.014166324399411678, -0.013593153096735477, -0.013019982725381851, -0.01244681142270565, -0.01187364012002945, -0.011300469748675823, -0.010727298445999622, -0.010154128074645996, -0.009580956771969795, -0.009007785469293594, -0.008434614166617393, -0.007861443795263767, -0.007288272492587566, -0.00671510212123394, -0.0061419312842190266, -0.005568759981542826, -0.004995589144527912, -0.004422417841851711, -0.0038492470048367977, -0.003276076167821884, -0.0027029048651456833, -0.002129733795300126, -0.0015565627254545689, -0.0009833917720243335, -0.0004102208185940981, 0.00016295025125145912, 0.0007361213210970163, 0.00130929215811193, 0.0018824634607881308, 0.0024556342978030443]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 8.0, 4.0, 4.0, 11.0, 8.0, 17.0, 14.0, 21.0, 23.0, 22.0, 31.0, 27.0, 30.0, 36.0, 48.0, 37.0, 47.0, 41.0, 37.0, 42.0, 42.0, 44.0, 46.0, 40.0, 30.0, 28.0, 35.0, 34.0, 34.0, 15.0, 23.0, 19.0, 20.0, 15.0, 10.0, 10.0, 11.0, 7.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0014938712120056152, -0.0014473311603069305, -0.0014007911086082458, -0.0013542510569095612, -0.0013077110052108765, -0.0012611709535121918, -0.001214630901813507, -0.0011680908501148224, -0.0011215507984161377, -0.001075010746717453, -0.0010284706950187683, -0.0009819306433200836, -0.0009353905916213989, -0.0008888505399227142, -0.0008423104882240295, -0.0007957704365253448, -0.0007492303848266602, -0.0007026903331279755, -0.0006561502814292908, -0.0006096102297306061, -0.0005630701780319214, -0.0005165301263332367, -0.000469990074634552, -0.0004234500229358673, -0.0003769099712371826, -0.0003303699195384979, -0.00028382986783981323, -0.00023728981614112854, -0.00019074976444244385, -0.00014420971274375916, -9.766966104507446e-05, -5.112960934638977e-05, -4.589557647705078e-06, 4.1950494050979614e-05, 8.84905457496643e-05, 0.000135030597448349, 0.0001815706491470337, 0.00022811070084571838, 0.0002746507525444031, 0.00032119080424308777, 0.00036773085594177246, 0.00041427090764045715, 0.00046081095933914185, 0.0005073510110378265, 0.0005538910627365112, 0.0006004311144351959, 0.0006469711661338806, 0.0006935112178325653, 0.00074005126953125, 0.0007865913212299347, 0.0008331313729286194, 0.0008796714246273041, 0.0009262114763259888, 0.0009727515280246735, 0.0010192915797233582, 0.0010658316314220428, 0.0011123716831207275, 0.0011589117348194122, 0.001205451786518097, 0.0012519918382167816, 0.0012985318899154663, 0.001345071941614151, 0.0013916119933128357, 0.0014381520450115204, 0.001484692096710205]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 10.0, 9.0, 9.0, 13.0, 15.0, 19.0, 17.0, 27.0, 27.0, 32.0, 30.0, 31.0, 17.0, 25.0, 43.0, 30.0, 32.0, 37.0, 32.0, 38.0, 49.0, 33.0, 36.0, 37.0, 37.0, 31.0, 25.0, 31.0, 24.0, 19.0, 24.0, 17.0, 7.0, 18.0, 19.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.71875, -7.47515869140625, -7.2315673828125, -6.98797607421875, -6.744384765625, -6.50079345703125, -6.2572021484375, -6.01361083984375, -5.77001953125, -5.52642822265625, -5.2828369140625, -5.03924560546875, -4.795654296875, -4.55206298828125, -4.3084716796875, -4.06488037109375, -3.8212890625, -3.57769775390625, -3.3341064453125, -3.09051513671875, -2.846923828125, -2.60333251953125, -2.3597412109375, -2.11614990234375, -1.87255859375, -1.62896728515625, -1.3853759765625, -1.14178466796875, -0.898193359375, -0.65460205078125, -0.4110107421875, -0.16741943359375, 0.076171875, 0.31976318359375, 0.5633544921875, 0.80694580078125, 1.050537109375, 1.29412841796875, 1.5377197265625, 1.78131103515625, 2.02490234375, 2.26849365234375, 2.5120849609375, 2.75567626953125, 2.999267578125, 3.24285888671875, 3.4864501953125, 3.73004150390625, 3.9736328125, 4.21722412109375, 4.4608154296875, 4.70440673828125, 4.947998046875, 5.19158935546875, 5.4351806640625, 5.67877197265625, 5.92236328125, 6.16595458984375, 6.4095458984375, 6.65313720703125, 6.896728515625, 7.14031982421875, 7.3839111328125, 7.62750244140625, 7.87109375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 5.0, 6.0, 12.0, 11.0, 23.0, 32.0, 41.0, 38.0, 65.0, 72.0, 129.0, 177.0, 238.0, 329.0, 542.0, 764.0, 1350.0, 2310.0, 4629.0, 10586.0, 29583.0, 93945.0, 315275.0, 396628.0, 126760.0, 38657.0, 13520.0, 5573.0, 2799.0, 1535.0, 962.0, 635.0, 365.0, 257.0, 165.0, 141.0, 112.0, 76.0, 39.0, 39.0, 35.0, 29.0, 11.0, 15.0, 12.0, 7.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.6072998046875, -10.277099609375, -9.9468994140625, -9.61669921875, -9.2864990234375, -8.956298828125, -8.6260986328125, -8.2958984375, -7.9656982421875, -7.635498046875, -7.3052978515625, -6.97509765625, -6.6448974609375, -6.314697265625, -5.9844970703125, -5.654296875, -5.3240966796875, -4.993896484375, -4.6636962890625, -4.33349609375, -4.0032958984375, -3.673095703125, -3.3428955078125, -3.0126953125, -2.6824951171875, -2.352294921875, -2.0220947265625, -1.69189453125, -1.3616943359375, -1.031494140625, -0.7012939453125, -0.37109375, -0.0408935546875, 0.289306640625, 0.6195068359375, 0.94970703125, 1.2799072265625, 1.610107421875, 1.9403076171875, 2.2705078125, 2.6007080078125, 2.930908203125, 3.2611083984375, 3.59130859375, 3.9215087890625, 4.251708984375, 4.5819091796875, 4.912109375, 5.2423095703125, 5.572509765625, 5.9027099609375, 6.23291015625, 6.5631103515625, 6.893310546875, 7.2235107421875, 7.5537109375, 7.8839111328125, 8.214111328125, 8.5443115234375, 8.87451171875, 9.2047119140625, 9.534912109375, 9.8651123046875, 10.1953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 12.0, 10.0, 13.0, 24.0, 10.0, 28.0, 16.0, 34.0, 33.0, 43.0, 43.0, 36.0, 58.0, 67.0, 96.0, 236.0, 1555.0, 196.0, 104.0, 60.0, 58.0, 41.0, 46.0, 37.0, 27.0, 37.0, 29.0, 16.0, 18.0, 15.0, 10.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.7236328125, -20.931640625, -20.1396484375, -19.34765625, -18.5556640625, -17.763671875, -16.9716796875, -16.1796875, -15.3876953125, -14.595703125, -13.8037109375, -13.01171875, -12.2197265625, -11.427734375, -10.6357421875, -9.84375, -9.0517578125, -8.259765625, -7.4677734375, -6.67578125, -5.8837890625, -5.091796875, -4.2998046875, -3.5078125, -2.7158203125, -1.923828125, -1.1318359375, -0.33984375, 0.4521484375, 1.244140625, 2.0361328125, 2.828125, 3.6201171875, 4.412109375, 5.2041015625, 5.99609375, 6.7880859375, 7.580078125, 8.3720703125, 9.1640625, 9.9560546875, 10.748046875, 11.5400390625, 12.33203125, 13.1240234375, 13.916015625, 14.7080078125, 15.5, 16.2919921875, 17.083984375, 17.8759765625, 18.66796875, 19.4599609375, 20.251953125, 21.0439453125, 21.8359375, 22.6279296875, 23.419921875, 24.2119140625, 25.00390625, 25.7958984375, 26.587890625, 27.3798828125, 28.171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 15.0, 18.0, 22.0, 32.0, 43.0, 47.0, 56.0, 115.0, 198.0, 282.0, 515.0, 1065.0, 12268.0, 2788796.0, 336438.0, 3876.0, 769.0, 349.0, 227.0, 148.0, 88.0, 95.0, 57.0, 46.0, 36.0, 26.0, 24.0, 17.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.5, -50.99267578125, -49.4853515625, -47.97802734375, -46.470703125, -44.96337890625, -43.4560546875, -41.94873046875, -40.44140625, -38.93408203125, -37.4267578125, -35.91943359375, -34.412109375, -32.90478515625, -31.3974609375, -29.89013671875, -28.3828125, -26.87548828125, -25.3681640625, -23.86083984375, -22.353515625, -20.84619140625, -19.3388671875, -17.83154296875, -16.32421875, -14.81689453125, -13.3095703125, -11.80224609375, -10.294921875, -8.78759765625, -7.2802734375, -5.77294921875, -4.265625, -2.75830078125, -1.2509765625, 0.25634765625, 1.763671875, 3.27099609375, 4.7783203125, 6.28564453125, 7.79296875, 9.30029296875, 10.8076171875, 12.31494140625, 13.822265625, 15.32958984375, 16.8369140625, 18.34423828125, 19.8515625, 21.35888671875, 22.8662109375, 24.37353515625, 25.880859375, 27.38818359375, 28.8955078125, 30.40283203125, 31.91015625, 33.41748046875, 34.9248046875, 36.43212890625, 37.939453125, 39.44677734375, 40.9541015625, 42.46142578125, 43.96875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 133.0, 771.0, 100.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-325.0115661621094, -318.57366943359375, -312.1357727050781, -305.6978759765625, -299.25994873046875, -292.8220520019531, -286.3841552734375, -279.9462585449219, -273.50836181640625, -267.0704650878906, -260.632568359375, -254.1946563720703, -247.7567596435547, -241.31886291503906, -234.88095092773438, -228.44305419921875, -222.00515747070312, -215.5672607421875, -209.12936401367188, -202.6914520263672, -196.25355529785156, -189.81565856933594, -183.37774658203125, -176.93984985351562, -170.501953125, -164.06405639648438, -157.62615966796875, -151.18824768066406, -144.75035095214844, -138.3124542236328, -131.87454223632812, -125.4366455078125, -118.99876403808594, -112.56086730957031, -106.12296295166016, -99.68505859375, -93.24716186523438, -86.80926513671875, -80.3713607788086, -73.93345642089844, -67.49555969238281, -61.05765914916992, -54.61975860595703, -48.18185806274414, -41.74395751953125, -35.30605697631836, -28.86815643310547, -22.430255889892578, -15.992355346679688, -9.554454803466797, -3.1165542602539062, 3.3213462829589844, 9.759246826171875, 16.197147369384766, 22.635047912597656, 29.072948455810547, 35.51084899902344, 41.94874954223633, 48.38665008544922, 54.82455062866211, 61.262451171875, 67.70034790039062, 74.13825225830078, 80.57615661621094, 87.01405334472656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 7.0, 5.0, 12.0, 14.0, 14.0, 18.0, 23.0, 24.0, 24.0, 27.0, 22.0, 34.0, 32.0, 54.0, 43.0, 43.0, 49.0, 51.0, 44.0, 45.0, 39.0, 33.0, 34.0, 40.0, 48.0, 26.0, 25.0, 23.0, 22.0, 24.0, 16.0, 12.0, 12.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-61.96592330932617, -60.257659912109375, -58.54939270019531, -56.841129302978516, -55.13286590576172, -53.424598693847656, -51.71633529663086, -50.00807189941406, -48.2998046875, -46.5915412902832, -44.88327407836914, -43.175010681152344, -41.46674346923828, -39.758480072021484, -38.05021667480469, -36.341949462890625, -34.63368606567383, -32.92542266845703, -31.21715545654297, -29.508892059326172, -27.800626754760742, -26.092361450195312, -24.384098052978516, -22.675832748413086, -20.967567443847656, -19.259302139282227, -17.551036834716797, -15.8427734375, -14.13450813293457, -12.42624282836914, -10.717978477478027, -9.009714126586914, -7.30145263671875, -5.5931878089904785, -3.884922981262207, -2.1766581535339355, -0.46839332580566406, 1.2398719787597656, 2.948136329650879, 4.656400680541992, 6.364665985107422, 8.072931289672852, 9.781195640563965, 11.489459991455078, 13.197725296020508, 14.905990600585938, 16.614253997802734, 18.322519302368164, 20.030784606933594, 21.739049911499023, 23.447315216064453, 25.15557861328125, 26.86384391784668, 28.57210922241211, 30.280372619628906, 31.988637924194336, 33.696903228759766, 35.40516662597656, 37.113433837890625, 38.82169723510742, 40.52996063232422, 42.23822784423828, 43.94649124145508, 45.654754638671875, 47.36302185058594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 11.0, 7.0, 14.0, 15.0, 11.0, 27.0, 14.0, 24.0, 22.0, 27.0, 28.0, 21.0, 38.0, 27.0, 39.0, 39.0, 35.0, 39.0, 38.0, 50.0, 37.0, 48.0, 38.0, 31.0, 32.0, 37.0, 32.0, 31.0, 19.0, 24.0, 21.0, 12.0, 15.0, 10.0, 14.0, 11.0, 13.0, 10.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9375, -8.6708984375, -8.404296875, -8.1376953125, -7.87109375, -7.6044921875, -7.337890625, -7.0712890625, -6.8046875, -6.5380859375, -6.271484375, -6.0048828125, -5.73828125, -5.4716796875, -5.205078125, -4.9384765625, -4.671875, -4.4052734375, -4.138671875, -3.8720703125, -3.60546875, -3.3388671875, -3.072265625, -2.8056640625, -2.5390625, -2.2724609375, -2.005859375, -1.7392578125, -1.47265625, -1.2060546875, -0.939453125, -0.6728515625, -0.40625, -0.1396484375, 0.126953125, 0.3935546875, 0.66015625, 0.9267578125, 1.193359375, 1.4599609375, 1.7265625, 1.9931640625, 2.259765625, 2.5263671875, 2.79296875, 3.0595703125, 3.326171875, 3.5927734375, 3.859375, 4.1259765625, 4.392578125, 4.6591796875, 4.92578125, 5.1923828125, 5.458984375, 5.7255859375, 5.9921875, 6.2587890625, 6.525390625, 6.7919921875, 7.05859375, 7.3251953125, 7.591796875, 7.8583984375, 8.125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 3.0, 15.0, 13.0, 12.0, 20.0, 20.0, 22.0, 31.0, 51.0, 46.0, 70.0, 87.0, 150.0, 206.0, 255.0, 308.0, 494.0, 3071.0, 4186576.0, 1112.0, 484.0, 313.0, 243.0, 177.0, 140.0, 82.0, 55.0, 53.0, 41.0, 21.0, 17.0, 21.0, 13.0, 14.0, 10.0, 15.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.375, -180.767578125, -174.16015625, -167.552734375, -160.9453125, -154.337890625, -147.73046875, -141.123046875, -134.515625, -127.908203125, -121.30078125, -114.693359375, -108.0859375, -101.478515625, -94.87109375, -88.263671875, -81.65625, -75.048828125, -68.44140625, -61.833984375, -55.2265625, -48.619140625, -42.01171875, -35.404296875, -28.796875, -22.189453125, -15.58203125, -8.974609375, -2.3671875, 4.240234375, 10.84765625, 17.455078125, 24.0625, 30.669921875, 37.27734375, 43.884765625, 50.4921875, 57.099609375, 63.70703125, 70.314453125, 76.921875, 83.529296875, 90.13671875, 96.744140625, 103.3515625, 109.958984375, 116.56640625, 123.173828125, 129.78125, 136.388671875, 142.99609375, 149.603515625, 156.2109375, 162.818359375, 169.42578125, 176.033203125, 182.640625, 189.248046875, 195.85546875, 202.462890625, 209.0703125, 215.677734375, 222.28515625, 228.892578125, 235.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 11.0, 9.0, 13.0, 17.0, 28.0, 48.0, 55.0, 72.0, 109.0, 166.0, 265.0, 424.0, 676.0, 723.0, 532.0, 318.0, 231.0, 118.0, 61.0, 42.0, 47.0, 31.0, 14.0, 18.0, 12.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -18.0645751953125, -17.551025390625, -17.0374755859375, -16.52392578125, -16.0103759765625, -15.496826171875, -14.9832763671875, -14.4697265625, -13.9561767578125, -13.442626953125, -12.9290771484375, -12.41552734375, -11.9019775390625, -11.388427734375, -10.8748779296875, -10.361328125, -9.8477783203125, -9.334228515625, -8.8206787109375, -8.30712890625, -7.7935791015625, -7.280029296875, -6.7664794921875, -6.2529296875, -5.7393798828125, -5.225830078125, -4.7122802734375, -4.19873046875, -3.6851806640625, -3.171630859375, -2.6580810546875, -2.14453125, -1.6309814453125, -1.117431640625, -0.6038818359375, -0.09033203125, 0.4232177734375, 0.936767578125, 1.4503173828125, 1.9638671875, 2.4774169921875, 2.990966796875, 3.5045166015625, 4.01806640625, 4.5316162109375, 5.045166015625, 5.5587158203125, 6.072265625, 6.5858154296875, 7.099365234375, 7.6129150390625, 8.12646484375, 8.6400146484375, 9.153564453125, 9.6671142578125, 10.1806640625, 10.6942138671875, 11.207763671875, 11.7213134765625, 12.23486328125, 12.7484130859375, 13.261962890625, 13.7755126953125, 14.2890625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 7.0, 7.0, 15.0, 21.0, 23.0, 23.0, 31.0, 38.0, 33.0, 55.0, 66.0, 106.0, 282.0, 1729.0, 824935.0, 3363315.0, 2759.0, 317.0, 104.0, 71.0, 51.0, 45.0, 33.0, 21.0, 23.0, 23.0, 22.0, 13.0, 21.0, 14.0, 5.0, 8.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.5, -87.677734375, -84.85546875, -82.033203125, -79.2109375, -76.388671875, -73.56640625, -70.744140625, -67.921875, -65.099609375, -62.27734375, -59.455078125, -56.6328125, -53.810546875, -50.98828125, -48.166015625, -45.34375, -42.521484375, -39.69921875, -36.876953125, -34.0546875, -31.232421875, -28.41015625, -25.587890625, -22.765625, -19.943359375, -17.12109375, -14.298828125, -11.4765625, -8.654296875, -5.83203125, -3.009765625, -0.1875, 2.634765625, 5.45703125, 8.279296875, 11.1015625, 13.923828125, 16.74609375, 19.568359375, 22.390625, 25.212890625, 28.03515625, 30.857421875, 33.6796875, 36.501953125, 39.32421875, 42.146484375, 44.96875, 47.791015625, 50.61328125, 53.435546875, 56.2578125, 59.080078125, 61.90234375, 64.724609375, 67.546875, 70.369140625, 73.19140625, 76.013671875, 78.8359375, 81.658203125, 84.48046875, 87.302734375, 90.125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 9.0, 14.0, 29.0, 63.0, 92.0, 116.0, 157.0, 186.0, 132.0, 93.0, 74.0, 34.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.989965438842773, -17.10354232788086, -15.217117309570312, -13.330694198608398, -11.444270133972168, -9.557846069335938, -7.671422958374023, -5.784998893737793, -3.8985748291015625, -2.012151002883911, -0.12572717666625977, 1.7606964111328125, 3.647120475769043, 5.533544540405273, 7.4199676513671875, 9.306391716003418, 11.192815780639648, 13.079239845275879, 14.96566390991211, 16.852087020874023, 18.738510131835938, 20.624935150146484, 22.5113582611084, 24.397781372070312, 26.28420639038086, 28.170629501342773, 30.05705451965332, 31.943477630615234, 33.82990264892578, 35.71632385253906, 37.60274887084961, 39.489173889160156, 41.37559509277344, 43.262020111083984, 45.148441314697266, 47.03486633300781, 48.92129135131836, 50.807716369628906, 52.69413757324219, 54.580562591552734, 56.46698760986328, 58.35341262817383, 60.23983383178711, 62.126258850097656, 64.01268005371094, 65.89910888671875, 67.78553009033203, 69.67195129394531, 71.55838012695312, 73.4448013305664, 75.33123016357422, 77.2176513671875, 79.10407257080078, 80.9905014038086, 82.87692260742188, 84.76334381103516, 86.64976501464844, 88.53618621826172, 90.42261505126953, 92.30903625488281, 94.1954574584961, 96.0818862915039, 97.96830749511719, 99.85472869873047, 101.74115753173828]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 8.0, 16.0, 12.0, 17.0, 14.0, 18.0, 23.0, 27.0, 20.0, 32.0, 30.0, 26.0, 36.0, 42.0, 35.0, 39.0, 31.0, 39.0, 39.0, 35.0, 41.0, 37.0, 44.0, 31.0, 37.0, 26.0, 22.0, 22.0, 23.0, 20.0, 23.0, 19.0, 14.0, 15.0, 13.0, 13.0, 18.0, 3.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-40.918212890625, -39.644020080566406, -38.36982345581055, -37.09563064575195, -35.82143783569336, -34.5472412109375, -33.273048400878906, -31.998855590820312, -30.724660873413086, -29.45046615600586, -28.176273345947266, -26.90207862854004, -25.627883911132812, -24.35369110107422, -23.079496383666992, -21.805301666259766, -20.531108856201172, -19.256914138793945, -17.98272132873535, -16.708526611328125, -15.434332847595215, -14.160139083862305, -12.885944366455078, -11.611750602722168, -10.337556838989258, -9.063363075256348, -7.789168834686279, -6.514974594116211, -5.240780830383301, -3.9665870666503906, -2.6923928260803223, -1.418198585510254, -0.14400482177734375, 1.1301891803741455, 2.4043831825256348, 3.678577184677124, 4.952771186828613, 6.226964950561523, 7.501159191131592, 8.77535343170166, 10.04954719543457, 11.32374095916748, 12.59793472290039, 13.872129440307617, 15.146323204040527, 16.420516967773438, 17.694711685180664, 18.96890640258789, 20.243099212646484, 21.51729393005371, 22.791486740112305, 24.06568145751953, 25.339874267578125, 26.61406898498535, 27.888263702392578, 29.162456512451172, 30.4366512298584, 31.710845947265625, 32.98503875732422, 34.25923156738281, 35.53342819213867, 36.807621002197266, 38.08181381225586, 39.35601043701172, 40.63020324707031]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 6.0, 9.0, 7.0, 14.0, 16.0, 8.0, 29.0, 28.0, 27.0, 31.0, 20.0, 22.0, 36.0, 35.0, 42.0, 44.0, 41.0, 49.0, 36.0, 35.0, 41.0, 43.0, 30.0, 46.0, 35.0, 28.0, 34.0, 26.0, 31.0, 28.0, 17.0, 13.0, 10.0, 12.0, 18.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.9296875, -9.66375732421875, -9.3978271484375, -9.13189697265625, -8.865966796875, -8.60003662109375, -8.3341064453125, -8.06817626953125, -7.80224609375, -7.53631591796875, -7.2703857421875, -7.00445556640625, -6.738525390625, -6.47259521484375, -6.2066650390625, -5.94073486328125, -5.6748046875, -5.40887451171875, -5.1429443359375, -4.87701416015625, -4.611083984375, -4.34515380859375, -4.0792236328125, -3.81329345703125, -3.54736328125, -3.28143310546875, -3.0155029296875, -2.74957275390625, -2.483642578125, -2.21771240234375, -1.9517822265625, -1.68585205078125, -1.419921875, -1.15399169921875, -0.8880615234375, -0.62213134765625, -0.356201171875, -0.09027099609375, 0.1756591796875, 0.44158935546875, 0.70751953125, 0.97344970703125, 1.2393798828125, 1.50531005859375, 1.771240234375, 2.03717041015625, 2.3031005859375, 2.56903076171875, 2.8349609375, 3.10089111328125, 3.3668212890625, 3.63275146484375, 3.898681640625, 4.16461181640625, 4.4305419921875, 4.69647216796875, 4.96240234375, 5.22833251953125, 5.4942626953125, 5.76019287109375, 6.026123046875, 6.29205322265625, 6.5579833984375, 6.82391357421875, 7.08984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 19.0, 14.0, 29.0, 47.0, 55.0, 106.0, 105.0, 160.0, 242.0, 338.0, 515.0, 769.0, 1170.0, 1698.0, 2534.0, 3855.0, 5837.0, 8971.0, 13851.0, 22825.0, 37156.0, 63818.0, 120234.0, 232038.0, 237563.0, 125167.0, 65966.0, 38607.0, 23305.0, 14673.0, 9191.0, 6052.0, 3748.0, 2579.0, 1663.0, 1156.0, 767.0, 532.0, 381.0, 258.0, 169.0, 112.0, 97.0, 62.0, 32.0, 23.0, 21.0, 10.0, 8.0, 7.0, 9.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.2861328125, -1.2471923828125, -1.208251953125, -1.1693115234375, -1.13037109375, -1.0914306640625, -1.052490234375, -1.0135498046875, -0.974609375, -0.9356689453125, -0.896728515625, -0.8577880859375, -0.81884765625, -0.7799072265625, -0.740966796875, -0.7020263671875, -0.6630859375, -0.6241455078125, -0.585205078125, -0.5462646484375, -0.50732421875, -0.4683837890625, -0.429443359375, -0.3905029296875, -0.3515625, -0.3126220703125, -0.273681640625, -0.2347412109375, -0.19580078125, -0.1568603515625, -0.117919921875, -0.0789794921875, -0.0400390625, -0.0010986328125, 0.037841796875, 0.0767822265625, 0.11572265625, 0.1546630859375, 0.193603515625, 0.2325439453125, 0.271484375, 0.3104248046875, 0.349365234375, 0.3883056640625, 0.42724609375, 0.4661865234375, 0.505126953125, 0.5440673828125, 0.5830078125, 0.6219482421875, 0.660888671875, 0.6998291015625, 0.73876953125, 0.7777099609375, 0.816650390625, 0.8555908203125, 0.89453125, 0.9334716796875, 0.972412109375, 1.0113525390625, 1.05029296875, 1.0892333984375, 1.128173828125, 1.1671142578125, 1.2060546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 5.0, 8.0, 14.0, 8.0, 10.0, 13.0, 13.0, 15.0, 18.0, 19.0, 21.0, 19.0, 28.0, 23.0, 26.0, 27.0, 27.0, 34.0, 32.0, 32.0, 45.0, 52.0, 1057.0, 39.0, 34.0, 35.0, 37.0, 27.0, 31.0, 27.0, 33.0, 22.0, 22.0, 21.0, 22.0, 16.0, 14.0, 18.0, 14.0, 14.0, 11.0, 9.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 5.0], "bins": [-4.83984375, -4.69500732421875, -4.5501708984375, -4.40533447265625, -4.260498046875, -4.11566162109375, -3.9708251953125, -3.82598876953125, -3.68115234375, -3.53631591796875, -3.3914794921875, -3.24664306640625, -3.101806640625, -2.95697021484375, -2.8121337890625, -2.66729736328125, -2.5224609375, -2.37762451171875, -2.2327880859375, -2.08795166015625, -1.943115234375, -1.79827880859375, -1.6534423828125, -1.50860595703125, -1.36376953125, -1.21893310546875, -1.0740966796875, -0.92926025390625, -0.784423828125, -0.63958740234375, -0.4947509765625, -0.34991455078125, -0.205078125, -0.06024169921875, 0.0845947265625, 0.22943115234375, 0.374267578125, 0.51910400390625, 0.6639404296875, 0.80877685546875, 0.95361328125, 1.09844970703125, 1.2432861328125, 1.38812255859375, 1.532958984375, 1.67779541015625, 1.8226318359375, 1.96746826171875, 2.1123046875, 2.25714111328125, 2.4019775390625, 2.54681396484375, 2.691650390625, 2.83648681640625, 2.9813232421875, 3.12615966796875, 3.27099609375, 3.41583251953125, 3.5606689453125, 3.70550537109375, 3.850341796875, 3.99517822265625, 4.1400146484375, 4.28485107421875, 4.4296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 29.0, 27.0, 37.0, 81.0, 106.0, 151.0, 230.0, 280.0, 437.0, 559.0, 870.0, 1188.0, 1819.0, 2742.0, 4074.0, 5869.0, 8979.0, 13953.0, 21460.0, 34617.0, 55482.0, 97410.0, 180689.0, 1293192.0, 153727.0, 83459.0, 48787.0, 30271.0, 19365.0, 12322.0, 8167.0, 5441.0, 3562.0, 2450.0, 1618.0, 1092.0, 775.0, 538.0, 407.0, 271.0, 210.0, 118.0, 95.0, 56.0, 44.0, 26.0, 13.0, 9.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97265625, -0.9406280517578125, -0.908599853515625, -0.8765716552734375, -0.84454345703125, -0.8125152587890625, -0.780487060546875, -0.7484588623046875, -0.7164306640625, -0.6844024658203125, -0.652374267578125, -0.6203460693359375, -0.58831787109375, -0.5562896728515625, -0.524261474609375, -0.4922332763671875, -0.460205078125, -0.4281768798828125, -0.396148681640625, -0.3641204833984375, -0.33209228515625, -0.3000640869140625, -0.268035888671875, -0.2360076904296875, -0.2039794921875, -0.1719512939453125, -0.139923095703125, -0.1078948974609375, -0.07586669921875, -0.0438385009765625, -0.011810302734375, 0.0202178955078125, 0.05224609375, 0.0842742919921875, 0.116302490234375, 0.1483306884765625, 0.18035888671875, 0.2123870849609375, 0.244415283203125, 0.2764434814453125, 0.3084716796875, 0.3404998779296875, 0.372528076171875, 0.4045562744140625, 0.43658447265625, 0.4686126708984375, 0.500640869140625, 0.5326690673828125, 0.564697265625, 0.5967254638671875, 0.628753662109375, 0.6607818603515625, 0.69281005859375, 0.7248382568359375, 0.756866455078125, 0.7888946533203125, 0.8209228515625, 0.8529510498046875, 0.884979248046875, 0.9170074462890625, 0.94903564453125, 0.9810638427734375, 1.013092041015625, 1.0451202392578125, 1.0771484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 6.0, 9.0, 4.0, 9.0, 15.0, 24.0, 18.0, 20.0, 23.0, 29.0, 50.0, 37.0, 50.0, 69.0, 51.0, 71.0, 64.0, 57.0, 48.0, 50.0, 40.0, 60.0, 33.0, 31.0, 20.0, 21.0, 14.0, 8.0, 11.0, 6.0, 8.0, 9.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0024623870849609375, -0.0023832321166992188, -0.0023040771484375, -0.0022249221801757812, -0.0021457672119140625, -0.0020666122436523438, -0.001987457275390625, -0.0019083023071289062, -0.0018291473388671875, -0.0017499923706054688, -0.00167083740234375, -0.0015916824340820312, -0.0015125274658203125, -0.0014333724975585938, -0.001354217529296875, -0.0012750625610351562, -0.0011959075927734375, -0.0011167526245117188, -0.00103759765625, -0.0009584426879882812, -0.0008792877197265625, -0.0008001327514648438, -0.000720977783203125, -0.0006418228149414062, -0.0005626678466796875, -0.00048351287841796875, -0.00040435791015625, -0.00032520294189453125, -0.0002460479736328125, -0.00016689300537109375, -8.7738037109375e-05, -8.58306884765625e-06, 7.05718994140625e-05, 0.00014972686767578125, 0.0002288818359375, 0.00030803680419921875, 0.0003871917724609375, 0.00046634674072265625, 0.000545501708984375, 0.0006246566772460938, 0.0007038116455078125, 0.0007829666137695312, 0.00086212158203125, 0.0009412765502929688, 0.0010204315185546875, 0.0010995864868164062, 0.001178741455078125, 0.0012578964233398438, 0.0013370513916015625, 0.0014162063598632812, 0.001495361328125, 0.0015745162963867188, 0.0016536712646484375, 0.0017328262329101562, 0.001811981201171875, 0.0018911361694335938, 0.0019702911376953125, 0.0020494461059570312, 0.00212860107421875, 0.0022077560424804688, 0.0022869110107421875, 0.0023660659790039062, 0.002445220947265625, 0.0025243759155273438, 0.0026035308837890625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 1.0, 6.0, 10.0, 10.0, 15.0, 6.0, 16.0, 28.0, 24.0, 35.0, 46.0, 57.0, 97.0, 123.0, 173.0, 240.0, 408.0, 729.0, 4824.0, 999408.0, 39777.0, 978.0, 498.0, 284.0, 177.0, 146.0, 108.0, 72.0, 54.0, 53.0, 39.0, 16.0, 18.0, 11.0, 9.0, 8.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.04962158203125, -0.04810285568237305, -0.046584129333496094, -0.04506540298461914, -0.04354667663574219, -0.042027950286865234, -0.04050922393798828, -0.03899049758911133, -0.037471771240234375, -0.03595304489135742, -0.03443431854248047, -0.032915592193603516, -0.03139686584472656, -0.02987813949584961, -0.028359413146972656, -0.026840686798095703, -0.02532196044921875, -0.023803234100341797, -0.022284507751464844, -0.02076578140258789, -0.019247055053710938, -0.017728328704833984, -0.01620960235595703, -0.014690876007080078, -0.013172149658203125, -0.011653423309326172, -0.010134696960449219, -0.008615970611572266, -0.0070972442626953125, -0.005578517913818359, -0.004059791564941406, -0.002541065216064453, -0.0010223388671875, 0.0004963874816894531, 0.0020151138305664062, 0.0035338401794433594, 0.0050525665283203125, 0.006571292877197266, 0.008090019226074219, 0.009608745574951172, 0.011127471923828125, 0.012646198272705078, 0.014164924621582031, 0.015683650970458984, 0.017202377319335938, 0.01872110366821289, 0.020239830017089844, 0.021758556365966797, 0.02327728271484375, 0.024796009063720703, 0.026314735412597656, 0.02783346176147461, 0.029352188110351562, 0.030870914459228516, 0.03238964080810547, 0.03390836715698242, 0.035427093505859375, 0.03694581985473633, 0.03846454620361328, 0.039983272552490234, 0.04150199890136719, 0.04302072525024414, 0.044539451599121094, 0.04605817794799805, 0.047576904296875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 34.0, 258.0, 543.0, 169.0, 9.0, 0.0, 3.0], "bins": [-0.015030762180685997, -0.01477746944874525, -0.01452417578548193, -0.014270883053541183, -0.014017589390277863, -0.013764296658337116, -0.01351100392639637, -0.013257710263133049, -0.013004417531192303, -0.012751124799251556, -0.012497831135988235, -0.01224453840404749, -0.011991244740784168, -0.011737952008843422, -0.011484658345580101, -0.011231365613639355, -0.010978072881698608, -0.010724780149757862, -0.010471486486494541, -0.010218193754553795, -0.009964900091290474, -0.009711607359349728, -0.009458314627408981, -0.00920502096414566, -0.00895172730088234, -0.008698434568941593, -0.008445140905678272, -0.008191848173737526, -0.007938554510474205, -0.007685261778533459, -0.007431968580931425, -0.0071786753833293915, -0.006925382651388645, -0.0066720894537866116, -0.006418796256184578, -0.006165503524243832, -0.005912210326641798, -0.005658917129039764, -0.005405623931437731, -0.005152330733835697, -0.0048990375362336636, -0.00464574433863163, -0.004392451141029596, -0.004139157943427563, -0.0038858652114868164, -0.003632572013884783, -0.003379278816282749, -0.0031259856186807156, -0.0028726926539093256, -0.002619399456307292, -0.002366106491535902, -0.0021128132939338684, -0.0018595202127471566, -0.0016062271315604448, -0.0013529339339584112, -0.0010996408527716994, -0.0008463477715849876, -0.0005930546903982759, -0.00033976155100390315, -8.646841160953045e-05, 0.00016682466957718134, 0.00042011775076389313, 0.0006734109483659267, 0.0009267040295526385, 0.0011799971107393503]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 12.0, 7.0, 13.0, 18.0, 15.0, 29.0, 23.0, 19.0, 21.0, 30.0, 38.0, 32.0, 34.0, 41.0, 44.0, 35.0, 32.0, 52.0, 43.0, 47.0, 48.0, 32.0, 43.0, 36.0, 30.0, 25.0, 40.0, 24.0, 22.0, 19.0, 14.0, 15.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0015001893043518066, -0.0014580516144633293, -0.001415913924574852, -0.0013737762346863747, -0.0013316385447978973, -0.00128950085490942, -0.0012473631650209427, -0.0012052254751324654, -0.001163087785243988, -0.0011209500953555107, -0.0010788124054670334, -0.001036674715578556, -0.0009945370256900787, -0.0009523993358016014, -0.0009102616459131241, -0.0008681239560246468, -0.0008259862661361694, -0.0007838485762476921, -0.0007417108863592148, -0.0006995731964707375, -0.0006574355065822601, -0.0006152978166937828, -0.0005731601268053055, -0.0005310224369168282, -0.0004888847470283508, -0.0004467470571398735, -0.0004046093672513962, -0.00036247167736291885, -0.00032033398747444153, -0.0002781962975859642, -0.00023605860769748688, -0.00019392091780900955, -0.00015178322792053223, -0.0001096455380320549, -6.750784814357758e-05, -2.537015825510025e-05, 1.6767531633377075e-05, 5.89052215218544e-05, 0.00010104291141033173, 0.00014318060129880905, 0.00018531829118728638, 0.0002274559810757637, 0.00026959367096424103, 0.00031173136085271835, 0.0003538690507411957, 0.000396006740629673, 0.00043814443051815033, 0.00048028212040662766, 0.000522419810295105, 0.0005645575001835823, 0.0006066951900720596, 0.000648832879960537, 0.0006909705698490143, 0.0007331082597374916, 0.0007752459496259689, 0.0008173836395144463, 0.0008595213294029236, 0.0009016590192914009, 0.0009437967091798782, 0.0009859343990683556, 0.0010280720889568329, 0.0010702097788453102, 0.0011123474687337875, 0.0011544851586222649, 0.0011966228485107422]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 6.0, 9.0, 7.0, 14.0, 16.0, 8.0, 29.0, 28.0, 27.0, 31.0, 20.0, 22.0, 36.0, 35.0, 42.0, 44.0, 41.0, 49.0, 36.0, 35.0, 41.0, 43.0, 30.0, 46.0, 35.0, 28.0, 34.0, 26.0, 31.0, 28.0, 17.0, 13.0, 10.0, 12.0, 18.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.9296875, -9.66375732421875, -9.3978271484375, -9.13189697265625, -8.865966796875, -8.60003662109375, -8.3341064453125, -8.06817626953125, -7.80224609375, -7.53631591796875, -7.2703857421875, -7.00445556640625, -6.738525390625, -6.47259521484375, -6.2066650390625, -5.94073486328125, -5.6748046875, -5.40887451171875, -5.1429443359375, -4.87701416015625, -4.611083984375, -4.34515380859375, -4.0792236328125, -3.81329345703125, -3.54736328125, -3.28143310546875, -3.0155029296875, -2.74957275390625, -2.483642578125, -2.21771240234375, -1.9517822265625, -1.68585205078125, -1.419921875, -1.15399169921875, -0.8880615234375, -0.62213134765625, -0.356201171875, -0.09027099609375, 0.1756591796875, 0.44158935546875, 0.70751953125, 0.97344970703125, 1.2393798828125, 1.50531005859375, 1.771240234375, 2.03717041015625, 2.3031005859375, 2.56903076171875, 2.8349609375, 3.10089111328125, 3.3668212890625, 3.63275146484375, 3.898681640625, 4.16461181640625, 4.4305419921875, 4.69647216796875, 4.96240234375, 5.22833251953125, 5.4942626953125, 5.76019287109375, 6.026123046875, 6.29205322265625, 6.5579833984375, 6.82391357421875, 7.08984375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 15.0, 10.0, 30.0, 40.0, 47.0, 56.0, 83.0, 115.0, 153.0, 203.0, 285.0, 362.0, 415.0, 585.0, 822.0, 996.0, 1602.0, 3100.0, 8499.0, 38525.0, 213550.0, 565462.0, 167967.0, 30173.0, 7128.0, 2723.0, 1479.0, 981.0, 742.0, 563.0, 440.0, 348.0, 272.0, 192.0, 145.0, 120.0, 86.0, 53.0, 40.0, 37.0, 29.0, 19.0, 9.0, 11.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.203125, -13.76513671875, -13.3271484375, -12.88916015625, -12.451171875, -12.01318359375, -11.5751953125, -11.13720703125, -10.69921875, -10.26123046875, -9.8232421875, -9.38525390625, -8.947265625, -8.50927734375, -8.0712890625, -7.63330078125, -7.1953125, -6.75732421875, -6.3193359375, -5.88134765625, -5.443359375, -5.00537109375, -4.5673828125, -4.12939453125, -3.69140625, -3.25341796875, -2.8154296875, -2.37744140625, -1.939453125, -1.50146484375, -1.0634765625, -0.62548828125, -0.1875, 0.25048828125, 0.6884765625, 1.12646484375, 1.564453125, 2.00244140625, 2.4404296875, 2.87841796875, 3.31640625, 3.75439453125, 4.1923828125, 4.63037109375, 5.068359375, 5.50634765625, 5.9443359375, 6.38232421875, 6.8203125, 7.25830078125, 7.6962890625, 8.13427734375, 8.572265625, 9.01025390625, 9.4482421875, 9.88623046875, 10.32421875, 10.76220703125, 11.2001953125, 11.63818359375, 12.076171875, 12.51416015625, 12.9521484375, 13.39013671875, 13.828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 7.0, 6.0, 4.0, 7.0, 8.0, 7.0, 11.0, 17.0, 15.0, 17.0, 19.0, 19.0, 37.0, 32.0, 32.0, 34.0, 40.0, 53.0, 90.0, 126.0, 315.0, 1472.0, 161.0, 96.0, 58.0, 56.0, 37.0, 37.0, 35.0, 27.0, 20.0, 19.0, 24.0, 19.0, 14.0, 12.0, 7.0, 11.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.625, -19.984375, -19.34375, -18.703125, -18.0625, -17.421875, -16.78125, -16.140625, -15.5, -14.859375, -14.21875, -13.578125, -12.9375, -12.296875, -11.65625, -11.015625, -10.375, -9.734375, -9.09375, -8.453125, -7.8125, -7.171875, -6.53125, -5.890625, -5.25, -4.609375, -3.96875, -3.328125, -2.6875, -2.046875, -1.40625, -0.765625, -0.125, 0.515625, 1.15625, 1.796875, 2.4375, 3.078125, 3.71875, 4.359375, 5.0, 5.640625, 6.28125, 6.921875, 7.5625, 8.203125, 8.84375, 9.484375, 10.125, 10.765625, 11.40625, 12.046875, 12.6875, 13.328125, 13.96875, 14.609375, 15.25, 15.890625, 16.53125, 17.171875, 17.8125, 18.453125, 19.09375, 19.734375, 20.375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 7.0, 9.0, 9.0, 7.0, 18.0, 17.0, 30.0, 37.0, 46.0, 69.0, 94.0, 131.0, 211.0, 361.0, 670.0, 2060.0, 2540297.0, 598117.0, 1849.0, 660.0, 341.0, 188.0, 110.0, 91.0, 68.0, 51.0, 27.0, 28.0, 16.0, 17.0, 13.0, 6.0, 2.0, 5.0, 3.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.9052734375, -65.560546875, -63.2158203125, -60.87109375, -58.5263671875, -56.181640625, -53.8369140625, -51.4921875, -49.1474609375, -46.802734375, -44.4580078125, -42.11328125, -39.7685546875, -37.423828125, -35.0791015625, -32.734375, -30.3896484375, -28.044921875, -25.7001953125, -23.35546875, -21.0107421875, -18.666015625, -16.3212890625, -13.9765625, -11.6318359375, -9.287109375, -6.9423828125, -4.59765625, -2.2529296875, 0.091796875, 2.4365234375, 4.78125, 7.1259765625, 9.470703125, 11.8154296875, 14.16015625, 16.5048828125, 18.849609375, 21.1943359375, 23.5390625, 25.8837890625, 28.228515625, 30.5732421875, 32.91796875, 35.2626953125, 37.607421875, 39.9521484375, 42.296875, 44.6416015625, 46.986328125, 49.3310546875, 51.67578125, 54.0205078125, 56.365234375, 58.7099609375, 61.0546875, 63.3994140625, 65.744140625, 68.0888671875, 70.43359375, 72.7783203125, 75.123046875, 77.4677734375, 79.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 104.0, 611.0, 272.0, 24.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.70269775390625, -81.51537322998047, -76.32804870605469, -71.14073181152344, -65.95340728759766, -60.766082763671875, -55.578758239746094, -50.39143753051758, -45.2041130065918, -40.016788482666016, -34.8294677734375, -29.64214324951172, -24.45482063293457, -19.267498016357422, -14.08017349243164, -8.892852783203125, -3.7055282592773438, 1.481794834136963, 6.6691179275512695, 11.856441497802734, 17.043764114379883, 22.23108673095703, 27.418411254882812, 32.60573196411133, 37.79305648803711, 42.98038101196289, 48.167701721191406, 53.35502624511719, 58.54235076904297, 63.729671478271484, 68.9169921875, 74.10431671142578, 79.29164123535156, 84.47896575927734, 89.66629028320312, 94.85360717773438, 100.04093170166016, 105.22825622558594, 110.41558074951172, 115.6029052734375, 120.79022216796875, 125.97754669189453, 131.1648712158203, 136.35218811035156, 141.53952026367188, 146.72683715820312, 151.91415405273438, 157.1014862060547, 162.288818359375, 167.47613525390625, 172.66346740722656, 177.8507843017578, 183.03811645507812, 188.22543334960938, 193.41275024414062, 198.60008239746094, 203.7873992919922, 208.97471618652344, 214.16204833984375, 219.349365234375, 224.5366973876953, 229.72401428222656, 234.91134643554688, 240.09866333007812, 245.28598022460938]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 12.0, 10.0, 10.0, 10.0, 13.0, 13.0, 23.0, 23.0, 22.0, 27.0, 32.0, 33.0, 44.0, 43.0, 39.0, 30.0, 37.0, 34.0, 46.0, 54.0, 46.0, 36.0, 37.0, 42.0, 38.0, 30.0, 27.0, 24.0, 25.0, 24.0, 16.0, 26.0, 13.0, 13.0, 16.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-70.62963104248047, -68.70393371582031, -66.77824401855469, -64.85254669189453, -62.92685317993164, -61.00115966796875, -59.07546615600586, -57.14977264404297, -55.22407531738281, -53.29838180541992, -51.37268829345703, -49.446990966796875, -47.521297454833984, -45.595603942871094, -43.6699104309082, -41.74421691894531, -39.81852340698242, -37.89282989501953, -35.96713638305664, -34.04144287109375, -32.115745544433594, -30.190052032470703, -28.264358520507812, -26.338665008544922, -24.4129695892334, -22.487276077270508, -20.561580657958984, -18.635887145996094, -16.710193634033203, -14.78449821472168, -12.858804702758789, -10.933110237121582, -9.007415771484375, -7.081721305847168, -5.156027317047119, -3.2303333282470703, -1.3046388626098633, 0.6210556030273438, 2.5467491149902344, 4.472443580627441, 6.398138046264648, 8.323832511901855, 10.249526977539062, 12.175220489501953, 14.10091495513916, 16.026609420776367, 17.952302932739258, 19.87799835205078, 21.803691864013672, 23.729385375976562, 25.655080795288086, 27.580774307250977, 29.5064697265625, 31.43216323852539, 33.35785675048828, 35.28355026245117, 37.20924377441406, 39.13493728637695, 41.060630798339844, 42.986328125, 44.91202163696289, 46.83771514892578, 48.76340866088867, 50.68910217285156, 52.61479949951172]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 4.0, 12.0, 14.0, 14.0, 11.0, 13.0, 15.0, 11.0, 20.0, 22.0, 29.0, 27.0, 34.0, 27.0, 27.0, 41.0, 42.0, 37.0, 49.0, 36.0, 41.0, 43.0, 39.0, 34.0, 30.0, 26.0, 28.0, 22.0, 36.0, 31.0, 19.0, 16.0, 25.0, 25.0, 14.0, 15.0, 9.0, 13.0, 9.0, 2.0, 5.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-8.734375, -8.4910888671875, -8.247802734375, -8.0045166015625, -7.76123046875, -7.5179443359375, -7.274658203125, -7.0313720703125, -6.7880859375, -6.5447998046875, -6.301513671875, -6.0582275390625, -5.81494140625, -5.5716552734375, -5.328369140625, -5.0850830078125, -4.841796875, -4.5985107421875, -4.355224609375, -4.1119384765625, -3.86865234375, -3.6253662109375, -3.382080078125, -3.1387939453125, -2.8955078125, -2.6522216796875, -2.408935546875, -2.1656494140625, -1.92236328125, -1.6790771484375, -1.435791015625, -1.1925048828125, -0.94921875, -0.7059326171875, -0.462646484375, -0.2193603515625, 0.02392578125, 0.2672119140625, 0.510498046875, 0.7537841796875, 0.9970703125, 1.2403564453125, 1.483642578125, 1.7269287109375, 1.97021484375, 2.2135009765625, 2.456787109375, 2.7000732421875, 2.943359375, 3.1866455078125, 3.429931640625, 3.6732177734375, 3.91650390625, 4.1597900390625, 4.403076171875, 4.6463623046875, 4.8896484375, 5.1329345703125, 5.376220703125, 5.6195068359375, 5.86279296875, 6.1060791015625, 6.349365234375, 6.5926513671875, 6.8359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 5.0, 5.0, 16.0, 25.0, 18.0, 23.0, 36.0, 42.0, 41.0, 55.0, 73.0, 103.0, 135.0, 203.0, 350.0, 629.0, 1620.0, 4959.0, 25966.0, 442687.0, 2952451.0, 715213.0, 39665.0, 6184.0, 1795.0, 768.0, 395.0, 225.0, 140.0, 107.0, 63.0, 71.0, 38.0, 45.0, 22.0, 24.0, 14.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.489990234375, -18.80810546875, -18.126220703125, -17.4443359375, -16.762451171875, -16.08056640625, -15.398681640625, -14.716796875, -14.034912109375, -13.35302734375, -12.671142578125, -11.9892578125, -11.307373046875, -10.62548828125, -9.943603515625, -9.26171875, -8.579833984375, -7.89794921875, -7.216064453125, -6.5341796875, -5.852294921875, -5.17041015625, -4.488525390625, -3.806640625, -3.124755859375, -2.44287109375, -1.760986328125, -1.0791015625, -0.397216796875, 0.28466796875, 0.966552734375, 1.6484375, 2.330322265625, 3.01220703125, 3.694091796875, 4.3759765625, 5.057861328125, 5.73974609375, 6.421630859375, 7.103515625, 7.785400390625, 8.46728515625, 9.149169921875, 9.8310546875, 10.512939453125, 11.19482421875, 11.876708984375, 12.55859375, 13.240478515625, 13.92236328125, 14.604248046875, 15.2861328125, 15.968017578125, 16.64990234375, 17.331787109375, 18.013671875, 18.695556640625, 19.37744140625, 20.059326171875, 20.7412109375, 21.423095703125, 22.10498046875, 22.786865234375, 23.46875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 14.0, 13.0, 16.0, 36.0, 34.0, 50.0, 71.0, 85.0, 103.0, 145.0, 195.0, 292.0, 424.0, 548.0, 553.0, 391.0, 271.0, 207.0, 186.0, 111.0, 81.0, 69.0, 52.0, 28.0, 27.0, 21.0, 16.0, 12.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.59375, -18.1181640625, -17.642578125, -17.1669921875, -16.69140625, -16.2158203125, -15.740234375, -15.2646484375, -14.7890625, -14.3134765625, -13.837890625, -13.3623046875, -12.88671875, -12.4111328125, -11.935546875, -11.4599609375, -10.984375, -10.5087890625, -10.033203125, -9.5576171875, -9.08203125, -8.6064453125, -8.130859375, -7.6552734375, -7.1796875, -6.7041015625, -6.228515625, -5.7529296875, -5.27734375, -4.8017578125, -4.326171875, -3.8505859375, -3.375, -2.8994140625, -2.423828125, -1.9482421875, -1.47265625, -0.9970703125, -0.521484375, -0.0458984375, 0.4296875, 0.9052734375, 1.380859375, 1.8564453125, 2.33203125, 2.8076171875, 3.283203125, 3.7587890625, 4.234375, 4.7099609375, 5.185546875, 5.6611328125, 6.13671875, 6.6123046875, 7.087890625, 7.5634765625, 8.0390625, 8.5146484375, 8.990234375, 9.4658203125, 9.94140625, 10.4169921875, 10.892578125, 11.3681640625, 11.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 11.0, 13.0, 22.0, 28.0, 45.0, 79.0, 146.0, 299.0, 751.0, 2681.0, 45325.0, 3944409.0, 194252.0, 4319.0, 1056.0, 390.0, 193.0, 86.0, 67.0, 28.0, 27.0, 23.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.84375, -60.2431640625, -58.642578125, -57.0419921875, -55.44140625, -53.8408203125, -52.240234375, -50.6396484375, -49.0390625, -47.4384765625, -45.837890625, -44.2373046875, -42.63671875, -41.0361328125, -39.435546875, -37.8349609375, -36.234375, -34.6337890625, -33.033203125, -31.4326171875, -29.83203125, -28.2314453125, -26.630859375, -25.0302734375, -23.4296875, -21.8291015625, -20.228515625, -18.6279296875, -17.02734375, -15.4267578125, -13.826171875, -12.2255859375, -10.625, -9.0244140625, -7.423828125, -5.8232421875, -4.22265625, -2.6220703125, -1.021484375, 0.5791015625, 2.1796875, 3.7802734375, 5.380859375, 6.9814453125, 8.58203125, 10.1826171875, 11.783203125, 13.3837890625, 14.984375, 16.5849609375, 18.185546875, 19.7861328125, 21.38671875, 22.9873046875, 24.587890625, 26.1884765625, 27.7890625, 29.3896484375, 30.990234375, 32.5908203125, 34.19140625, 35.7919921875, 37.392578125, 38.9931640625, 40.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 66.0, 928.0, 22.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.44949340820312, -234.90330505371094, -214.3571014404297, -193.8109130859375, -173.26470947265625, -152.71852111816406, -132.17233276367188, -111.62612915039062, -91.07994079589844, -70.53374481201172, -49.987552642822266, -29.441360473632812, -8.895164489746094, 11.651031494140625, 32.19721984863281, 52.74342346191406, 73.28961181640625, 93.83580780029297, 114.38200378417969, 134.92819213867188, 155.47439575195312, 176.0205841064453, 196.5667724609375, 217.11297607421875, 237.65916442871094, 258.2053527832031, 278.7515563964844, 299.2977294921875, 319.84393310546875, 340.39013671875, 360.93634033203125, 381.4825439453125, 402.02874755859375, 422.574951171875, 443.1211242675781, 463.6673278808594, 484.2135314941406, 504.75970458984375, 525.305908203125, 545.8521118164062, 566.3983154296875, 586.9445190429688, 607.49072265625, 628.036865234375, 648.5830688476562, 669.1292724609375, 689.6754760742188, 710.2216796875, 730.767822265625, 751.3140258789062, 771.8602294921875, 792.4063720703125, 812.9525756835938, 833.498779296875, 854.0449829101562, 874.5911865234375, 895.1373901367188, 915.68359375, 936.2297973632812, 956.7760009765625, 977.3221435546875, 997.8683471679688, 1018.41455078125, 1038.960693359375, 1059.5069580078125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 4.0, 12.0, 18.0, 14.0, 17.0, 22.0, 22.0, 23.0, 37.0, 31.0, 32.0, 40.0, 46.0, 47.0, 30.0, 51.0, 44.0, 40.0, 49.0, 48.0, 29.0, 40.0, 37.0, 28.0, 35.0, 26.0, 29.0, 18.0, 20.0, 25.0, 12.0, 11.0, 10.0, 13.0, 9.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.12510681152344, -52.422367095947266, -50.71963119506836, -49.01689147949219, -47.314151763916016, -45.611412048339844, -43.90867614746094, -42.205936431884766, -40.503196716308594, -38.80045700073242, -37.097721099853516, -35.394981384277344, -33.69224166870117, -31.989503860473633, -30.286766052246094, -28.584026336669922, -26.881290435791016, -25.178552627563477, -23.475812911987305, -21.773075103759766, -20.070335388183594, -18.367597579956055, -16.664859771728516, -14.96212100982666, -13.259382247924805, -11.55664348602295, -9.853904724121094, -8.151166915893555, -6.448428153991699, -4.745689392089844, -3.0429515838623047, -1.3402128219604492, 0.36252593994140625, 2.0652644634246826, 3.768002986907959, 5.470741271972656, 7.173480033874512, 8.876218795776367, 10.578956604003906, 12.281695365905762, 13.984434127807617, 15.687172889709473, 17.389911651611328, 19.092649459838867, 20.795387268066406, 22.498126983642578, 24.200864791870117, 25.903602600097656, 27.606342315673828, 29.309080123901367, 31.01181983947754, 32.71455764770508, 34.41729736328125, 36.120033264160156, 37.82277297973633, 39.5255126953125, 41.228248596191406, 42.93098831176758, 44.633724212646484, 46.336463928222656, 48.03920364379883, 49.741943359375, 51.444679260253906, 53.14741897583008, 54.85015869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 7.0, 6.0, 16.0, 19.0, 10.0, 19.0, 18.0, 23.0, 31.0, 31.0, 37.0, 25.0, 30.0, 35.0, 25.0, 43.0, 38.0, 39.0, 34.0, 38.0, 34.0, 35.0, 32.0, 38.0, 28.0, 24.0, 30.0, 34.0, 28.0, 27.0, 26.0, 17.0, 15.0, 13.0, 6.0, 10.0, 11.0, 11.0, 3.0, 8.0, 2.0, 0.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.0947265625, -5.900390625, -5.7060546875, -5.51171875, -5.3173828125, -5.123046875, -4.9287109375, -4.734375, -4.5400390625, -4.345703125, -4.1513671875, -3.95703125, -3.7626953125, -3.568359375, -3.3740234375, -3.1796875, -2.9853515625, -2.791015625, -2.5966796875, -2.40234375, -2.2080078125, -2.013671875, -1.8193359375, -1.625, -1.4306640625, -1.236328125, -1.0419921875, -0.84765625, -0.6533203125, -0.458984375, -0.2646484375, -0.0703125, 0.1240234375, 0.318359375, 0.5126953125, 0.70703125, 0.9013671875, 1.095703125, 1.2900390625, 1.484375, 1.6787109375, 1.873046875, 2.0673828125, 2.26171875, 2.4560546875, 2.650390625, 2.8447265625, 3.0390625, 3.2333984375, 3.427734375, 3.6220703125, 3.81640625, 4.0107421875, 4.205078125, 4.3994140625, 4.59375, 4.7880859375, 4.982421875, 5.1767578125, 5.37109375, 5.5654296875, 5.759765625, 5.9541015625, 6.1484375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 7.0, 13.0, 13.0, 13.0, 30.0, 40.0, 58.0, 96.0, 97.0, 172.0, 257.0, 355.0, 540.0, 839.0, 1230.0, 1794.0, 2704.0, 4144.0, 6283.0, 9665.0, 14809.0, 24173.0, 40022.0, 72024.0, 135111.0, 241710.0, 217100.0, 116577.0, 62148.0, 35808.0, 21592.0, 13486.0, 8656.0, 5741.0, 3668.0, 2500.0, 1607.0, 1095.0, 733.0, 515.0, 346.0, 227.0, 157.0, 127.0, 86.0, 59.0, 33.0, 27.0, 18.0, 16.0, 8.0, 9.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.99169921875, -0.962432861328125, -0.93316650390625, -0.903900146484375, -0.8746337890625, -0.845367431640625, -0.81610107421875, -0.786834716796875, -0.757568359375, -0.728302001953125, -0.69903564453125, -0.669769287109375, -0.6405029296875, -0.611236572265625, -0.58197021484375, -0.552703857421875, -0.5234375, -0.494171142578125, -0.46490478515625, -0.435638427734375, -0.4063720703125, -0.377105712890625, -0.34783935546875, -0.318572998046875, -0.289306640625, -0.260040283203125, -0.23077392578125, -0.201507568359375, -0.1722412109375, -0.142974853515625, -0.11370849609375, -0.084442138671875, -0.05517578125, -0.025909423828125, 0.00335693359375, 0.032623291015625, 0.0618896484375, 0.091156005859375, 0.12042236328125, 0.149688720703125, 0.178955078125, 0.208221435546875, 0.23748779296875, 0.266754150390625, 0.2960205078125, 0.325286865234375, 0.35455322265625, 0.383819580078125, 0.4130859375, 0.442352294921875, 0.47161865234375, 0.500885009765625, 0.5301513671875, 0.559417724609375, 0.58868408203125, 0.617950439453125, 0.647216796875, 0.676483154296875, 0.70574951171875, 0.735015869140625, 0.7642822265625, 0.793548583984375, 0.82281494140625, 0.852081298828125, 0.88134765625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 8.0, 20.0, 21.0, 28.0, 24.0, 26.0, 29.0, 31.0, 42.0, 50.0, 45.0, 41.0, 51.0, 36.0, 1076.0, 51.0, 47.0, 49.0, 34.0, 44.0, 34.0, 30.0, 28.0, 31.0, 30.0, 28.0, 12.0, 16.0, 11.0, 11.0, 3.0, 6.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.057861328125, -4.89306640625, -4.728271484375, -4.5634765625, -4.398681640625, -4.23388671875, -4.069091796875, -3.904296875, -3.739501953125, -3.57470703125, -3.409912109375, -3.2451171875, -3.080322265625, -2.91552734375, -2.750732421875, -2.5859375, -2.421142578125, -2.25634765625, -2.091552734375, -1.9267578125, -1.761962890625, -1.59716796875, -1.432373046875, -1.267578125, -1.102783203125, -0.93798828125, -0.773193359375, -0.6083984375, -0.443603515625, -0.27880859375, -0.114013671875, 0.05078125, 0.215576171875, 0.38037109375, 0.545166015625, 0.7099609375, 0.874755859375, 1.03955078125, 1.204345703125, 1.369140625, 1.533935546875, 1.69873046875, 1.863525390625, 2.0283203125, 2.193115234375, 2.35791015625, 2.522705078125, 2.6875, 2.852294921875, 3.01708984375, 3.181884765625, 3.3466796875, 3.511474609375, 3.67626953125, 3.841064453125, 4.005859375, 4.170654296875, 4.33544921875, 4.500244140625, 4.6650390625, 4.829833984375, 4.99462890625, 5.159423828125, 5.32421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 9.0, 13.0, 24.0, 32.0, 49.0, 65.0, 114.0, 166.0, 230.0, 368.0, 530.0, 848.0, 1229.0, 1824.0, 2943.0, 4540.0, 7182.0, 11775.0, 19017.0, 31536.0, 53413.0, 96875.0, 192010.0, 1316835.0, 157571.0, 80839.0, 45822.0, 27084.0, 16408.0, 9932.0, 6278.0, 3993.0, 2621.0, 1668.0, 1077.0, 744.0, 471.0, 352.0, 216.0, 136.0, 94.0, 72.0, 39.0, 30.0, 12.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.96240234375, -0.9335479736328125, -0.904693603515625, -0.8758392333984375, -0.84698486328125, -0.8181304931640625, -0.789276123046875, -0.7604217529296875, -0.7315673828125, -0.7027130126953125, -0.673858642578125, -0.6450042724609375, -0.61614990234375, -0.5872955322265625, -0.558441162109375, -0.5295867919921875, -0.500732421875, -0.4718780517578125, -0.443023681640625, -0.4141693115234375, -0.38531494140625, -0.3564605712890625, -0.327606201171875, -0.2987518310546875, -0.2698974609375, -0.2410430908203125, -0.212188720703125, -0.1833343505859375, -0.15447998046875, -0.1256256103515625, -0.096771240234375, -0.0679168701171875, -0.0390625, -0.0102081298828125, 0.018646240234375, 0.0475006103515625, 0.07635498046875, 0.1052093505859375, 0.134063720703125, 0.1629180908203125, 0.1917724609375, 0.2206268310546875, 0.249481201171875, 0.2783355712890625, 0.30718994140625, 0.3360443115234375, 0.364898681640625, 0.3937530517578125, 0.422607421875, 0.4514617919921875, 0.480316162109375, 0.5091705322265625, 0.53802490234375, 0.5668792724609375, 0.595733642578125, 0.6245880126953125, 0.6534423828125, 0.6822967529296875, 0.711151123046875, 0.7400054931640625, 0.76885986328125, 0.7977142333984375, 0.826568603515625, 0.8554229736328125, 0.88427734375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 3.0, 8.0, 8.0, 11.0, 10.0, 16.0, 25.0, 18.0, 27.0, 22.0, 29.0, 32.0, 54.0, 51.0, 53.0, 55.0, 43.0, 55.0, 58.0, 54.0, 44.0, 39.0, 36.0, 35.0, 27.0, 22.0, 21.0, 20.0, 19.0, 21.0, 14.0, 9.0, 9.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0017480850219726562, -0.0016879290342330933, -0.0016277730464935303, -0.0015676170587539673, -0.0015074610710144043, -0.0014473050832748413, -0.0013871490955352783, -0.0013269931077957153, -0.0012668371200561523, -0.0012066811323165894, -0.0011465251445770264, -0.0010863691568374634, -0.0010262131690979004, -0.0009660571813583374, -0.0009059011936187744, -0.0008457452058792114, -0.0007855892181396484, -0.0007254332304000854, -0.0006652772426605225, -0.0006051212549209595, -0.0005449652671813965, -0.0004848092794418335, -0.0004246532917022705, -0.0003644973039627075, -0.00030434131622314453, -0.00024418532848358154, -0.00018402934074401855, -0.00012387335300445557, -6.371736526489258e-05, -3.56137752532959e-06, 5.65946102142334e-05, 0.00011675059795379639, 0.00017690658569335938, 0.00023706257343292236, 0.00029721856117248535, 0.00035737454891204834, 0.00041753053665161133, 0.0004776865243911743, 0.0005378425121307373, 0.0005979984998703003, 0.0006581544876098633, 0.0007183104753494263, 0.0007784664630889893, 0.0008386224508285522, 0.0008987784385681152, 0.0009589344263076782, 0.0010190904140472412, 0.0010792464017868042, 0.0011394023895263672, 0.0011995583772659302, 0.0012597143650054932, 0.0013198703527450562, 0.0013800263404846191, 0.0014401823282241821, 0.0015003383159637451, 0.001560494303703308, 0.001620650291442871, 0.001680806279182434, 0.001740962266921997, 0.00180111825466156, 0.001861274242401123, 0.001921430230140686, 0.001981586217880249, 0.002041742205619812, 0.002101898193359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 8.0, 4.0, 5.0, 13.0, 14.0, 12.0, 17.0, 25.0, 35.0, 42.0, 67.0, 68.0, 93.0, 132.0, 139.0, 277.0, 393.0, 699.0, 2378.0, 932495.0, 108628.0, 1244.0, 553.0, 352.0, 217.0, 150.0, 113.0, 83.0, 72.0, 42.0, 30.0, 29.0, 22.0, 15.0, 11.0, 11.0, 13.0, 10.0, 9.0, 2.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044708251953125, -0.04345989227294922, -0.04221153259277344, -0.040963172912597656, -0.039714813232421875, -0.038466453552246094, -0.03721809387207031, -0.03596973419189453, -0.03472137451171875, -0.03347301483154297, -0.03222465515136719, -0.030976295471191406, -0.029727935791015625, -0.028479576110839844, -0.027231216430664062, -0.02598285675048828, -0.0247344970703125, -0.02348613739013672, -0.022237777709960938, -0.020989418029785156, -0.019741058349609375, -0.018492698669433594, -0.017244338989257812, -0.01599597930908203, -0.01474761962890625, -0.013499259948730469, -0.012250900268554688, -0.011002540588378906, -0.009754180908203125, -0.008505821228027344, -0.0072574615478515625, -0.006009101867675781, -0.0047607421875, -0.0035123825073242188, -0.0022640228271484375, -0.0010156631469726562, 0.000232696533203125, 0.0014810562133789062, 0.0027294158935546875, 0.003977775573730469, 0.00522613525390625, 0.006474494934082031, 0.0077228546142578125, 0.008971214294433594, 0.010219573974609375, 0.011467933654785156, 0.012716293334960938, 0.013964653015136719, 0.0152130126953125, 0.01646137237548828, 0.017709732055664062, 0.018958091735839844, 0.020206451416015625, 0.021454811096191406, 0.022703170776367188, 0.02395153045654297, 0.02519989013671875, 0.02644824981689453, 0.027696609497070312, 0.028944969177246094, 0.030193328857421875, 0.031441688537597656, 0.03269004821777344, 0.03393840789794922, 0.035186767578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 38.0, 577.0, 383.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011961775831878185, -0.01168915443122387, -0.011416533961892128, -0.011143912561237812, -0.01087129209190607, -0.010598670691251755, -0.010326050221920013, -0.010053428821265697, -0.009780808351933956, -0.00950818695127964, -0.009235566481947899, -0.008962945081293583, -0.008690324611961842, -0.008417703211307526, -0.008145082741975784, -0.007872461341321468, -0.00759984040632844, -0.007327219471335411, -0.007054598536342382, -0.006781977601349354, -0.006509356666356325, -0.0062367357313632965, -0.0059641143307089806, -0.005691493861377239, -0.005418872460722923, -0.005146251525729895, -0.004873630590736866, -0.004601009655743837, -0.004328388720750809, -0.00405576778575778, -0.0037831466179341078, -0.003510525682941079, -0.003237904980778694, -0.0029652840457856655, -0.002692663110792637, -0.0024200421757996082, -0.0021474212408065796, -0.0018748001893982291, -0.0016021791379898787, -0.00132955820299685, -0.0010569372680038214, -0.0007843163330107927, -0.0005116953398101032, -0.00023907434660941362, 3.354658838361502e-05, 0.00030616752337664366, 0.0005787885747849941, 0.0008514095097780228, 0.0011240304447710514, 0.00139665137976408, 0.0016692723147571087, 0.0019418933661654592, 0.002214514184743166, 0.0024871351197361946, 0.002759756287559867, 0.0030323772225528955, 0.003304998157545924, 0.003577619092538953, 0.0038502400275319815, 0.004122861195355654, 0.004395482130348682, 0.004668103065341711, 0.00494072400033474, 0.005213344935327768, 0.005485965870320797]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 8.0, 1.0, 8.0, 6.0, 8.0, 9.0, 16.0, 16.0, 22.0, 16.0, 26.0, 26.0, 37.0, 31.0, 33.0, 35.0, 29.0, 41.0, 29.0, 35.0, 43.0, 47.0, 55.0, 42.0, 39.0, 48.0, 21.0, 49.0, 28.0, 25.0, 27.0, 22.0, 26.0, 19.0, 14.0, 10.0, 18.0, 7.0, 8.0, 13.0, 10.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009658932685852051, -0.0009272890165448189, -0.0008886847645044327, -0.0008500805124640465, -0.0008114762604236603, -0.0007728720083832741, -0.0007342677563428879, -0.0006956635043025017, -0.0006570592522621155, -0.0006184550002217293, -0.0005798507481813431, -0.0005412464961409569, -0.0005026422441005707, -0.0004640379920601845, -0.0004254337400197983, -0.0003868294879794121, -0.0003482252359390259, -0.0003096209838986397, -0.0002710167318582535, -0.00023241247981786728, -0.00019380822777748108, -0.00015520397573709488, -0.00011659972369670868, -7.799547165632248e-05, -3.939121961593628e-05, -7.869675755500793e-07, 3.781728446483612e-05, 7.642153650522232e-05, 0.00011502578854560852, 0.00015363004058599472, 0.00019223429262638092, 0.00023083854466676712, 0.0002694427967071533, 0.0003080470487475395, 0.0003466513007879257, 0.0003852555528283119, 0.0004238598048686981, 0.0004624640569090843, 0.0005010683089494705, 0.0005396725609898567, 0.0005782768130302429, 0.0006168810650706291, 0.0006554853171110153, 0.0006940895691514015, 0.0007326938211917877, 0.0007712980732321739, 0.0008099023252725601, 0.0008485065773129463, 0.0008871108293533325, 0.0009257150813937187, 0.0009643193334341049, 0.0010029235854744911, 0.0010415278375148773, 0.0010801320895552635, 0.0011187363415956497, 0.001157340593636036, 0.0011959448456764221, 0.0012345490977168083, 0.0012731533497571945, 0.0013117576017975807, 0.001350361853837967, 0.0013889661058783531, 0.0014275703579187393, 0.0014661746099591255, 0.0015047788619995117]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 7.0, 6.0, 16.0, 19.0, 10.0, 19.0, 18.0, 23.0, 31.0, 31.0, 37.0, 25.0, 30.0, 35.0, 25.0, 43.0, 38.0, 39.0, 34.0, 38.0, 34.0, 35.0, 32.0, 38.0, 28.0, 24.0, 30.0, 34.0, 28.0, 27.0, 26.0, 17.0, 15.0, 13.0, 6.0, 10.0, 11.0, 11.0, 3.0, 7.0, 3.0, 0.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.0947265625, -5.900390625, -5.7060546875, -5.51171875, -5.3173828125, -5.123046875, -4.9287109375, -4.734375, -4.5400390625, -4.345703125, -4.1513671875, -3.95703125, -3.7626953125, -3.568359375, -3.3740234375, -3.1796875, -2.9853515625, -2.791015625, -2.5966796875, -2.40234375, -2.2080078125, -2.013671875, -1.8193359375, -1.625, -1.4306640625, -1.236328125, -1.0419921875, -0.84765625, -0.6533203125, -0.458984375, -0.2646484375, -0.0703125, 0.1240234375, 0.318359375, 0.5126953125, 0.70703125, 0.9013671875, 1.095703125, 1.2900390625, 1.484375, 1.6787109375, 1.873046875, 2.0673828125, 2.26171875, 2.4560546875, 2.650390625, 2.8447265625, 3.0390625, 3.2333984375, 3.427734375, 3.6220703125, 3.81640625, 4.0107421875, 4.205078125, 4.3994140625, 4.59375, 4.7880859375, 4.982421875, 5.1767578125, 5.37109375, 5.5654296875, 5.759765625, 5.9541015625, 6.1484375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 9.0, 4.0, 17.0, 21.0, 30.0, 38.0, 51.0, 81.0, 102.0, 105.0, 163.0, 233.0, 307.0, 423.0, 666.0, 868.0, 1246.0, 1838.0, 2869.0, 6120.0, 21018.0, 156219.0, 681606.0, 139995.0, 19743.0, 5770.0, 2902.0, 1892.0, 1132.0, 828.0, 612.0, 450.0, 324.0, 219.0, 189.0, 128.0, 95.0, 75.0, 36.0, 22.0, 19.0, 28.0, 15.0, 17.0, 8.0, 8.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-15.984375, -15.4921875, -15.0, -14.5078125, -14.015625, -13.5234375, -13.03125, -12.5390625, -12.046875, -11.5546875, -11.0625, -10.5703125, -10.078125, -9.5859375, -9.09375, -8.6015625, -8.109375, -7.6171875, -7.125, -6.6328125, -6.140625, -5.6484375, -5.15625, -4.6640625, -4.171875, -3.6796875, -3.1875, -2.6953125, -2.203125, -1.7109375, -1.21875, -0.7265625, -0.234375, 0.2578125, 0.75, 1.2421875, 1.734375, 2.2265625, 2.71875, 3.2109375, 3.703125, 4.1953125, 4.6875, 5.1796875, 5.671875, 6.1640625, 6.65625, 7.1484375, 7.640625, 8.1328125, 8.625, 9.1171875, 9.609375, 10.1015625, 10.59375, 11.0859375, 11.578125, 12.0703125, 12.5625, 13.0546875, 13.546875, 14.0390625, 14.53125, 15.0234375, 15.515625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 3.0, 3.0, 10.0, 13.0, 13.0, 12.0, 24.0, 14.0, 18.0, 28.0, 35.0, 38.0, 33.0, 38.0, 57.0, 72.0, 109.0, 227.0, 1587.0, 238.0, 93.0, 46.0, 37.0, 31.0, 34.0, 35.0, 29.0, 23.0, 23.0, 19.0, 20.0, 14.0, 13.0, 10.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.515625, -17.94482421875, -17.3740234375, -16.80322265625, -16.232421875, -15.66162109375, -15.0908203125, -14.52001953125, -13.94921875, -13.37841796875, -12.8076171875, -12.23681640625, -11.666015625, -11.09521484375, -10.5244140625, -9.95361328125, -9.3828125, -8.81201171875, -8.2412109375, -7.67041015625, -7.099609375, -6.52880859375, -5.9580078125, -5.38720703125, -4.81640625, -4.24560546875, -3.6748046875, -3.10400390625, -2.533203125, -1.96240234375, -1.3916015625, -0.82080078125, -0.25, 0.32080078125, 0.8916015625, 1.46240234375, 2.033203125, 2.60400390625, 3.1748046875, 3.74560546875, 4.31640625, 4.88720703125, 5.4580078125, 6.02880859375, 6.599609375, 7.17041015625, 7.7412109375, 8.31201171875, 8.8828125, 9.45361328125, 10.0244140625, 10.59521484375, 11.166015625, 11.73681640625, 12.3076171875, 12.87841796875, 13.44921875, 14.02001953125, 14.5908203125, 15.16162109375, 15.732421875, 16.30322265625, 16.8740234375, 17.44482421875, 18.015625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 6.0, 10.0, 13.0, 5.0, 12.0, 17.0, 26.0, 31.0, 31.0, 38.0, 58.0, 71.0, 90.0, 140.0, 189.0, 319.0, 609.0, 1575.0, 39710.0, 3096200.0, 4163.0, 980.0, 459.0, 242.0, 179.0, 117.0, 84.0, 58.0, 72.0, 40.0, 32.0, 26.0, 17.0, 12.0, 15.0, 8.0, 14.0, 7.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-54.5625, -52.87255859375, -51.1826171875, -49.49267578125, -47.802734375, -46.11279296875, -44.4228515625, -42.73291015625, -41.04296875, -39.35302734375, -37.6630859375, -35.97314453125, -34.283203125, -32.59326171875, -30.9033203125, -29.21337890625, -27.5234375, -25.83349609375, -24.1435546875, -22.45361328125, -20.763671875, -19.07373046875, -17.3837890625, -15.69384765625, -14.00390625, -12.31396484375, -10.6240234375, -8.93408203125, -7.244140625, -5.55419921875, -3.8642578125, -2.17431640625, -0.484375, 1.20556640625, 2.8955078125, 4.58544921875, 6.275390625, 7.96533203125, 9.6552734375, 11.34521484375, 13.03515625, 14.72509765625, 16.4150390625, 18.10498046875, 19.794921875, 21.48486328125, 23.1748046875, 24.86474609375, 26.5546875, 28.24462890625, 29.9345703125, 31.62451171875, 33.314453125, 35.00439453125, 36.6943359375, 38.38427734375, 40.07421875, 41.76416015625, 43.4541015625, 45.14404296875, 46.833984375, 48.52392578125, 50.2138671875, 51.90380859375, 53.59375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 19.0, 82.0, 253.0, 365.0, 225.0, 43.0, 14.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.48968505859375, -102.51563262939453, -99.54158782958984, -96.56753540039062, -93.59349060058594, -90.61943817138672, -87.6453857421875, -84.67134094238281, -81.6972885131836, -78.72323608398438, -75.74919128417969, -72.77513885498047, -69.80109405517578, -66.82704162597656, -63.85299301147461, -60.878944396972656, -57.9048957824707, -54.93084716796875, -51.9567985534668, -48.982749938964844, -46.008697509765625, -43.03464889526367, -40.06060028076172, -37.0865478515625, -34.11250305175781, -31.13845443725586, -28.164403915405273, -25.19035530090332, -22.216304779052734, -19.24225616455078, -16.268207550048828, -13.294157028198242, -10.320106506347656, -7.346056938171387, -4.372007846832275, -1.397958755493164, 1.5760908126831055, 4.550140380859375, 7.524188995361328, 10.498239517211914, 13.472288131713867, 16.44633674621582, 19.420387268066406, 22.39443588256836, 25.368484497070312, 28.3425350189209, 31.31658363342285, 34.29063415527344, 37.26468276977539, 40.238731384277344, 43.2127799987793, 46.18682861328125, 49.16088104248047, 52.13492965698242, 55.108978271484375, 58.083030700683594, 61.05707550048828, 64.0311279296875, 67.00517272949219, 69.9792251586914, 72.9532699584961, 75.92732238769531, 78.9013671875, 81.87541961669922, 84.84947204589844]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 4.0, 12.0, 19.0, 14.0, 13.0, 14.0, 22.0, 21.0, 33.0, 34.0, 25.0, 36.0, 40.0, 34.0, 42.0, 45.0, 34.0, 56.0, 41.0, 45.0, 51.0, 44.0, 43.0, 26.0, 33.0, 30.0, 24.0, 28.0, 24.0, 25.0, 13.0, 16.0, 10.0, 4.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.913509368896484, -58.10139083862305, -56.28927230834961, -54.477149963378906, -52.66503143310547, -50.85291290283203, -49.040794372558594, -47.228675842285156, -45.41655731201172, -43.60443878173828, -41.792320251464844, -39.980201721191406, -38.1680793762207, -36.355960845947266, -34.54384231567383, -32.73172378540039, -30.91960334777832, -29.107484817504883, -27.295364379882812, -25.483245849609375, -23.671127319335938, -21.8590087890625, -20.04688835144043, -18.234769821166992, -16.422649383544922, -14.610529899597168, -12.79841136932373, -10.986291885375977, -9.174173355102539, -7.362053871154785, -5.549934387207031, -3.7378158569335938, -1.9256973266601562, -0.113578200340271, 1.6985409259796143, 3.510660171508789, 5.322779178619385, 7.1348981857299805, 8.947017669677734, 10.759136199951172, 12.571255683898926, 14.38337516784668, 16.195493698120117, 18.007614135742188, 19.819732666015625, 21.631851196289062, 23.4439697265625, 25.256088256835938, 27.068208694458008, 28.880327224731445, 30.692447662353516, 32.50456619262695, 34.31668472290039, 36.12880325317383, 37.94092559814453, 39.75304412841797, 41.565162658691406, 43.377281188964844, 45.18939971923828, 47.00151824951172, 48.81364059448242, 50.62575912475586, 52.4378776550293, 54.249996185302734, 56.06211471557617]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 5.0, 7.0, 13.0, 13.0, 14.0, 22.0, 18.0, 27.0, 35.0, 27.0, 18.0, 25.0, 31.0, 35.0, 35.0, 48.0, 40.0, 28.0, 34.0, 26.0, 41.0, 32.0, 37.0, 28.0, 40.0, 34.0, 22.0, 33.0, 27.0, 30.0, 15.0, 28.0, 17.0, 14.0, 16.0, 12.0, 10.0, 12.0, 6.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.35546875, -6.15106201171875, -5.9466552734375, -5.74224853515625, -5.537841796875, -5.33343505859375, -5.1290283203125, -4.92462158203125, -4.72021484375, -4.51580810546875, -4.3114013671875, -4.10699462890625, -3.902587890625, -3.69818115234375, -3.4937744140625, -3.28936767578125, -3.0849609375, -2.88055419921875, -2.6761474609375, -2.47174072265625, -2.267333984375, -2.06292724609375, -1.8585205078125, -1.65411376953125, -1.44970703125, -1.24530029296875, -1.0408935546875, -0.83648681640625, -0.632080078125, -0.42767333984375, -0.2232666015625, -0.01885986328125, 0.185546875, 0.38995361328125, 0.5943603515625, 0.79876708984375, 1.003173828125, 1.20758056640625, 1.4119873046875, 1.61639404296875, 1.82080078125, 2.02520751953125, 2.2296142578125, 2.43402099609375, 2.638427734375, 2.84283447265625, 3.0472412109375, 3.25164794921875, 3.4560546875, 3.66046142578125, 3.8648681640625, 4.06927490234375, 4.273681640625, 4.47808837890625, 4.6824951171875, 4.88690185546875, 5.09130859375, 5.29571533203125, 5.5001220703125, 5.70452880859375, 5.908935546875, 6.11334228515625, 6.3177490234375, 6.52215576171875, 6.7265625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 6.0, 12.0, 13.0, 14.0, 24.0, 34.0, 46.0, 79.0, 108.0, 131.0, 175.0, 241.0, 368.0, 517.0, 716.0, 1126.0, 1638.0, 2727.0, 4618.0, 9205.0, 21567.0, 72090.0, 315362.0, 1094449.0, 1680991.0, 728873.0, 181559.0, 44781.0, 15179.0, 6974.0, 3886.0, 2314.0, 1395.0, 923.0, 600.0, 439.0, 324.0, 219.0, 159.0, 122.0, 86.0, 65.0, 40.0, 35.0, 14.0, 9.0, 11.0, 9.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0], "bins": [-9.4453125, -9.1700439453125, -8.894775390625, -8.6195068359375, -8.34423828125, -8.0689697265625, -7.793701171875, -7.5184326171875, -7.2431640625, -6.9678955078125, -6.692626953125, -6.4173583984375, -6.14208984375, -5.8668212890625, -5.591552734375, -5.3162841796875, -5.041015625, -4.7657470703125, -4.490478515625, -4.2152099609375, -3.93994140625, -3.6646728515625, -3.389404296875, -3.1141357421875, -2.8388671875, -2.5635986328125, -2.288330078125, -2.0130615234375, -1.73779296875, -1.4625244140625, -1.187255859375, -0.9119873046875, -0.63671875, -0.3614501953125, -0.086181640625, 0.1890869140625, 0.46435546875, 0.7396240234375, 1.014892578125, 1.2901611328125, 1.5654296875, 1.8406982421875, 2.115966796875, 2.3912353515625, 2.66650390625, 2.9417724609375, 3.217041015625, 3.4923095703125, 3.767578125, 4.0428466796875, 4.318115234375, 4.5933837890625, 4.86865234375, 5.1439208984375, 5.419189453125, 5.6944580078125, 5.9697265625, 6.2449951171875, 6.520263671875, 6.7955322265625, 7.07080078125, 7.3460693359375, 7.621337890625, 7.8966064453125, 8.171875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 19.0, 30.0, 49.0, 89.0, 156.0, 262.0, 459.0, 716.0, 843.0, 560.0, 359.0, 203.0, 131.0, 73.0, 54.0, 22.0, 18.0, 3.0, 7.0, 7.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.805419921875, -13.15771484375, -12.510009765625, -11.8623046875, -11.214599609375, -10.56689453125, -9.919189453125, -9.271484375, -8.623779296875, -7.97607421875, -7.328369140625, -6.6806640625, -6.032958984375, -5.38525390625, -4.737548828125, -4.08984375, -3.442138671875, -2.79443359375, -2.146728515625, -1.4990234375, -0.851318359375, -0.20361328125, 0.444091796875, 1.091796875, 1.739501953125, 2.38720703125, 3.034912109375, 3.6826171875, 4.330322265625, 4.97802734375, 5.625732421875, 6.2734375, 6.921142578125, 7.56884765625, 8.216552734375, 8.8642578125, 9.511962890625, 10.15966796875, 10.807373046875, 11.455078125, 12.102783203125, 12.75048828125, 13.398193359375, 14.0458984375, 14.693603515625, 15.34130859375, 15.989013671875, 16.63671875, 17.284423828125, 17.93212890625, 18.579833984375, 19.2275390625, 19.875244140625, 20.52294921875, 21.170654296875, 21.818359375, 22.466064453125, 23.11376953125, 23.761474609375, 24.4091796875, 25.056884765625, 25.70458984375, 26.352294921875, 27.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 10.0, 6.0, 31.0, 38.0, 72.0, 124.0, 275.0, 579.0, 1417.0, 5360.0, 2686681.0, 1492535.0, 4670.0, 1364.0, 560.0, 242.0, 143.0, 53.0, 36.0, 21.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.09375, -61.51513671875, -59.9365234375, -58.35791015625, -56.779296875, -55.20068359375, -53.6220703125, -52.04345703125, -50.46484375, -48.88623046875, -47.3076171875, -45.72900390625, -44.150390625, -42.57177734375, -40.9931640625, -39.41455078125, -37.8359375, -36.25732421875, -34.6787109375, -33.10009765625, -31.521484375, -29.94287109375, -28.3642578125, -26.78564453125, -25.20703125, -23.62841796875, -22.0498046875, -20.47119140625, -18.892578125, -17.31396484375, -15.7353515625, -14.15673828125, -12.578125, -10.99951171875, -9.4208984375, -7.84228515625, -6.263671875, -4.68505859375, -3.1064453125, -1.52783203125, 0.05078125, 1.62939453125, 3.2080078125, 4.78662109375, 6.365234375, 7.94384765625, 9.5224609375, 11.10107421875, 12.6796875, 14.25830078125, 15.8369140625, 17.41552734375, 18.994140625, 20.57275390625, 22.1513671875, 23.72998046875, 25.30859375, 26.88720703125, 28.4658203125, 30.04443359375, 31.623046875, 33.20166015625, 34.7802734375, 36.35888671875, 37.9375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 68.0, 689.0, 252.0, 2.0, 0.0, 2.0], "bins": [-572.313232421875, -562.7169799804688, -553.1207275390625, -543.5244750976562, -533.92822265625, -524.3319702148438, -514.7357177734375, -505.13946533203125, -495.543212890625, -485.94696044921875, -476.3507080078125, -466.75445556640625, -457.158203125, -447.56195068359375, -437.9656982421875, -428.36944580078125, -418.7732238769531, -409.1769714355469, -399.5807189941406, -389.9844665527344, -380.3882141113281, -370.7919616699219, -361.1957092285156, -351.5994873046875, -342.00323486328125, -332.406982421875, -322.81072998046875, -313.2144775390625, -303.61822509765625, -294.02197265625, -284.42572021484375, -274.8294677734375, -265.2332458496094, -255.63699340820312, -246.04074096679688, -236.44448852539062, -226.84823608398438, -217.25198364257812, -207.65574645996094, -198.0594940185547, -188.46324157714844, -178.8669891357422, -169.27073669433594, -159.6744842529297, -150.0782470703125, -140.48199462890625, -130.8857421875, -121.28948974609375, -111.6932373046875, -102.09698486328125, -92.500732421875, -82.90448760986328, -73.30823516845703, -63.71198272705078, -54.1157341003418, -44.51948547363281, -34.92323303222656, -25.326982498168945, -15.730731964111328, -6.134481430053711, 3.4617691040039062, 13.058021545410156, 22.65427017211914, 32.250518798828125, 41.846771240234375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 11.0, 7.0, 10.0, 14.0, 22.0, 27.0, 29.0, 16.0, 26.0, 33.0, 39.0, 43.0, 54.0, 49.0, 20.0, 51.0, 42.0, 60.0, 59.0, 47.0, 46.0, 42.0, 38.0, 34.0, 27.0, 26.0, 22.0, 30.0, 20.0, 15.0, 7.0, 5.0, 4.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-59.777099609375, -58.08835220336914, -56.39960479736328, -54.71086120605469, -53.02211380004883, -51.33336639404297, -49.64461898803711, -47.95587158203125, -46.267127990722656, -44.5783805847168, -42.88963317871094, -41.200889587402344, -39.512142181396484, -37.823394775390625, -36.134647369384766, -34.445899963378906, -32.75715255737305, -31.068405151367188, -29.37965965270996, -27.6909122467041, -26.002166748046875, -24.313419342041016, -22.624671936035156, -20.935924530029297, -19.24717903137207, -17.55843162536621, -15.869686126708984, -14.180938720703125, -12.492192268371582, -10.803445816040039, -9.11469841003418, -7.425951957702637, -5.737205505371094, -4.048459053039551, -2.3597121238708496, -0.6709651947021484, 1.0177812576293945, 2.7065277099609375, 4.395275115966797, 6.08402156829834, 7.772768020629883, 9.461514472961426, 11.150260925292969, 12.839008331298828, 14.527754783630371, 16.216501235961914, 17.905248641967773, 19.593994140625, 21.28274154663086, 22.97148895263672, 24.660234451293945, 26.348981857299805, 28.03772735595703, 29.72647476196289, 31.41522216796875, 33.10396957397461, 34.79271697998047, 36.48146438598633, 38.17021179199219, 39.85895538330078, 41.54770278930664, 43.2364501953125, 44.92519760131836, 46.61394500732422, 48.30268859863281]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 7.0, 11.0, 15.0, 17.0, 15.0, 15.0, 20.0, 13.0, 28.0, 29.0, 31.0, 32.0, 30.0, 44.0, 33.0, 34.0, 35.0, 42.0, 33.0, 33.0, 39.0, 38.0, 39.0, 34.0, 43.0, 30.0, 25.0, 19.0, 29.0, 19.0, 24.0, 15.0, 23.0, 20.0, 8.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-5.18359375, -5.02191162109375, -4.8602294921875, -4.69854736328125, -4.536865234375, -4.37518310546875, -4.2135009765625, -4.05181884765625, -3.89013671875, -3.72845458984375, -3.5667724609375, -3.40509033203125, -3.243408203125, -3.08172607421875, -2.9200439453125, -2.75836181640625, -2.5966796875, -2.43499755859375, -2.2733154296875, -2.11163330078125, -1.949951171875, -1.78826904296875, -1.6265869140625, -1.46490478515625, -1.30322265625, -1.14154052734375, -0.9798583984375, -0.81817626953125, -0.656494140625, -0.49481201171875, -0.3331298828125, -0.17144775390625, -0.009765625, 0.15191650390625, 0.3135986328125, 0.47528076171875, 0.636962890625, 0.79864501953125, 0.9603271484375, 1.12200927734375, 1.28369140625, 1.44537353515625, 1.6070556640625, 1.76873779296875, 1.930419921875, 2.09210205078125, 2.2537841796875, 2.41546630859375, 2.5771484375, 2.73883056640625, 2.9005126953125, 3.06219482421875, 3.223876953125, 3.38555908203125, 3.5472412109375, 3.70892333984375, 3.87060546875, 4.03228759765625, 4.1939697265625, 4.35565185546875, 4.517333984375, 4.67901611328125, 4.8406982421875, 5.00238037109375, 5.1640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 3.0, 9.0, 11.0, 20.0, 19.0, 25.0, 49.0, 78.0, 104.0, 147.0, 226.0, 290.0, 424.0, 636.0, 883.0, 1204.0, 1724.0, 2552.0, 3515.0, 5090.0, 7600.0, 11518.0, 17491.0, 27830.0, 45550.0, 77357.0, 143757.0, 242942.0, 194204.0, 103851.0, 58858.0, 35076.0, 21881.0, 13976.0, 9203.0, 6233.0, 4265.0, 2950.0, 2166.0, 1421.0, 1026.0, 687.0, 475.0, 338.0, 277.0, 185.0, 135.0, 72.0, 71.0, 50.0, 33.0, 20.0, 19.0, 16.0, 7.0, 2.0, 2.0, 4.0], "bins": [-0.7373046875, -0.7154541015625, -0.693603515625, -0.6717529296875, -0.64990234375, -0.6280517578125, -0.606201171875, -0.5843505859375, -0.5625, -0.5406494140625, -0.518798828125, -0.4969482421875, -0.47509765625, -0.4532470703125, -0.431396484375, -0.4095458984375, -0.3876953125, -0.3658447265625, -0.343994140625, -0.3221435546875, -0.30029296875, -0.2784423828125, -0.256591796875, -0.2347412109375, -0.212890625, -0.1910400390625, -0.169189453125, -0.1473388671875, -0.12548828125, -0.1036376953125, -0.081787109375, -0.0599365234375, -0.0380859375, -0.0162353515625, 0.005615234375, 0.0274658203125, 0.04931640625, 0.0711669921875, 0.093017578125, 0.1148681640625, 0.13671875, 0.1585693359375, 0.180419921875, 0.2022705078125, 0.22412109375, 0.2459716796875, 0.267822265625, 0.2896728515625, 0.3115234375, 0.3333740234375, 0.355224609375, 0.3770751953125, 0.39892578125, 0.4207763671875, 0.442626953125, 0.4644775390625, 0.486328125, 0.5081787109375, 0.530029296875, 0.5518798828125, 0.57373046875, 0.5955810546875, 0.617431640625, 0.6392822265625, 0.6611328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 5.0, 7.0, 7.0, 7.0, 15.0, 20.0, 17.0, 15.0, 23.0, 28.0, 30.0, 27.0, 37.0, 37.0, 45.0, 43.0, 42.0, 37.0, 46.0, 1069.0, 42.0, 30.0, 30.0, 28.0, 33.0, 31.0, 31.0, 29.0, 28.0, 25.0, 18.0, 24.0, 10.0, 17.0, 9.0, 13.0, 12.0, 7.0, 4.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.34765625, -3.240570068359375, -3.13348388671875, -3.026397705078125, -2.9193115234375, -2.812225341796875, -2.70513916015625, -2.598052978515625, -2.490966796875, -2.383880615234375, -2.27679443359375, -2.169708251953125, -2.0626220703125, -1.955535888671875, -1.84844970703125, -1.741363525390625, -1.63427734375, -1.527191162109375, -1.42010498046875, -1.313018798828125, -1.2059326171875, -1.098846435546875, -0.99176025390625, -0.884674072265625, -0.777587890625, -0.670501708984375, -0.56341552734375, -0.456329345703125, -0.3492431640625, -0.242156982421875, -0.13507080078125, -0.027984619140625, 0.0791015625, 0.186187744140625, 0.29327392578125, 0.400360107421875, 0.5074462890625, 0.614532470703125, 0.72161865234375, 0.828704833984375, 0.935791015625, 1.042877197265625, 1.14996337890625, 1.257049560546875, 1.3641357421875, 1.471221923828125, 1.57830810546875, 1.685394287109375, 1.79248046875, 1.899566650390625, 2.00665283203125, 2.113739013671875, 2.2208251953125, 2.327911376953125, 2.43499755859375, 2.542083740234375, 2.649169921875, 2.756256103515625, 2.86334228515625, 2.970428466796875, 3.0775146484375, 3.184600830078125, 3.29168701171875, 3.398773193359375, 3.505859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 9.0, 17.0, 31.0, 36.0, 68.0, 85.0, 133.0, 157.0, 228.0, 355.0, 469.0, 672.0, 1089.0, 1483.0, 2191.0, 3192.0, 4766.0, 7217.0, 11068.0, 16962.0, 27024.0, 44358.0, 75640.0, 138781.0, 1286648.0, 202179.0, 109386.0, 60815.0, 36375.0, 22621.0, 14592.0, 9336.0, 5961.0, 4172.0, 2822.0, 1822.0, 1350.0, 971.0, 634.0, 428.0, 303.0, 229.0, 164.0, 84.0, 69.0, 37.0, 30.0, 31.0, 20.0, 7.0, 8.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.693359375, -0.6728515625, -0.65234375, -0.6318359375, -0.611328125, -0.5908203125, -0.5703125, -0.5498046875, -0.529296875, -0.5087890625, -0.48828125, -0.4677734375, -0.447265625, -0.4267578125, -0.40625, -0.3857421875, -0.365234375, -0.3447265625, -0.32421875, -0.3037109375, -0.283203125, -0.2626953125, -0.2421875, -0.2216796875, -0.201171875, -0.1806640625, -0.16015625, -0.1396484375, -0.119140625, -0.0986328125, -0.078125, -0.0576171875, -0.037109375, -0.0166015625, 0.00390625, 0.0244140625, 0.044921875, 0.0654296875, 0.0859375, 0.1064453125, 0.126953125, 0.1474609375, 0.16796875, 0.1884765625, 0.208984375, 0.2294921875, 0.25, 0.2705078125, 0.291015625, 0.3115234375, 0.33203125, 0.3525390625, 0.373046875, 0.3935546875, 0.4140625, 0.4345703125, 0.455078125, 0.4755859375, 0.49609375, 0.5166015625, 0.537109375, 0.5576171875, 0.578125, 0.5986328125, 0.619140625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 0.0, 4.0, 2.0, 7.0, 8.0, 7.0, 13.0, 7.0, 12.0, 16.0, 23.0, 26.0, 20.0, 26.0, 18.0, 41.0, 39.0, 42.0, 50.0, 47.0, 49.0, 61.0, 45.0, 49.0, 41.0, 55.0, 44.0, 40.0, 35.0, 35.0, 28.0, 14.0, 21.0, 21.0, 22.0, 12.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00131988525390625, -0.0012701302766799927, -0.0012203752994537354, -0.001170620322227478, -0.0011208653450012207, -0.0010711103677749634, -0.001021355390548706, -0.0009716004133224487, -0.0009218454360961914, -0.0008720904588699341, -0.0008223354816436768, -0.0007725805044174194, -0.0007228255271911621, -0.0006730705499649048, -0.0006233155727386475, -0.0005735605955123901, -0.0005238056182861328, -0.0004740506410598755, -0.00042429566383361816, -0.00037454068660736084, -0.0003247857093811035, -0.0002750307321548462, -0.00022527575492858887, -0.00017552077770233154, -0.00012576580047607422, -7.60108232498169e-05, -2.625584602355957e-05, 2.3499131202697754e-05, 7.325410842895508e-05, 0.0001230090856552124, 0.00017276406288146973, 0.00022251904010772705, 0.0002722740173339844, 0.0003220289945602417, 0.000371783971786499, 0.00042153894901275635, 0.00047129392623901367, 0.000521048903465271, 0.0005708038806915283, 0.0006205588579177856, 0.000670313835144043, 0.0007200688123703003, 0.0007698237895965576, 0.0008195787668228149, 0.0008693337440490723, 0.0009190887212753296, 0.0009688436985015869, 0.0010185986757278442, 0.0010683536529541016, 0.0011181086301803589, 0.0011678636074066162, 0.0012176185846328735, 0.0012673735618591309, 0.0013171285390853882, 0.0013668835163116455, 0.0014166384935379028, 0.0014663934707641602, 0.0015161484479904175, 0.0015659034252166748, 0.0016156584024429321, 0.0016654133796691895, 0.0017151683568954468, 0.001764923334121704, 0.0018146783113479614, 0.0018644332885742188]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 14.0, 18.0, 24.0, 29.0, 39.0, 53.0, 55.0, 69.0, 112.0, 133.0, 199.0, 257.0, 380.0, 612.0, 1264.0, 307306.0, 734440.0, 1467.0, 641.0, 384.0, 260.0, 178.0, 144.0, 99.0, 91.0, 58.0, 46.0, 45.0, 31.0, 25.0, 20.0, 11.0, 8.0, 12.0, 9.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027557373046875, -0.026670217514038086, -0.025783061981201172, -0.024895906448364258, -0.024008750915527344, -0.02312159538269043, -0.022234439849853516, -0.0213472843170166, -0.020460128784179688, -0.019572973251342773, -0.01868581771850586, -0.017798662185668945, -0.01691150665283203, -0.016024351119995117, -0.015137195587158203, -0.014250040054321289, -0.013362884521484375, -0.012475728988647461, -0.011588573455810547, -0.010701417922973633, -0.009814262390136719, -0.008927106857299805, -0.00803995132446289, -0.0071527957916259766, -0.0062656402587890625, -0.0053784847259521484, -0.004491329193115234, -0.0036041736602783203, -0.0027170181274414062, -0.0018298625946044922, -0.0009427070617675781, -5.555152893066406e-05, 0.00083160400390625, 0.001718759536743164, 0.002605915069580078, 0.003493070602416992, 0.004380226135253906, 0.00526738166809082, 0.006154537200927734, 0.0070416927337646484, 0.007928848266601562, 0.008816003799438477, 0.00970315933227539, 0.010590314865112305, 0.011477470397949219, 0.012364625930786133, 0.013251781463623047, 0.014138936996459961, 0.015026092529296875, 0.01591324806213379, 0.016800403594970703, 0.017687559127807617, 0.01857471466064453, 0.019461870193481445, 0.02034902572631836, 0.021236181259155273, 0.022123336791992188, 0.0230104923248291, 0.023897647857666016, 0.02478480339050293, 0.025671958923339844, 0.026559114456176758, 0.027446269989013672, 0.028333425521850586, 0.0292205810546875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 31.0, 149.0, 338.0, 315.0, 133.0, 30.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002386812586337328, -0.0023185203317552805, -0.0022502278443425894, -0.002181935589760542, -0.002113643102347851, -0.0020453508477658033, -0.0019770583603531122, -0.0019087661057710648, -0.0018404737347736955, -0.0017721813637763262, -0.0017038889927789569, -0.0016355966217815876, -0.0015673043671995401, -0.001499011879786849, -0.0014307196252048016, -0.0013624272542074323, -0.001294134883210063, -0.0012258425122126937, -0.0011575501412153244, -0.0010892577702179551, -0.0010209653992205858, -0.0009526730864308774, -0.0008843807736411691, -0.0008160884026437998, -0.0007477960316464305, -0.0006795036606490612, -0.0006112112896516919, -0.0005429189768619835, -0.00047462660586461425, -0.00040633423486724496, -0.0003380418929737061, -0.0002697495510801673, -0.00020145741291344166, -0.0001331650564679876, -6.487270002253354e-05, 3.419656422920525e-06, 7.171201286837459e-05, 0.00014000438386574388, 0.0002082967257592827, 0.00027658906765282154, 0.00034488143865019083, 0.0004131738096475601, 0.00048146615154109895, 0.0005497584934346378, 0.0006180508644320071, 0.0006863432354293764, 0.0007546355482190847, 0.000822927919216454, 0.0008912202902138233, 0.0009595126612111926, 0.001027805032208562, 0.0010960974032059312, 0.0011643897742033005, 0.001232682028785348, 0.0013009743997827172, 0.0013692667707800865, 0.0014375591417774558, 0.001505851512774825, 0.0015741438837721944, 0.0016424362547695637, 0.0017107285093516111, 0.0017790209967643023, 0.0018473132513463497, 0.001915605622343719, 0.0019838979933410883]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 8.0, 15.0, 17.0, 16.0, 20.0, 27.0, 30.0, 24.0, 26.0, 29.0, 40.0, 36.0, 37.0, 52.0, 38.0, 36.0, 45.0, 28.0, 40.0, 44.0, 35.0, 36.0, 32.0, 24.0, 34.0, 21.0, 30.0, 22.0, 20.0, 16.0, 15.0, 19.0, 16.0, 8.0, 7.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007917284965515137, -0.000765705481171608, -0.0007396824657917023, -0.0007136594504117966, -0.0006876364350318909, -0.0006616134196519852, -0.0006355904042720795, -0.0006095673888921738, -0.0005835443735122681, -0.0005575213581323624, -0.0005314983427524567, -0.000505475327372551, -0.00047945231199264526, -0.00045342929661273956, -0.00042740628123283386, -0.00040138326585292816, -0.00037536025047302246, -0.00034933723509311676, -0.00032331421971321106, -0.00029729120433330536, -0.00027126818895339966, -0.00024524517357349396, -0.00021922215819358826, -0.00019319914281368256, -0.00016717612743377686, -0.00014115311205387115, -0.00011513009667396545, -8.910708129405975e-05, -6.308406591415405e-05, -3.706105053424835e-05, -1.1038035154342651e-05, 1.498498022556305e-05, 4.100799560546875e-05, 6.703101098537445e-05, 9.305402636528015e-05, 0.00011907704174518585, 0.00014510005712509155, 0.00017112307250499725, 0.00019714608788490295, 0.00022316910326480865, 0.00024919211864471436, 0.00027521513402462006, 0.00030123814940452576, 0.00032726116478443146, 0.00035328418016433716, 0.00037930719554424286, 0.00040533021092414856, 0.00043135322630405426, 0.00045737624168395996, 0.00048339925706386566, 0.0005094222724437714, 0.0005354452878236771, 0.0005614683032035828, 0.0005874913185834885, 0.0006135143339633942, 0.0006395373493432999, 0.0006655603647232056, 0.0006915833801031113, 0.000717606395483017, 0.0007436294108629227, 0.0007696524262428284, 0.0007956754416227341, 0.0008216984570026398, 0.0008477214723825455, 0.0008737444877624512]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 7.0, 11.0, 15.0, 17.0, 15.0, 15.0, 20.0, 13.0, 28.0, 29.0, 31.0, 32.0, 30.0, 44.0, 33.0, 34.0, 35.0, 42.0, 33.0, 33.0, 39.0, 38.0, 39.0, 34.0, 43.0, 30.0, 25.0, 19.0, 29.0, 19.0, 24.0, 15.0, 23.0, 20.0, 8.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-5.18359375, -5.02191162109375, -4.8602294921875, -4.69854736328125, -4.536865234375, -4.37518310546875, -4.2135009765625, -4.05181884765625, -3.89013671875, -3.72845458984375, -3.5667724609375, -3.40509033203125, -3.243408203125, -3.08172607421875, -2.9200439453125, -2.75836181640625, -2.5966796875, -2.43499755859375, -2.2733154296875, -2.11163330078125, -1.949951171875, -1.78826904296875, -1.6265869140625, -1.46490478515625, -1.30322265625, -1.14154052734375, -0.9798583984375, -0.81817626953125, -0.656494140625, -0.49481201171875, -0.3331298828125, -0.17144775390625, -0.009765625, 0.15191650390625, 0.3135986328125, 0.47528076171875, 0.636962890625, 0.79864501953125, 0.9603271484375, 1.12200927734375, 1.28369140625, 1.44537353515625, 1.6070556640625, 1.76873779296875, 1.930419921875, 2.09210205078125, 2.2537841796875, 2.41546630859375, 2.5771484375, 2.73883056640625, 2.9005126953125, 3.06219482421875, 3.223876953125, 3.38555908203125, 3.5472412109375, 3.70892333984375, 3.87060546875, 4.03228759765625, 4.1939697265625, 4.35565185546875, 4.517333984375, 4.67901611328125, 4.8406982421875, 5.00238037109375, 5.1640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 16.0, 30.0, 28.0, 53.0, 63.0, 79.0, 102.0, 138.0, 188.0, 255.0, 451.0, 635.0, 1093.0, 1865.0, 3850.0, 9967.0, 31448.0, 144473.0, 612458.0, 183214.0, 37003.0, 11409.0, 4286.0, 2108.0, 1123.0, 688.0, 445.0, 296.0, 222.0, 129.0, 101.0, 72.0, 50.0, 39.0, 37.0, 19.0, 23.0, 10.0, 18.0, 10.0, 4.0, 8.0, 2.0, 3.0, 7.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.9295654296875, -8.616943359375, -8.3043212890625, -7.99169921875, -7.6790771484375, -7.366455078125, -7.0538330078125, -6.7412109375, -6.4285888671875, -6.115966796875, -5.8033447265625, -5.49072265625, -5.1781005859375, -4.865478515625, -4.5528564453125, -4.240234375, -3.9276123046875, -3.614990234375, -3.3023681640625, -2.98974609375, -2.6771240234375, -2.364501953125, -2.0518798828125, -1.7392578125, -1.4266357421875, -1.114013671875, -0.8013916015625, -0.48876953125, -0.1761474609375, 0.136474609375, 0.4490966796875, 0.76171875, 1.0743408203125, 1.386962890625, 1.6995849609375, 2.01220703125, 2.3248291015625, 2.637451171875, 2.9500732421875, 3.2626953125, 3.5753173828125, 3.887939453125, 4.2005615234375, 4.51318359375, 4.8258056640625, 5.138427734375, 5.4510498046875, 5.763671875, 6.0762939453125, 6.388916015625, 6.7015380859375, 7.01416015625, 7.3267822265625, 7.639404296875, 7.9520263671875, 8.2646484375, 8.5772705078125, 8.889892578125, 9.2025146484375, 9.51513671875, 9.8277587890625, 10.140380859375, 10.4530029296875, 10.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 13.0, 13.0, 15.0, 12.0, 17.0, 21.0, 28.0, 30.0, 33.0, 42.0, 57.0, 82.0, 125.0, 1651.0, 441.0, 90.0, 58.0, 50.0, 55.0, 44.0, 41.0, 23.0, 20.0, 16.0, 12.0, 10.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.5625, -17.98046875, -17.3984375, -16.81640625, -16.234375, -15.65234375, -15.0703125, -14.48828125, -13.90625, -13.32421875, -12.7421875, -12.16015625, -11.578125, -10.99609375, -10.4140625, -9.83203125, -9.25, -8.66796875, -8.0859375, -7.50390625, -6.921875, -6.33984375, -5.7578125, -5.17578125, -4.59375, -4.01171875, -3.4296875, -2.84765625, -2.265625, -1.68359375, -1.1015625, -0.51953125, 0.0625, 0.64453125, 1.2265625, 1.80859375, 2.390625, 2.97265625, 3.5546875, 4.13671875, 4.71875, 5.30078125, 5.8828125, 6.46484375, 7.046875, 7.62890625, 8.2109375, 8.79296875, 9.375, 9.95703125, 10.5390625, 11.12109375, 11.703125, 12.28515625, 12.8671875, 13.44921875, 14.03125, 14.61328125, 15.1953125, 15.77734375, 16.359375, 16.94140625, 17.5234375, 18.10546875, 18.6875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 18.0, 16.0, 26.0, 35.0, 40.0, 64.0, 113.0, 226.0, 430.0, 1158.0, 203593.0, 2937381.0, 1407.0, 506.0, 273.0, 136.0, 67.0, 41.0, 21.0, 25.0, 24.0, 16.0, 14.0, 10.0, 9.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.6494140625, -50.955078125, -49.2607421875, -47.56640625, -45.8720703125, -44.177734375, -42.4833984375, -40.7890625, -39.0947265625, -37.400390625, -35.7060546875, -34.01171875, -32.3173828125, -30.623046875, -28.9287109375, -27.234375, -25.5400390625, -23.845703125, -22.1513671875, -20.45703125, -18.7626953125, -17.068359375, -15.3740234375, -13.6796875, -11.9853515625, -10.291015625, -8.5966796875, -6.90234375, -5.2080078125, -3.513671875, -1.8193359375, -0.125, 1.5693359375, 3.263671875, 4.9580078125, 6.65234375, 8.3466796875, 10.041015625, 11.7353515625, 13.4296875, 15.1240234375, 16.818359375, 18.5126953125, 20.20703125, 21.9013671875, 23.595703125, 25.2900390625, 26.984375, 28.6787109375, 30.373046875, 32.0673828125, 33.76171875, 35.4560546875, 37.150390625, 38.8447265625, 40.5390625, 42.2333984375, 43.927734375, 45.6220703125, 47.31640625, 49.0107421875, 50.705078125, 52.3994140625, 54.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 50.0, 182.0, 464.0, 257.0, 46.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.63360595703125, -14.008525848388672, -12.38344669342041, -10.758367538452148, -9.13328742980957, -7.508207321166992, -5.8831281661987305, -4.258049011230469, -2.6329689025878906, -1.0078892707824707, 0.6171903610229492, 2.242269992828369, 3.867349624633789, 5.492429733276367, 7.117508888244629, 8.74258804321289, 10.367668151855469, 11.992748260498047, 13.617827415466309, 15.24290657043457, 16.86798667907715, 18.493066787719727, 20.118144989013672, 21.74322509765625, 23.368305206298828, 24.993385314941406, 26.618465423583984, 28.24354362487793, 29.868623733520508, 31.493703842163086, 33.11878204345703, 34.74386215209961, 36.36894226074219, 37.994022369384766, 39.619102478027344, 41.24418258666992, 42.8692626953125, 44.49433898925781, 46.11941909790039, 47.74449920654297, 49.36957931518555, 50.994659423828125, 52.6197395324707, 54.24481964111328, 55.869895935058594, 57.49497985839844, 59.12005615234375, 60.74513626098633, 62.370216369628906, 63.995296478271484, 65.62037658691406, 67.24545288085938, 68.87053680419922, 70.49561309814453, 72.12069702148438, 73.74577331542969, 75.370849609375, 76.99592590332031, 78.62100982666016, 80.24608612060547, 81.87117004394531, 83.49624633789062, 85.12133026123047, 86.74640655517578, 88.37149047851562]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 14.0, 16.0, 10.0, 27.0, 33.0, 40.0, 37.0, 46.0, 38.0, 56.0, 49.0, 44.0, 48.0, 63.0, 61.0, 57.0, 44.0, 55.0, 39.0, 27.0, 39.0, 32.0, 25.0, 20.0, 18.0, 9.0, 12.0, 10.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.127288818359375, -33.85502243041992, -32.582759857177734, -31.31049346923828, -30.03822898864746, -28.76596450805664, -27.493698120117188, -26.221433639526367, -24.949169158935547, -23.676904678344727, -22.404640197753906, -21.132373809814453, -19.860109329223633, -18.587844848632812, -17.31557846069336, -16.04331398010254, -14.771049499511719, -13.498785018920898, -12.226519584655762, -10.954254150390625, -9.681989669799805, -8.409725189208984, -7.137459754943848, -5.865194320678711, -4.592929840087891, -3.320664882659912, -2.0483999252319336, -0.7761349678039551, 0.49612998962402344, 1.768394947052002, 3.0406599044799805, 4.312925338745117, 5.585186004638672, 6.85745096206665, 8.129715919494629, 9.401981353759766, 10.674245834350586, 11.946510314941406, 13.218775749206543, 14.49104118347168, 15.7633056640625, 17.03557014465332, 18.30783462524414, 19.580101013183594, 20.852365493774414, 22.124629974365234, 23.396896362304688, 24.669160842895508, 25.941425323486328, 27.21368980407715, 28.48595428466797, 29.758220672607422, 31.030485153198242, 32.30274963378906, 33.575016021728516, 34.84728240966797, 36.119544982910156, 37.39181137084961, 38.6640739440918, 39.93634033203125, 41.20860290527344, 42.48086929321289, 43.753135681152344, 45.02539825439453, 46.297664642333984]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 8.0, 11.0, 10.0, 14.0, 13.0, 23.0, 27.0, 22.0, 30.0, 29.0, 37.0, 27.0, 49.0, 57.0, 51.0, 43.0, 44.0, 39.0, 43.0, 42.0, 56.0, 47.0, 33.0, 27.0, 32.0, 43.0, 28.0, 21.0, 18.0, 14.0, 13.0, 6.0, 3.0, 9.0, 5.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.815673828125, -5.58447265625, -5.353271484375, -5.1220703125, -4.890869140625, -4.65966796875, -4.428466796875, -4.197265625, -3.966064453125, -3.73486328125, -3.503662109375, -3.2724609375, -3.041259765625, -2.81005859375, -2.578857421875, -2.34765625, -2.116455078125, -1.88525390625, -1.654052734375, -1.4228515625, -1.191650390625, -0.96044921875, -0.729248046875, -0.498046875, -0.266845703125, -0.03564453125, 0.195556640625, 0.4267578125, 0.657958984375, 0.88916015625, 1.120361328125, 1.3515625, 1.582763671875, 1.81396484375, 2.045166015625, 2.2763671875, 2.507568359375, 2.73876953125, 2.969970703125, 3.201171875, 3.432373046875, 3.66357421875, 3.894775390625, 4.1259765625, 4.357177734375, 4.58837890625, 4.819580078125, 5.05078125, 5.281982421875, 5.51318359375, 5.744384765625, 5.9755859375, 6.206787109375, 6.43798828125, 6.669189453125, 6.900390625, 7.131591796875, 7.36279296875, 7.593994140625, 7.8251953125, 8.056396484375, 8.28759765625, 8.518798828125, 8.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 12.0, 9.0, 19.0, 13.0, 31.0, 30.0, 41.0, 64.0, 77.0, 105.0, 137.0, 202.0, 275.0, 471.0, 687.0, 1201.0, 4167.0, 226606.0, 3923754.0, 31036.0, 2425.0, 976.0, 579.0, 401.0, 244.0, 178.0, 119.0, 101.0, 91.0, 52.0, 44.0, 27.0, 25.0, 27.0, 18.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.73828125, -35.2890625, -33.83984375, -32.390625, -30.94140625, -29.4921875, -28.04296875, -26.59375, -25.14453125, -23.6953125, -22.24609375, -20.796875, -19.34765625, -17.8984375, -16.44921875, -15.0, -13.55078125, -12.1015625, -10.65234375, -9.203125, -7.75390625, -6.3046875, -4.85546875, -3.40625, -1.95703125, -0.5078125, 0.94140625, 2.390625, 3.83984375, 5.2890625, 6.73828125, 8.1875, 9.63671875, 11.0859375, 12.53515625, 13.984375, 15.43359375, 16.8828125, 18.33203125, 19.78125, 21.23046875, 22.6796875, 24.12890625, 25.578125, 27.02734375, 28.4765625, 29.92578125, 31.375, 32.82421875, 34.2734375, 35.72265625, 37.171875, 38.62109375, 40.0703125, 41.51953125, 42.96875, 44.41796875, 45.8671875, 47.31640625, 48.765625, 50.21484375, 51.6640625, 53.11328125, 54.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 8.0, 13.0, 21.0, 29.0, 31.0, 77.0, 130.0, 180.0, 313.0, 456.0, 670.0, 653.0, 524.0, 333.0, 225.0, 127.0, 89.0, 63.0, 33.0, 18.0, 15.0, 11.0, 12.0, 4.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.89404296875, -9.4990234375, -9.10400390625, -8.708984375, -8.31396484375, -7.9189453125, -7.52392578125, -7.12890625, -6.73388671875, -6.3388671875, -5.94384765625, -5.548828125, -5.15380859375, -4.7587890625, -4.36376953125, -3.96875, -3.57373046875, -3.1787109375, -2.78369140625, -2.388671875, -1.99365234375, -1.5986328125, -1.20361328125, -0.80859375, -0.41357421875, -0.0185546875, 0.37646484375, 0.771484375, 1.16650390625, 1.5615234375, 1.95654296875, 2.3515625, 2.74658203125, 3.1416015625, 3.53662109375, 3.931640625, 4.32666015625, 4.7216796875, 5.11669921875, 5.51171875, 5.90673828125, 6.3017578125, 6.69677734375, 7.091796875, 7.48681640625, 7.8818359375, 8.27685546875, 8.671875, 9.06689453125, 9.4619140625, 9.85693359375, 10.251953125, 10.64697265625, 11.0419921875, 11.43701171875, 11.83203125, 12.22705078125, 12.6220703125, 13.01708984375, 13.412109375, 13.80712890625, 14.2021484375, 14.59716796875, 14.9921875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 14.0, 32.0, 47.0, 93.0, 204.0, 524.0, 1460.0, 5838.0, 36938.0, 836389.0, 3186583.0, 110482.0, 11732.0, 2579.0, 781.0, 291.0, 133.0, 59.0, 36.0, 23.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6796875, -15.1239013671875, -14.568115234375, -14.0123291015625, -13.45654296875, -12.9007568359375, -12.344970703125, -11.7891845703125, -11.2333984375, -10.6776123046875, -10.121826171875, -9.5660400390625, -9.01025390625, -8.4544677734375, -7.898681640625, -7.3428955078125, -6.787109375, -6.2313232421875, -5.675537109375, -5.1197509765625, -4.56396484375, -4.0081787109375, -3.452392578125, -2.8966064453125, -2.3408203125, -1.7850341796875, -1.229248046875, -0.6734619140625, -0.11767578125, 0.4381103515625, 0.993896484375, 1.5496826171875, 2.10546875, 2.6612548828125, 3.217041015625, 3.7728271484375, 4.32861328125, 4.8843994140625, 5.440185546875, 5.9959716796875, 6.5517578125, 7.1075439453125, 7.663330078125, 8.2191162109375, 8.77490234375, 9.3306884765625, 9.886474609375, 10.4422607421875, 10.998046875, 11.5538330078125, 12.109619140625, 12.6654052734375, 13.22119140625, 13.7769775390625, 14.332763671875, 14.8885498046875, 15.4443359375, 16.0001220703125, 16.555908203125, 17.1116943359375, 17.66748046875, 18.2232666015625, 18.779052734375, 19.3348388671875, 19.890625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 20.0, 36.0, 92.0, 130.0, 178.0, 160.0, 138.0, 96.0, 60.0, 26.0, 26.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.20745086669922, -50.938514709472656, -47.669578552246094, -44.40064239501953, -41.13170623779297, -37.862770080566406, -34.593833923339844, -31.32489776611328, -28.05596160888672, -24.787025451660156, -21.518089294433594, -18.24915313720703, -14.980216979980469, -11.711280822753906, -8.442344665527344, -5.173408508300781, -1.9044723510742188, 1.3644638061523438, 4.633399963378906, 7.902336120605469, 11.171272277832031, 14.440208435058594, 17.709144592285156, 20.97808074951172, 24.24701690673828, 27.515953063964844, 30.784889221191406, 34.05382537841797, 37.32276153564453, 40.591697692871094, 43.860633850097656, 47.12957000732422, 50.39851379394531, 53.667449951171875, 56.93638610839844, 60.205322265625, 63.47425842285156, 66.74319458007812, 70.01213073730469, 73.28106689453125, 76.55000305175781, 79.81893920898438, 83.08787536621094, 86.3568115234375, 89.62574768066406, 92.89468383789062, 96.16361999511719, 99.43255615234375, 102.70149230957031, 105.97042846679688, 109.23936462402344, 112.50830078125, 115.77723693847656, 119.04617309570312, 122.31510925292969, 125.58404541015625, 128.8529815673828, 132.12191772460938, 135.39085388183594, 138.6597900390625, 141.92872619628906, 145.19766235351562, 148.4665985107422, 151.73553466796875, 155.0044708251953]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 5.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 10.0, 6.0, 6.0, 20.0, 27.0, 19.0, 23.0, 23.0, 30.0, 38.0, 35.0, 36.0, 39.0, 35.0, 40.0, 36.0, 44.0, 46.0, 43.0, 37.0, 25.0, 39.0, 27.0, 29.0, 33.0, 34.0, 31.0, 19.0, 25.0, 23.0, 18.0, 20.0, 13.0, 8.0, 4.0, 5.0, 8.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.063720703125, -40.90061950683594, -39.737518310546875, -38.57441711425781, -37.41131591796875, -36.24821090698242, -35.08510971069336, -33.9220085144043, -32.758907318115234, -31.595806121826172, -30.43270492553711, -29.269601821899414, -28.10650062561035, -26.94339942932129, -25.780296325683594, -24.61719512939453, -23.45409393310547, -22.290992736816406, -21.127891540527344, -19.96478843688965, -18.801687240600586, -17.638586044311523, -16.475482940673828, -15.312381744384766, -14.149280548095703, -12.98617935180664, -11.823077201843262, -10.659975051879883, -9.49687385559082, -8.333772659301758, -7.170670509338379, -6.007568359375, -4.8444671630859375, -3.681365489959717, -2.518263816833496, -1.3551621437072754, -0.1920604705810547, 0.971041202545166, 2.1341428756713867, 3.2972450256347656, 4.460346221923828, 5.623447895050049, 6.7865495681762695, 7.94965124130249, 9.112752914428711, 10.275854110717773, 11.438956260681152, 12.602058410644531, 13.765159606933594, 14.928260803222656, 16.09136199951172, 17.254465103149414, 18.417566299438477, 19.58066749572754, 20.743770599365234, 21.906871795654297, 23.06997299194336, 24.233074188232422, 25.396175384521484, 26.55927848815918, 27.722379684448242, 28.885480880737305, 30.048583984375, 31.211685180664062, 32.374786376953125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 8.0, 8.0, 13.0, 12.0, 17.0, 30.0, 24.0, 29.0, 48.0, 38.0, 33.0, 38.0, 47.0, 45.0, 39.0, 41.0, 54.0, 49.0, 49.0, 36.0, 43.0, 34.0, 35.0, 36.0, 25.0, 23.0, 26.0, 24.0, 16.0, 8.0, 11.0, 7.0, 10.0, 8.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-81.625, -79.52294921875, -77.4208984375, -75.31884765625, -73.216796875, -71.11474609375, -69.0126953125, -66.91064453125, -64.80859375, -62.70654296875, -60.6044921875, -58.50244140625, -56.400390625, -54.29833984375, -52.1962890625, -50.09423828125, -47.9921875, -45.89013671875, -43.7880859375, -41.68603515625, -39.583984375, -37.48193359375, -35.3798828125, -33.27783203125, -31.17578125, -29.07373046875, -26.9716796875, -24.86962890625, -22.767578125, -20.66552734375, -18.5634765625, -16.46142578125, -14.359375, -12.25732421875, -10.1552734375, -8.05322265625, -5.951171875, -3.84912109375, -1.7470703125, 0.35498046875, 2.45703125, 4.55908203125, 6.6611328125, 8.76318359375, 10.865234375, 12.96728515625, 15.0693359375, 17.17138671875, 19.2734375, 21.37548828125, 23.4775390625, 25.57958984375, 27.681640625, 29.78369140625, 31.8857421875, 33.98779296875, 36.08984375, 38.19189453125, 40.2939453125, 42.39599609375, 44.498046875, 46.60009765625, 48.7021484375, 50.80419921875, 52.90625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 18.0, 14.0, 32.0, 54.0, 67.0, 96.0, 152.0, 209.0, 323.0, 442.0, 622.0, 909.0, 1446.0, 2093.0, 3199.0, 4563.0, 6971.0, 10482.0, 16616.0, 26390.0, 44190.0, 77391.0, 143717.0, 234219.0, 201818.0, 112405.0, 61888.0, 35822.0, 21905.0, 13622.0, 8877.0, 5826.0, 3951.0, 2606.0, 1750.0, 1224.0, 860.0, 569.0, 396.0, 249.0, 177.0, 124.0, 85.0, 57.0, 54.0, 27.0, 17.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.7734375, -6.55352783203125, -6.3336181640625, -6.11370849609375, -5.893798828125, -5.67388916015625, -5.4539794921875, -5.23406982421875, -5.01416015625, -4.79425048828125, -4.5743408203125, -4.35443115234375, -4.134521484375, -3.91461181640625, -3.6947021484375, -3.47479248046875, -3.2548828125, -3.03497314453125, -2.8150634765625, -2.59515380859375, -2.375244140625, -2.15533447265625, -1.9354248046875, -1.71551513671875, -1.49560546875, -1.27569580078125, -1.0557861328125, -0.83587646484375, -0.615966796875, -0.39605712890625, -0.1761474609375, 0.04376220703125, 0.263671875, 0.48358154296875, 0.7034912109375, 0.92340087890625, 1.143310546875, 1.36322021484375, 1.5831298828125, 1.80303955078125, 2.02294921875, 2.24285888671875, 2.4627685546875, 2.68267822265625, 2.902587890625, 3.12249755859375, 3.3424072265625, 3.56231689453125, 3.7822265625, 4.00213623046875, 4.2220458984375, 4.44195556640625, 4.661865234375, 4.88177490234375, 5.1016845703125, 5.32159423828125, 5.54150390625, 5.76141357421875, 5.9813232421875, 6.20123291015625, 6.421142578125, 6.64105224609375, 6.8609619140625, 7.08087158203125, 7.30078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 15.0, 15.0, 20.0, 17.0, 16.0, 26.0, 24.0, 27.0, 27.0, 32.0, 30.0, 57.0, 52.0, 50.0, 39.0, 1079.0, 52.0, 44.0, 32.0, 39.0, 37.0, 47.0, 22.0, 28.0, 26.0, 27.0, 20.0, 18.0, 21.0, 17.0, 8.0, 7.0, 5.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.4443359375, -36.138671875, -34.8330078125, -33.52734375, -32.2216796875, -30.916015625, -29.6103515625, -28.3046875, -26.9990234375, -25.693359375, -24.3876953125, -23.08203125, -21.7763671875, -20.470703125, -19.1650390625, -17.859375, -16.5537109375, -15.248046875, -13.9423828125, -12.63671875, -11.3310546875, -10.025390625, -8.7197265625, -7.4140625, -6.1083984375, -4.802734375, -3.4970703125, -2.19140625, -0.8857421875, 0.419921875, 1.7255859375, 3.03125, 4.3369140625, 5.642578125, 6.9482421875, 8.25390625, 9.5595703125, 10.865234375, 12.1708984375, 13.4765625, 14.7822265625, 16.087890625, 17.3935546875, 18.69921875, 20.0048828125, 21.310546875, 22.6162109375, 23.921875, 25.2275390625, 26.533203125, 27.8388671875, 29.14453125, 30.4501953125, 31.755859375, 33.0615234375, 34.3671875, 35.6728515625, 36.978515625, 38.2841796875, 39.58984375, 40.8955078125, 42.201171875, 43.5068359375, 44.8125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 6.0, 5.0, 9.0, 23.0, 52.0, 42.0, 58.0, 100.0, 121.0, 211.0, 288.0, 430.0, 576.0, 842.0, 1238.0, 1806.0, 2688.0, 3880.0, 5711.0, 8710.0, 12860.0, 20017.0, 31006.0, 48289.0, 81736.0, 150304.0, 1291970.0, 180584.0, 96526.0, 55521.0, 34871.0, 22244.0, 14539.0, 9595.0, 6478.0, 4317.0, 2899.0, 1983.0, 1374.0, 1008.0, 696.0, 480.0, 306.0, 217.0, 175.0, 120.0, 72.0, 50.0, 32.0, 19.0, 15.0, 21.0, 10.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.29296875, -6.08758544921875, -5.8822021484375, -5.67681884765625, -5.471435546875, -5.26605224609375, -5.0606689453125, -4.85528564453125, -4.64990234375, -4.44451904296875, -4.2391357421875, -4.03375244140625, -3.828369140625, -3.62298583984375, -3.4176025390625, -3.21221923828125, -3.0068359375, -2.80145263671875, -2.5960693359375, -2.39068603515625, -2.185302734375, -1.97991943359375, -1.7745361328125, -1.56915283203125, -1.36376953125, -1.15838623046875, -0.9530029296875, -0.74761962890625, -0.542236328125, -0.33685302734375, -0.1314697265625, 0.07391357421875, 0.279296875, 0.48468017578125, 0.6900634765625, 0.89544677734375, 1.100830078125, 1.30621337890625, 1.5115966796875, 1.71697998046875, 1.92236328125, 2.12774658203125, 2.3331298828125, 2.53851318359375, 2.743896484375, 2.94927978515625, 3.1546630859375, 3.36004638671875, 3.5654296875, 3.77081298828125, 3.9761962890625, 4.18157958984375, 4.386962890625, 4.59234619140625, 4.7977294921875, 5.00311279296875, 5.20849609375, 5.41387939453125, 5.6192626953125, 5.82464599609375, 6.030029296875, 6.23541259765625, 6.4407958984375, 6.64617919921875, 6.8515625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 6.0, 4.0, 10.0, 6.0, 17.0, 7.0, 15.0, 19.0, 24.0, 33.0, 34.0, 40.0, 70.0, 75.0, 84.0, 93.0, 91.0, 75.0, 61.0, 46.0, 36.0, 33.0, 24.0, 18.0, 17.0, 14.0, 8.0, 8.0, 10.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.027679443359375, -0.02662801742553711, -0.02557659149169922, -0.024525165557861328, -0.023473739624023438, -0.022422313690185547, -0.021370887756347656, -0.020319461822509766, -0.019268035888671875, -0.018216609954833984, -0.017165184020996094, -0.016113758087158203, -0.015062332153320312, -0.014010906219482422, -0.012959480285644531, -0.01190805435180664, -0.01085662841796875, -0.00980520248413086, -0.008753776550292969, -0.007702350616455078, -0.0066509246826171875, -0.005599498748779297, -0.004548072814941406, -0.0034966468811035156, -0.002445220947265625, -0.0013937950134277344, -0.00034236907958984375, 0.0007090568542480469, 0.0017604827880859375, 0.002811908721923828, 0.0038633346557617188, 0.004914760589599609, 0.0059661865234375, 0.007017612457275391, 0.008069038391113281, 0.009120464324951172, 0.010171890258789062, 0.011223316192626953, 0.012274742126464844, 0.013326168060302734, 0.014377593994140625, 0.015429019927978516, 0.016480445861816406, 0.017531871795654297, 0.018583297729492188, 0.019634723663330078, 0.02068614959716797, 0.02173757553100586, 0.02278900146484375, 0.02384042739868164, 0.02489185333251953, 0.025943279266357422, 0.026994705200195312, 0.028046131134033203, 0.029097557067871094, 0.030148983001708984, 0.031200408935546875, 0.032251834869384766, 0.033303260803222656, 0.03435468673706055, 0.03540611267089844, 0.03645753860473633, 0.03750896453857422, 0.03856039047241211, 0.03961181640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 10.0, 18.0, 21.0, 22.0, 49.0, 61.0, 78.0, 129.0, 204.0, 341.0, 602.0, 1261.0, 3811.0, 16075.0, 104197.0, 616194.0, 260882.0, 33900.0, 6635.0, 2028.0, 835.0, 396.0, 264.0, 144.0, 111.0, 74.0, 52.0, 37.0, 25.0, 11.0, 18.0, 14.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.277099609375, -0.26955223083496094, -0.2620048522949219, -0.2544574737548828, -0.24691009521484375, -0.2393627166748047, -0.23181533813476562, -0.22426795959472656, -0.2167205810546875, -0.20917320251464844, -0.20162582397460938, -0.1940784454345703, -0.18653106689453125, -0.1789836883544922, -0.17143630981445312, -0.16388893127441406, -0.156341552734375, -0.14879417419433594, -0.14124679565429688, -0.1336994171142578, -0.12615203857421875, -0.11860466003417969, -0.11105728149414062, -0.10350990295410156, -0.0959625244140625, -0.08841514587402344, -0.08086776733398438, -0.07332038879394531, -0.06577301025390625, -0.05822563171386719, -0.050678253173828125, -0.04313087463378906, -0.03558349609375, -0.028036117553710938, -0.020488739013671875, -0.012941360473632812, -0.00539398193359375, 0.0021533966064453125, 0.009700775146484375, 0.017248153686523438, 0.0247955322265625, 0.03234291076660156, 0.039890289306640625, 0.04743766784667969, 0.05498504638671875, 0.06253242492675781, 0.07007980346679688, 0.07762718200683594, 0.085174560546875, 0.09272193908691406, 0.10026931762695312, 0.10781669616699219, 0.11536407470703125, 0.12291145324707031, 0.13045883178710938, 0.13800621032714844, 0.1455535888671875, 0.15310096740722656, 0.16064834594726562, 0.1681957244873047, 0.17574310302734375, 0.1832904815673828, 0.19083786010742188, 0.19838523864746094, 0.2059326171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 16.0, 39.0, 58.0, 141.0, 178.0, 189.0, 155.0, 102.0, 62.0, 29.0, 13.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07190457731485367, -0.07035074383020401, -0.06879691034555435, -0.0672430694103241, -0.06568923592567444, -0.06413540244102478, -0.06258156895637512, -0.061027731746435165, -0.05947389826178551, -0.05792006477713585, -0.05636622756719589, -0.054812394082546234, -0.05325855687260628, -0.05170472338795662, -0.05015088617801666, -0.048597052693367004, -0.047043219208717346, -0.04548938572406769, -0.04393554851412773, -0.04238171502947807, -0.040827877819538116, -0.03927404433488846, -0.0377202108502388, -0.03616637364029884, -0.03461253643035889, -0.03305870294570923, -0.03150486573576927, -0.029951032251119614, -0.028397196903824806, -0.02684336155653, -0.02528952620923519, -0.023735690861940384, -0.022181859239935875, -0.020628023892641068, -0.01907418854534626, -0.017520353198051453, -0.015966519713401794, -0.014412684366106987, -0.01285884901881218, -0.011305014602839947, -0.00975117925554514, -0.008197343908250332, -0.006643509492278099, -0.005089674144983292, -0.0035358392633497715, -0.0019820043817162514, -0.00042816903442144394, 0.0011256653815507889, 0.0026795007288455963, 0.0042333356104791164, 0.0057871704921126366, 0.007341005839407444, 0.008894840255379677, 0.010448675602674484, 0.012002510949969292, 0.013556345365941525, 0.015110180713236332, 0.016664015129208565, 0.018217850476503372, 0.01977168582379818, 0.021325521171092987, 0.022879354655742645, 0.024433191865682602, 0.02598702535033226, 0.027540860697627068]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 13.0, 5.0, 9.0, 14.0, 7.0, 17.0, 12.0, 14.0, 24.0, 31.0, 21.0, 30.0, 34.0, 34.0, 34.0, 35.0, 40.0, 36.0, 43.0, 41.0, 44.0, 47.0, 39.0, 42.0, 46.0, 28.0, 25.0, 33.0, 27.0, 13.0, 26.0, 13.0, 20.0, 19.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013593435287475586, -0.013115603476762772, -0.012637771666049957, -0.012159939855337143, -0.011682108044624329, -0.011204276233911514, -0.0107264444231987, -0.010248612612485886, -0.009770780801773071, -0.009292948991060257, -0.008815117180347443, -0.008337285369634628, -0.007859453558921814, -0.007381621748209, -0.006903789937496185, -0.006425958126783371, -0.005948126316070557, -0.005470294505357742, -0.004992462694644928, -0.004514630883932114, -0.004036799073219299, -0.003558967262506485, -0.0030811354517936707, -0.0026033036410808563, -0.002125471830368042, -0.0016476400196552277, -0.0011698082089424133, -0.000691976398229599, -0.00021414458751678467, 0.00026368722319602966, 0.000741519033908844, 0.0012193508446216583, 0.0016971826553344727, 0.002175014466047287, 0.0026528462767601013, 0.0031306780874729156, 0.00360850989818573, 0.004086341708898544, 0.004564173519611359, 0.005042005330324173, 0.005519837141036987, 0.005997668951749802, 0.006475500762462616, 0.00695333257317543, 0.007431164383888245, 0.007908996194601059, 0.008386828005313873, 0.008864659816026688, 0.009342491626739502, 0.009820323437452316, 0.01029815524816513, 0.010775987058877945, 0.01125381886959076, 0.011731650680303574, 0.012209482491016388, 0.012687314301729202, 0.013165146112442017, 0.013642977923154831, 0.014120809733867645, 0.01459864154458046, 0.015076473355293274, 0.015554305166006088, 0.016032136976718903, 0.016509968787431717, 0.01698780059814453]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 8.0, 8.0, 13.0, 12.0, 17.0, 30.0, 23.0, 30.0, 48.0, 38.0, 36.0, 35.0, 47.0, 45.0, 39.0, 43.0, 53.0, 49.0, 48.0, 37.0, 42.0, 34.0, 35.0, 35.0, 27.0, 22.0, 26.0, 24.0, 16.0, 8.0, 11.0, 7.0, 10.0, 8.0, 2.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-81.6875, -79.5830078125, -77.478515625, -75.3740234375, -73.26953125, -71.1650390625, -69.060546875, -66.9560546875, -64.8515625, -62.7470703125, -60.642578125, -58.5380859375, -56.43359375, -54.3291015625, -52.224609375, -50.1201171875, -48.015625, -45.9111328125, -43.806640625, -41.7021484375, -39.59765625, -37.4931640625, -35.388671875, -33.2841796875, -31.1796875, -29.0751953125, -26.970703125, -24.8662109375, -22.76171875, -20.6572265625, -18.552734375, -16.4482421875, -14.34375, -12.2392578125, -10.134765625, -8.0302734375, -5.92578125, -3.8212890625, -1.716796875, 0.3876953125, 2.4921875, 4.5966796875, 6.701171875, 8.8056640625, 10.91015625, 13.0146484375, 15.119140625, 17.2236328125, 19.328125, 21.4326171875, 23.537109375, 25.6416015625, 27.74609375, 29.8505859375, 31.955078125, 34.0595703125, 36.1640625, 38.2685546875, 40.373046875, 42.4775390625, 44.58203125, 46.6865234375, 48.791015625, 50.8955078125, 53.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 8.0, 16.0, 15.0, 18.0, 26.0, 24.0, 32.0, 56.0, 79.0, 100.0, 186.0, 225.0, 422.0, 720.0, 1158.0, 2120.0, 4237.0, 9434.0, 27848.0, 118959.0, 544028.0, 260591.0, 50619.0, 14899.0, 5843.0, 2890.0, 1574.0, 854.0, 522.0, 336.0, 232.0, 118.0, 81.0, 63.0, 51.0, 35.0, 30.0, 27.0, 17.0, 4.0, 5.0, 8.0, 5.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.03125, -15.555908203125, -15.08056640625, -14.605224609375, -14.1298828125, -13.654541015625, -13.17919921875, -12.703857421875, -12.228515625, -11.753173828125, -11.27783203125, -10.802490234375, -10.3271484375, -9.851806640625, -9.37646484375, -8.901123046875, -8.42578125, -7.950439453125, -7.47509765625, -6.999755859375, -6.5244140625, -6.049072265625, -5.57373046875, -5.098388671875, -4.623046875, -4.147705078125, -3.67236328125, -3.197021484375, -2.7216796875, -2.246337890625, -1.77099609375, -1.295654296875, -0.8203125, -0.344970703125, 0.13037109375, 0.605712890625, 1.0810546875, 1.556396484375, 2.03173828125, 2.507080078125, 2.982421875, 3.457763671875, 3.93310546875, 4.408447265625, 4.8837890625, 5.359130859375, 5.83447265625, 6.309814453125, 6.78515625, 7.260498046875, 7.73583984375, 8.211181640625, 8.6865234375, 9.161865234375, 9.63720703125, 10.112548828125, 10.587890625, 11.063232421875, 11.53857421875, 12.013916015625, 12.4892578125, 12.964599609375, 13.43994140625, 13.915283203125, 14.390625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 15.0, 23.0, 43.0, 48.0, 97.0, 115.0, 147.0, 2148.0, 125.0, 98.0, 84.0, 47.0, 31.0, 15.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.0, -229.861328125, -222.72265625, -215.583984375, -208.4453125, -201.306640625, -194.16796875, -187.029296875, -179.890625, -172.751953125, -165.61328125, -158.474609375, -151.3359375, -144.197265625, -137.05859375, -129.919921875, -122.78125, -115.642578125, -108.50390625, -101.365234375, -94.2265625, -87.087890625, -79.94921875, -72.810546875, -65.671875, -58.533203125, -51.39453125, -44.255859375, -37.1171875, -29.978515625, -22.83984375, -15.701171875, -8.5625, -1.423828125, 5.71484375, 12.853515625, 19.9921875, 27.130859375, 34.26953125, 41.408203125, 48.546875, 55.685546875, 62.82421875, 69.962890625, 77.1015625, 84.240234375, 91.37890625, 98.517578125, 105.65625, 112.794921875, 119.93359375, 127.072265625, 134.2109375, 141.349609375, 148.48828125, 155.626953125, 162.765625, 169.904296875, 177.04296875, 184.181640625, 191.3203125, 198.458984375, 205.59765625, 212.736328125, 219.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 16.0, 16.0, 21.0, 48.0, 113.0, 199.0, 387.0, 922.0, 2918.0, 37296.0, 3060608.0, 38402.0, 2942.0, 947.0, 381.0, 209.0, 113.0, 43.0, 29.0, 27.0, 14.0, 7.0, 1.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.6875, -41.33251953125, -39.9775390625, -38.62255859375, -37.267578125, -35.91259765625, -34.5576171875, -33.20263671875, -31.84765625, -30.49267578125, -29.1376953125, -27.78271484375, -26.427734375, -25.07275390625, -23.7177734375, -22.36279296875, -21.0078125, -19.65283203125, -18.2978515625, -16.94287109375, -15.587890625, -14.23291015625, -12.8779296875, -11.52294921875, -10.16796875, -8.81298828125, -7.4580078125, -6.10302734375, -4.748046875, -3.39306640625, -2.0380859375, -0.68310546875, 0.671875, 2.02685546875, 3.3818359375, 4.73681640625, 6.091796875, 7.44677734375, 8.8017578125, 10.15673828125, 11.51171875, 12.86669921875, 14.2216796875, 15.57666015625, 16.931640625, 18.28662109375, 19.6416015625, 20.99658203125, 22.3515625, 23.70654296875, 25.0615234375, 26.41650390625, 27.771484375, 29.12646484375, 30.4814453125, 31.83642578125, 33.19140625, 34.54638671875, 35.9013671875, 37.25634765625, 38.611328125, 39.96630859375, 41.3212890625, 42.67626953125, 44.03125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 4.0, 7.0, 17.0, 46.0, 88.0, 193.0, 283.0, 213.0, 83.0, 29.0, 13.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.46654510498047, -94.00914001464844, -86.5517349243164, -79.09432983398438, -71.63692474365234, -64.17951965332031, -56.72211837768555, -49.264713287353516, -41.807308197021484, -34.34990310668945, -26.892498016357422, -19.435094833374023, -11.977689743041992, -4.520286560058594, 2.9371185302734375, 10.394523620605469, 17.8519287109375, 25.30933380126953, 32.76673889160156, 40.224143981933594, 47.681549072265625, 55.13895034790039, 62.59635543823242, 70.05375671386719, 77.51116943359375, 84.96857452392578, 92.42597961425781, 99.88338470458984, 107.34078979492188, 114.79818725585938, 122.25559997558594, 129.71299743652344, 137.17039489746094, 144.62779235839844, 152.085205078125, 159.5426025390625, 167.00001525878906, 174.45741271972656, 181.91482543945312, 189.37222290039062, 196.8296356201172, 204.2870330810547, 211.74444580078125, 219.20184326171875, 226.6592559814453, 234.1166534423828, 241.57406616210938, 249.03146362304688, 256.4888610839844, 263.9462585449219, 271.4036560058594, 278.861083984375, 286.3184814453125, 293.77587890625, 301.2332763671875, 308.6907043457031, 316.1481018066406, 323.6054992675781, 331.0628967285156, 338.52032470703125, 345.97772216796875, 353.43511962890625, 360.89251708984375, 368.3499450683594, 375.8073425292969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 11.0, 8.0, 16.0, 12.0, 21.0, 17.0, 22.0, 26.0, 31.0, 25.0, 24.0, 43.0, 29.0, 38.0, 47.0, 42.0, 38.0, 46.0, 55.0, 39.0, 38.0, 42.0, 21.0, 35.0, 35.0, 31.0, 33.0, 27.0, 16.0, 21.0, 13.0, 18.0, 17.0, 15.0, 8.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.51020812988281, -104.12420654296875, -100.73821258544922, -97.35221099853516, -93.9662094116211, -90.58021545410156, -87.1942138671875, -83.80821228027344, -80.4222183227539, -77.03621673583984, -73.65022277832031, -70.26422119140625, -66.87821960449219, -63.492225646972656, -60.106224060058594, -56.7202262878418, -53.334224700927734, -49.94822692871094, -46.562225341796875, -43.17622756958008, -39.79022979736328, -36.40422821044922, -33.01823043823242, -29.632232666015625, -26.246232986450195, -22.860233306884766, -19.47423553466797, -16.08823585510254, -12.702237129211426, -9.316238403320312, -5.930238723754883, -2.544240951538086, 0.8417587280273438, 4.227757453918457, 7.6137566566467285, 10.999755859375, 14.385754585266113, 17.771753311157227, 21.157752990722656, 24.543750762939453, 27.929750442504883, 31.315750122070312, 34.70174789428711, 38.087745666503906, 41.47374725341797, 44.859745025634766, 48.24574279785156, 51.631744384765625, 55.01774215698242, 58.40373992919922, 61.78974151611328, 65.17573547363281, 68.56173706054688, 71.94773864746094, 75.333740234375, 78.71973419189453, 82.1057357788086, 85.49173736572266, 88.87773132324219, 92.26373291015625, 95.64973449707031, 99.03572845458984, 102.4217300415039, 105.80772399902344, 109.1937255859375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 15.0, 33.0, 57.0, 78.0, 125.0, 206.0, 278.0, 379.0, 613.0, 953.0, 1889.0, 1040796.0, 1104.0, 625.0, 434.0, 310.0, 229.0, 165.0, 105.0, 63.0, 46.0, 18.0, 16.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-71.52371215820312, -69.69764709472656, -67.87158966064453, -66.0455322265625, -64.21946716308594, -62.39340591430664, -60.567344665527344, -58.74128341674805, -56.91522216796875, -55.08916091918945, -53.263099670410156, -51.43703842163086, -49.61097717285156, -47.784915924072266, -45.95885467529297, -44.13279342651367, -42.306732177734375, -40.48067092895508, -38.65460968017578, -36.828548431396484, -35.00248718261719, -33.17642593383789, -31.350364685058594, -29.524303436279297, -27.6982421875, -25.872180938720703, -24.046119689941406, -22.22005844116211, -20.393997192382812, -18.567935943603516, -16.74187469482422, -14.915813446044922, -13.089752197265625, -11.263690948486328, -9.437629699707031, -7.611568450927734, -5.7855072021484375, -3.9594459533691406, -2.1333847045898438, -0.3073234558105469, 1.51873779296875, 3.344799041748047, 5.170860290527344, 6.996921539306641, 8.822982788085938, 10.649044036865234, 12.475105285644531, 14.301166534423828, 16.127227783203125, 17.953289031982422, 19.77935028076172, 21.605411529541016, 23.431472778320312, 25.25753402709961, 27.083595275878906, 28.909656524658203, 30.7357177734375, 32.5617790222168, 34.387840270996094, 36.21390151977539, 38.03996276855469, 39.866024017333984, 41.69208526611328, 43.51814651489258, 45.344207763671875]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 6.0, 6.0, 11.0, 9.0, 20.0, 47.0, 135.0, 44084.0, 51419584.0, 106.0, 45.0, 32.0, 11.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3738.0, -3582.353759765625, -3426.70751953125, -3271.061279296875, -3115.4150390625, -2959.768798828125, -2804.12255859375, -2648.4765625, -2492.830078125, -2337.183837890625, -2181.53759765625, -2025.891357421875, -1870.2451171875, -1714.598876953125, -1558.9527587890625, -1403.3065185546875, -1247.660400390625, -1092.01416015625, -936.367919921875, -780.7217407226562, -625.0755004882812, -469.42926025390625, -313.7830810546875, -158.1368408203125, -2.4906005859375, 153.15562438964844, 308.8018493652344, 464.44805908203125, 620.0942993164062, 775.7405395507812, 931.38671875, 1087.032958984375, 1242.67919921875, 1398.325439453125, 1553.9716796875, 1709.617919921875, 1865.26416015625, 2020.910400390625, 2176.556640625, 2332.20263671875, 2487.84912109375, 2643.495361328125, 2799.1416015625, 2954.787841796875, 3110.43408203125, 3266.080322265625, 3421.7265625, 3577.37255859375, 3733.018798828125, 3888.6650390625, 4044.311279296875, 4199.95751953125, 4355.603515625, 4511.25, 4666.89599609375, 4822.54248046875, 4978.1884765625, 5133.83447265625, 5289.48095703125, 5445.126953125, 5600.7734375, 5756.41943359375, 5912.06591796875, 6067.7119140625, 6223.3583984375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 8.0, 16.0, 21.0, 24.0, 41.0, 81.0, 124.0, 151.0, 216.0, 361.0, 467.0, 720.0, 1025.0, 1452.0, 2191.0, 3210.0, 4492.0, 6664.0, 9964.0, 14955.0, 22921.0, 35894.0, 56951.0, 92879.0, 158900.0, 292016.0, 620144.0, 3797450.0, 528428.0, 260328.0, 144165.0, 85236.0, 51846.0, 32885.0, 21479.0, 13939.0, 9217.0, 6369.0, 4406.0, 2906.0, 2043.0, 1484.0, 978.0, 735.0, 565.0, 332.0, 221.0, 164.0, 125.0, 87.0, 56.0, 36.0, 21.0, 14.0, 13.0, 9.0, 10.0, 3.0, 1.0, 2.0], "bins": [-3.087890625, -2.989593505859375, -2.89129638671875, -2.792999267578125, -2.6947021484375, -2.596405029296875, -2.49810791015625, -2.399810791015625, -2.301513671875, -2.203216552734375, -2.10491943359375, -2.006622314453125, -1.9083251953125, -1.810028076171875, -1.71173095703125, -1.613433837890625, -1.51513671875, -1.416839599609375, -1.31854248046875, -1.220245361328125, -1.1219482421875, -1.023651123046875, -0.92535400390625, -0.827056884765625, -0.728759765625, -0.630462646484375, -0.53216552734375, -0.433868408203125, -0.3355712890625, -0.237274169921875, -0.13897705078125, -0.040679931640625, 0.0576171875, 0.155914306640625, 0.25421142578125, 0.352508544921875, 0.4508056640625, 0.549102783203125, 0.64739990234375, 0.745697021484375, 0.843994140625, 0.942291259765625, 1.04058837890625, 1.138885498046875, 1.2371826171875, 1.335479736328125, 1.43377685546875, 1.532073974609375, 1.63037109375, 1.728668212890625, 1.82696533203125, 1.925262451171875, 2.0235595703125, 2.121856689453125, 2.22015380859375, 2.318450927734375, 2.416748046875, 2.515045166015625, 2.61334228515625, 2.711639404296875, 2.8099365234375, 2.908233642578125, 3.00653076171875, 3.104827880859375, 3.203125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 14.0, 15.0, 4.0, 18.0, 24.0, 18.0, 29.0, 29.0, 26.0, 32.0, 26.0, 29.0, 33.0, 34.0, 54.0, 88.0, 377.0, 637.0, 84.0, 28.0, 40.0, 44.0, 33.0, 33.0, 38.0, 19.0, 22.0, 32.0, 20.0, 16.0, 15.0, 11.0, 16.0, 16.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0], "bins": [-15.171875, -14.774658203125, -14.37744140625, -13.980224609375, -13.5830078125, -13.185791015625, -12.78857421875, -12.391357421875, -11.994140625, -11.596923828125, -11.19970703125, -10.802490234375, -10.4052734375, -10.008056640625, -9.61083984375, -9.213623046875, -8.81640625, -8.419189453125, -8.02197265625, -7.624755859375, -7.2275390625, -6.830322265625, -6.43310546875, -6.035888671875, -5.638671875, -5.241455078125, -4.84423828125, -4.447021484375, -4.0498046875, -3.652587890625, -3.25537109375, -2.858154296875, -2.4609375, -2.063720703125, -1.66650390625, -1.269287109375, -0.8720703125, -0.474853515625, -0.07763671875, 0.319580078125, 0.716796875, 1.114013671875, 1.51123046875, 1.908447265625, 2.3056640625, 2.702880859375, 3.10009765625, 3.497314453125, 3.89453125, 4.291748046875, 4.68896484375, 5.086181640625, 5.4833984375, 5.880615234375, 6.27783203125, 6.675048828125, 7.072265625, 7.469482421875, 7.86669921875, 8.263916015625, 8.6611328125, 9.058349609375, 9.45556640625, 9.852783203125, 10.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 14.0, 5.0, 8.0, 9.0, 9.0, 25.0, 40.0, 62.0, 63.0, 110.0, 146.0, 242.0, 359.0, 566.0, 880.0, 1373.0, 2292.0, 3680.0, 6089.0, 10063.0, 17544.0, 30879.0, 55932.0, 106812.0, 214971.0, 503150.0, 4047304.0, 733867.0, 269354.0, 130454.0, 67825.0, 36782.0, 20477.0, 11741.0, 7091.0, 4230.0, 2497.0, 1599.0, 1090.0, 636.0, 414.0, 275.0, 159.0, 110.0, 78.0, 39.0, 29.0, 36.0, 12.0, 8.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0], "bins": [-5.30078125, -5.14324951171875, -4.9857177734375, -4.82818603515625, -4.670654296875, -4.51312255859375, -4.3555908203125, -4.19805908203125, -4.04052734375, -3.88299560546875, -3.7254638671875, -3.56793212890625, -3.410400390625, -3.25286865234375, -3.0953369140625, -2.93780517578125, -2.7802734375, -2.62274169921875, -2.4652099609375, -2.30767822265625, -2.150146484375, -1.99261474609375, -1.8350830078125, -1.67755126953125, -1.52001953125, -1.36248779296875, -1.2049560546875, -1.04742431640625, -0.889892578125, -0.73236083984375, -0.5748291015625, -0.41729736328125, -0.259765625, -0.10223388671875, 0.0552978515625, 0.21282958984375, 0.370361328125, 0.52789306640625, 0.6854248046875, 0.84295654296875, 1.00048828125, 1.15802001953125, 1.3155517578125, 1.47308349609375, 1.630615234375, 1.78814697265625, 1.9456787109375, 2.10321044921875, 2.2607421875, 2.41827392578125, 2.5758056640625, 2.73333740234375, 2.890869140625, 3.04840087890625, 3.2059326171875, 3.36346435546875, 3.52099609375, 3.67852783203125, 3.8360595703125, 3.99359130859375, 4.151123046875, 4.30865478515625, 4.4661865234375, 4.62371826171875, 4.78125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 12.0, 13.0, 11.0, 10.0, 16.0, 16.0, 20.0, 31.0, 19.0, 23.0, 41.0, 44.0, 38.0, 48.0, 55.0, 83.0, 286.0, 674.0, 109.0, 47.0, 52.0, 46.0, 33.0, 37.0, 33.0, 38.0, 30.0, 21.0, 24.0, 17.0, 17.0, 16.0, 5.0, 16.0, 4.0, 7.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.578125, -8.2965087890625, -8.014892578125, -7.7332763671875, -7.45166015625, -7.1700439453125, -6.888427734375, -6.6068115234375, -6.3251953125, -6.0435791015625, -5.761962890625, -5.4803466796875, -5.19873046875, -4.9171142578125, -4.635498046875, -4.3538818359375, -4.072265625, -3.7906494140625, -3.509033203125, -3.2274169921875, -2.94580078125, -2.6641845703125, -2.382568359375, -2.1009521484375, -1.8193359375, -1.5377197265625, -1.256103515625, -0.9744873046875, -0.69287109375, -0.4112548828125, -0.129638671875, 0.1519775390625, 0.43359375, 0.7152099609375, 0.996826171875, 1.2784423828125, 1.56005859375, 1.8416748046875, 2.123291015625, 2.4049072265625, 2.6865234375, 2.9681396484375, 3.249755859375, 3.5313720703125, 3.81298828125, 4.0946044921875, 4.376220703125, 4.6578369140625, 4.939453125, 5.2210693359375, 5.502685546875, 5.7843017578125, 6.06591796875, 6.3475341796875, 6.629150390625, 6.9107666015625, 7.1923828125, 7.4739990234375, 7.755615234375, 8.0372314453125, 8.31884765625, 8.6004638671875, 8.882080078125, 9.1636962890625, 9.4453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 10.0, 8.0, 11.0, 20.0, 26.0, 20.0, 21.0, 48.0, 52.0, 68.0, 92.0, 82.0, 151.0, 191.0, 218.0, 275.0, 419.0, 542.0, 709.0, 952.0, 1341.0, 2153.0, 3316.0, 5494.0, 10757.0, 22427.0, 62965.0, 2998295.0, 3066450.0, 63480.0, 23367.0, 10816.0, 5686.0, 3423.0, 2183.0, 1364.0, 984.0, 718.0, 603.0, 398.0, 272.0, 225.0, 177.0, 136.0, 113.0, 88.0, 72.0, 47.0, 44.0, 38.0, 33.0, 14.0, 11.0, 13.0, 15.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-13.546875, -13.12353515625, -12.7001953125, -12.27685546875, -11.853515625, -11.43017578125, -11.0068359375, -10.58349609375, -10.16015625, -9.73681640625, -9.3134765625, -8.89013671875, -8.466796875, -8.04345703125, -7.6201171875, -7.19677734375, -6.7734375, -6.35009765625, -5.9267578125, -5.50341796875, -5.080078125, -4.65673828125, -4.2333984375, -3.81005859375, -3.38671875, -2.96337890625, -2.5400390625, -2.11669921875, -1.693359375, -1.27001953125, -0.8466796875, -0.42333984375, 0.0, 0.42333984375, 0.8466796875, 1.27001953125, 1.693359375, 2.11669921875, 2.5400390625, 2.96337890625, 3.38671875, 3.81005859375, 4.2333984375, 4.65673828125, 5.080078125, 5.50341796875, 5.9267578125, 6.35009765625, 6.7734375, 7.19677734375, 7.6201171875, 8.04345703125, 8.466796875, 8.89013671875, 9.3134765625, 9.73681640625, 10.16015625, 10.58349609375, 11.0068359375, 11.43017578125, 11.853515625, 12.27685546875, 12.7001953125, 13.12353515625, 13.546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 10.0, 7.0, 13.0, 13.0, 15.0, 13.0, 14.0, 24.0, 22.0, 21.0, 22.0, 25.0, 22.0, 33.0, 37.0, 46.0, 78.0, 116.0, 243.0, 506.0, 177.0, 91.0, 71.0, 47.0, 36.0, 48.0, 41.0, 25.0, 23.0, 24.0, 20.0, 17.0, 17.0, 13.0, 11.0, 16.0, 8.0, 6.0, 8.0, 6.0, 6.0, 8.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.40625, -6.22637939453125, -6.0465087890625, -5.86663818359375, -5.686767578125, -5.50689697265625, -5.3270263671875, -5.14715576171875, -4.96728515625, -4.78741455078125, -4.6075439453125, -4.42767333984375, -4.247802734375, -4.06793212890625, -3.8880615234375, -3.70819091796875, -3.5283203125, -3.34844970703125, -3.1685791015625, -2.98870849609375, -2.808837890625, -2.62896728515625, -2.4490966796875, -2.26922607421875, -2.08935546875, -1.90948486328125, -1.7296142578125, -1.54974365234375, -1.369873046875, -1.19000244140625, -1.0101318359375, -0.83026123046875, -0.650390625, -0.47052001953125, -0.2906494140625, -0.11077880859375, 0.069091796875, 0.24896240234375, 0.4288330078125, 0.60870361328125, 0.78857421875, 0.96844482421875, 1.1483154296875, 1.32818603515625, 1.508056640625, 1.68792724609375, 1.8677978515625, 2.04766845703125, 2.2275390625, 2.40740966796875, 2.5872802734375, 2.76715087890625, 2.947021484375, 3.12689208984375, 3.3067626953125, 3.48663330078125, 3.66650390625, 3.84637451171875, 4.0262451171875, 4.20611572265625, 4.385986328125, 4.56585693359375, 4.7457275390625, 4.92559814453125, 5.10546875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 4.0, 10.0, 14.0, 41.0, 106.0, 341.0, 353.0, 85.0, 31.0, 9.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.273681640625, -61.02841567993164, -59.78315353393555, -58.53788757324219, -57.292625427246094, -56.047359466552734, -54.802093505859375, -53.55683135986328, -52.31156539916992, -51.06629943847656, -49.82103729248047, -48.57577133178711, -47.33050537109375, -46.085243225097656, -44.8399772644043, -43.59471130371094, -42.349449157714844, -41.104183197021484, -39.85892105102539, -38.61365509033203, -37.36839294433594, -36.12312698364258, -34.87786102294922, -33.632598876953125, -32.387332916259766, -31.14206886291504, -29.896804809570312, -28.651538848876953, -27.406274795532227, -26.1610107421875, -24.91574478149414, -23.670480728149414, -22.425214767456055, -21.179950714111328, -19.93468475341797, -18.689420700073242, -17.444156646728516, -16.19889259338379, -14.953627586364746, -13.708362579345703, -12.463098526000977, -11.21783447265625, -9.972569465637207, -8.727304458618164, -7.4820404052734375, -6.236775875091553, -4.991511344909668, -3.746246337890625, -2.5009822845458984, -1.2557177543640137, -0.010453224182128906, 1.2348113059997559, 2.4800758361816406, 3.7253403663635254, 4.97060489654541, 6.215869903564453, 7.46113395690918, 8.706398010253906, 9.95166301727295, 11.196928024291992, 12.442192077636719, 13.687456130981445, 14.932721138000488, 16.17798614501953, 17.423250198364258]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 12.0, 10.0, 11.0, 12.0, 21.0, 18.0, 29.0, 24.0, 21.0, 25.0, 23.0, 31.0, 32.0, 35.0, 39.0, 48.0, 38.0, 39.0, 45.0, 47.0, 36.0, 49.0, 38.0, 40.0, 38.0, 37.0, 27.0, 22.0, 26.0, 23.0, 14.0, 9.0, 13.0, 14.0, 11.0, 3.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.506961822509766, -8.229288101196289, -7.951613903045654, -7.673940181732178, -7.396266460418701, -7.118592262268066, -6.84091854095459, -6.563244819641113, -6.285571098327637, -6.00789737701416, -5.730223178863525, -5.452549457550049, -5.174875736236572, -4.8972015380859375, -4.619527816772461, -4.341854095458984, -4.06417989730835, -3.786505937576294, -3.5088322162628174, -3.2311582565307617, -2.953484535217285, -2.6758105754852295, -2.398136615753174, -2.1204628944396973, -1.8427889347076416, -1.5651150941848755, -1.2874412536621094, -1.0097672939300537, -0.7320934534072876, -0.4544196128845215, -0.17674565315246582, 0.10092818737030029, 0.3786020278930664, 0.6562758684158325, 0.9339497685432434, 1.2116236686706543, 1.4892975091934204, 1.7669713497161865, 2.044645309448242, 2.3223190307617188, 2.5999929904937744, 2.87766695022583, 3.1553406715393066, 3.4330146312713623, 3.710688591003418, 3.9883623123168945, 4.266036033630371, 4.543710231781006, 4.821383953094482, 5.099057674407959, 5.376731872558594, 5.65440559387207, 5.932079315185547, 6.209753036499023, 6.487427234649658, 6.765100955963135, 7.0427751541137695, 7.320448875427246, 7.598123073577881, 7.875796794891357, 8.153470993041992, 8.431144714355469, 8.708818435668945, 8.986492156982422, 9.264165878295898]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 12.0, 18.0, 23.0, 54.0, 72.0, 87.0, 165.0, 255.0, 438.0, 692.0, 1353.0, 2765.0, 6494.0, 19200.0, 119560.0, 3969088.0, 51699.0, 12588.0, 4720.0, 2175.0, 1100.0, 609.0, 374.0, 239.0, 150.0, 95.0, 67.0, 45.0, 41.0, 22.0, 15.0, 15.0, 7.0, 8.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1680908203125, -0.1602039337158203, -0.15231704711914062, -0.14443016052246094, -0.13654327392578125, -0.12865638732910156, -0.12076950073242188, -0.11288261413574219, -0.1049957275390625, -0.09710884094238281, -0.08922195434570312, -0.08133506774902344, -0.07344818115234375, -0.06556129455566406, -0.057674407958984375, -0.04978752136230469, -0.041900634765625, -0.03401374816894531, -0.026126861572265625, -0.018239974975585938, -0.01035308837890625, -0.0024662017822265625, 0.005420684814453125, 0.013307571411132812, 0.0211944580078125, 0.029081344604492188, 0.036968231201171875, 0.04485511779785156, 0.05274200439453125, 0.06062889099121094, 0.06851577758789062, 0.07640266418457031, 0.08428955078125, 0.09217643737792969, 0.10006332397460938, 0.10795021057128906, 0.11583709716796875, 0.12372398376464844, 0.13161087036132812, 0.1394977569580078, 0.1473846435546875, 0.1552715301513672, 0.16315841674804688, 0.17104530334472656, 0.17893218994140625, 0.18681907653808594, 0.19470596313476562, 0.2025928497314453, 0.210479736328125, 0.2183666229248047, 0.22625350952148438, 0.23414039611816406, 0.24202728271484375, 0.24991416931152344, 0.2578010559082031, 0.2656879425048828, 0.2735748291015625, 0.2814617156982422, 0.2893486022949219, 0.29723548889160156, 0.30512237548828125, 0.31300926208496094, 0.3208961486816406, 0.3287830352783203, 0.336669921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 13.0, 7.0, 11.0, 18.0, 24.0, 142.0, 653.0, 32.0, 18.0, 9.0, 11.0, 9.0, 13.0, 2.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281982421875, -0.026807308197021484, -0.02541637420654297, -0.024025440216064453, -0.022634506225585938, -0.021243572235107422, -0.019852638244628906, -0.01846170425415039, -0.017070770263671875, -0.01567983627319336, -0.014288902282714844, -0.012897968292236328, -0.011507034301757812, -0.010116100311279297, -0.008725166320800781, -0.007334232330322266, -0.00594329833984375, -0.004552364349365234, -0.0031614303588867188, -0.0017704963684082031, -0.0003795623779296875, 0.0010113716125488281, 0.0024023056030273438, 0.0037932395935058594, 0.005184173583984375, 0.006575107574462891, 0.007966041564941406, 0.009356975555419922, 0.010747909545898438, 0.012138843536376953, 0.013529777526855469, 0.014920711517333984, 0.0163116455078125, 0.017702579498291016, 0.01909351348876953, 0.020484447479248047, 0.021875381469726562, 0.023266315460205078, 0.024657249450683594, 0.02604818344116211, 0.027439117431640625, 0.02883005142211914, 0.030220985412597656, 0.03161191940307617, 0.03300285339355469, 0.0343937873840332, 0.03578472137451172, 0.037175655364990234, 0.03856658935546875, 0.039957523345947266, 0.04134845733642578, 0.0427393913269043, 0.04413032531738281, 0.04552125930786133, 0.046912193298339844, 0.04830312728881836, 0.049694061279296875, 0.05108499526977539, 0.052475929260253906, 0.05386686325073242, 0.05525779724121094, 0.05664873123168945, 0.05803966522216797, 0.059430599212646484, 0.060821533203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 8.0, 8.0, 16.0, 30.0, 40.0, 51.0, 74.0, 111.0, 204.0, 321.0, 568.0, 885.0, 1808.0, 3456.0, 7550.0, 19259.0, 60975.0, 328875.0, 3197429.0, 467160.0, 71311.0, 20100.0, 7324.0, 3208.0, 1529.0, 753.0, 433.0, 270.0, 167.0, 114.0, 77.0, 48.0, 25.0, 24.0, 14.0, 12.0, 6.0, 6.0, 1.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16162109375, -0.1561565399169922, -0.15069198608398438, -0.14522743225097656, -0.13976287841796875, -0.13429832458496094, -0.12883377075195312, -0.12336921691894531, -0.1179046630859375, -0.11244010925292969, -0.10697555541992188, -0.10151100158691406, -0.09604644775390625, -0.09058189392089844, -0.08511734008789062, -0.07965278625488281, -0.074188232421875, -0.06872367858886719, -0.06325912475585938, -0.05779457092285156, -0.05233001708984375, -0.04686546325683594, -0.041400909423828125, -0.03593635559082031, -0.0304718017578125, -0.025007247924804688, -0.019542694091796875, -0.014078140258789062, -0.00861358642578125, -0.0031490325927734375, 0.002315521240234375, 0.0077800750732421875, 0.01324462890625, 0.018709182739257812, 0.024173736572265625, 0.029638290405273438, 0.03510284423828125, 0.04056739807128906, 0.046031951904296875, 0.05149650573730469, 0.0569610595703125, 0.06242561340332031, 0.06789016723632812, 0.07335472106933594, 0.07881927490234375, 0.08428382873535156, 0.08974838256835938, 0.09521293640136719, 0.100677490234375, 0.10614204406738281, 0.11160659790039062, 0.11707115173339844, 0.12253570556640625, 0.12800025939941406, 0.13346481323242188, 0.1389293670654297, 0.1443939208984375, 0.1498584747314453, 0.15532302856445312, 0.16078758239746094, 0.16625213623046875, 0.17171669006347656, 0.17718124389648438, 0.1826457977294922, 0.1881103515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 7.0, 17.0, 22.0, 27.0, 23.0, 39.0, 46.0, 77.0, 106.0, 173.0, 269.0, 553.0, 1237.0, 605.0, 308.0, 172.0, 96.0, 81.0, 54.0, 39.0, 22.0, 13.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0699462890625, -0.0680837631225586, -0.06622123718261719, -0.06435871124267578, -0.062496185302734375, -0.06063365936279297, -0.05877113342285156, -0.056908607482910156, -0.05504608154296875, -0.053183555603027344, -0.05132102966308594, -0.04945850372314453, -0.047595977783203125, -0.04573345184326172, -0.04387092590332031, -0.042008399963378906, -0.0401458740234375, -0.038283348083496094, -0.03642082214355469, -0.03455829620361328, -0.032695770263671875, -0.03083324432373047, -0.028970718383789062, -0.027108192443847656, -0.02524566650390625, -0.023383140563964844, -0.021520614624023438, -0.01965808868408203, -0.017795562744140625, -0.01593303680419922, -0.014070510864257812, -0.012207984924316406, -0.010345458984375, -0.008482933044433594, -0.0066204071044921875, -0.004757881164550781, -0.002895355224609375, -0.0010328292846679688, 0.0008296966552734375, 0.0026922225952148438, 0.00455474853515625, 0.006417274475097656, 0.008279800415039062, 0.010142326354980469, 0.012004852294921875, 0.013867378234863281, 0.015729904174804688, 0.017592430114746094, 0.0194549560546875, 0.021317481994628906, 0.023180007934570312, 0.02504253387451172, 0.026905059814453125, 0.02876758575439453, 0.030630111694335938, 0.032492637634277344, 0.03435516357421875, 0.036217689514160156, 0.03808021545410156, 0.03994274139404297, 0.041805267333984375, 0.04366779327392578, 0.04553031921386719, 0.047392845153808594, 0.04925537109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 22.0, 44.0, 79.0, 177.0, 335.0, 214.0, 83.0, 22.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4162243604660034, -1.388873815536499, -1.361523151397705, -1.3341726064682007, -1.3068219423294067, -1.2794713973999023, -1.2521207332611084, -1.224770188331604, -1.1974196434020996, -1.1700690984725952, -1.1427184343338013, -1.1153678894042969, -1.088017225265503, -1.0606666803359985, -1.0333160161972046, -1.0059654712677002, -0.9786148071289062, -0.9512642025947571, -0.9239135980606079, -0.8965629935264587, -0.8692123889923096, -0.8418618440628052, -0.814511239528656, -0.7871606349945068, -0.7598100304603577, -0.7324594259262085, -0.7051088213920593, -0.6777582168579102, -0.6504076719284058, -0.6230570077896118, -0.5957064628601074, -0.5683558583259583, -0.5410052537918091, -0.5136546492576599, -0.48630404472351074, -0.45895346999168396, -0.4316028654575348, -0.4042522609233856, -0.37690168619155884, -0.34955108165740967, -0.3222004771232605, -0.29484987258911133, -0.26749926805496216, -0.24014869332313538, -0.2127980887889862, -0.18544748425483704, -0.15809689462184906, -0.13074630498886108, -0.10339570045471191, -0.07604510337114334, -0.04869450628757477, -0.021343909204006195, 0.006006687879562378, 0.03335729241371155, 0.060707882046699524, 0.0880584716796875, 0.11540907621383667, 0.14275968074798584, 0.17011027038097382, 0.1974608600139618, 0.22481146454811096, 0.25216206908226013, 0.2795126438140869, 0.3068632483482361, 0.33421385288238525]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 12.0, 17.0, 26.0, 37.0, 53.0, 65.0, 94.0, 93.0, 97.0, 87.0, 87.0, 96.0, 69.0, 52.0, 44.0, 24.0, 17.0, 13.0, 8.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6731529235839844, -0.6549403071403503, -0.6367277503013611, -0.618515133857727, -0.6003025770187378, -0.5820899605751038, -0.5638773441314697, -0.5456647872924805, -0.5274521708488464, -0.5092395544052124, -0.49102699756622314, -0.4728143811225891, -0.45460179448127747, -0.4363892078399658, -0.4181765913963318, -0.39996400475502014, -0.3817514181137085, -0.36353883147239685, -0.3453262448310852, -0.32711362838745117, -0.3089010417461395, -0.2906884551048279, -0.27247583866119385, -0.2542632520198822, -0.23605066537857056, -0.2178380787372589, -0.19962547719478607, -0.18141287565231323, -0.1632002890110016, -0.14498770236968994, -0.1267751008272171, -0.10856249928474426, -0.09034997224807739, -0.07213737815618515, -0.05392478406429291, -0.035712189972400665, -0.017499595880508423, 0.0007129982113838196, 0.018925592303276062, 0.0371381938457489, 0.05535078048706055, 0.07356337457895279, 0.09177596867084503, 0.10998856276273727, 0.12820115685462952, 0.14641374349594116, 0.164626345038414, 0.18283894658088684, 0.2010515332221985, 0.21926411986351013, 0.23747672140598297, 0.2556893229484558, 0.27390190958976746, 0.2921144962310791, 0.31032711267471313, 0.3285396993160248, 0.3467522859573364, 0.36496487259864807, 0.3831774592399597, 0.40139007568359375, 0.4196026623249054, 0.43781524896621704, 0.4560278654098511, 0.4742404520511627, 0.49245303869247437]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 15.0, 11.0, 24.0, 33.0, 46.0, 59.0, 79.0, 120.0, 149.0, 247.0, 331.0, 445.0, 692.0, 1112.0, 1759.0, 3012.0, 5617.0, 11806.0, 29152.0, 277329.0, 645881.0, 40313.0, 14369.0, 6726.0, 3555.0, 1962.0, 1197.0, 777.0, 508.0, 351.0, 224.0, 196.0, 120.0, 90.0, 71.0, 48.0, 35.0, 18.0, 23.0, 8.0, 11.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2139892578125, -0.2077178955078125, -0.201446533203125, -0.1951751708984375, -0.18890380859375, -0.1826324462890625, -0.176361083984375, -0.1700897216796875, -0.163818359375, -0.1575469970703125, -0.151275634765625, -0.1450042724609375, -0.13873291015625, -0.1324615478515625, -0.126190185546875, -0.1199188232421875, -0.1136474609375, -0.1073760986328125, -0.101104736328125, -0.0948333740234375, -0.08856201171875, -0.0822906494140625, -0.076019287109375, -0.0697479248046875, -0.0634765625, -0.0572052001953125, -0.050933837890625, -0.0446624755859375, -0.03839111328125, -0.0321197509765625, -0.025848388671875, -0.0195770263671875, -0.0133056640625, -0.0070343017578125, -0.000762939453125, 0.0055084228515625, 0.01177978515625, 0.0180511474609375, 0.024322509765625, 0.0305938720703125, 0.036865234375, 0.0431365966796875, 0.049407958984375, 0.0556793212890625, 0.06195068359375, 0.0682220458984375, 0.074493408203125, 0.0807647705078125, 0.0870361328125, 0.0933074951171875, 0.099578857421875, 0.1058502197265625, 0.11212158203125, 0.1183929443359375, 0.124664306640625, 0.1309356689453125, 0.13720703125, 0.1434783935546875, 0.149749755859375, 0.1560211181640625, 0.16229248046875, 0.1685638427734375, 0.174835205078125, 0.1811065673828125, 0.1873779296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 15.0, 8.0, 9.0, 13.0, 33.0, 80.0, 204.0, 288.0, 185.0, 76.0, 12.0, 12.0, 8.0, 9.0, 10.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03900146484375, -0.03779792785644531, -0.036594390869140625, -0.03539085388183594, -0.03418731689453125, -0.03298377990722656, -0.031780242919921875, -0.030576705932617188, -0.0293731689453125, -0.028169631958007812, -0.026966094970703125, -0.025762557983398438, -0.02455902099609375, -0.023355484008789062, -0.022151947021484375, -0.020948410034179688, -0.019744873046875, -0.018541336059570312, -0.017337799072265625, -0.016134262084960938, -0.01493072509765625, -0.013727188110351562, -0.012523651123046875, -0.011320114135742188, -0.0101165771484375, -0.008913040161132812, -0.007709503173828125, -0.0065059661865234375, -0.00530242919921875, -0.0040988922119140625, -0.002895355224609375, -0.0016918182373046875, -0.00048828125, 0.0007152557373046875, 0.001918792724609375, 0.0031223297119140625, 0.00432586669921875, 0.0055294036865234375, 0.006732940673828125, 0.007936477661132812, 0.0091400146484375, 0.010343551635742188, 0.011547088623046875, 0.012750625610351562, 0.01395416259765625, 0.015157699584960938, 0.016361236572265625, 0.017564773559570312, 0.018768310546875, 0.019971847534179688, 0.021175384521484375, 0.022378921508789062, 0.02358245849609375, 0.024785995483398438, 0.025989532470703125, 0.027193069458007812, 0.0283966064453125, 0.029600143432617188, 0.030803680419921875, 0.03200721740722656, 0.03321075439453125, 0.03441429138183594, 0.035617828369140625, 0.03682136535644531, 0.03802490234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 12.0, 17.0, 27.0, 44.0, 66.0, 116.0, 287.0, 865.0, 3944.0, 38319.0, 881467.0, 113981.0, 7272.0, 1283.0, 426.0, 172.0, 87.0, 53.0, 42.0, 18.0, 9.0, 8.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483154296875, -0.4662971496582031, -0.44944000244140625, -0.4325828552246094, -0.4157257080078125, -0.3988685607910156, -0.38201141357421875, -0.3651542663574219, -0.348297119140625, -0.3314399719238281, -0.31458282470703125, -0.2977256774902344, -0.2808685302734375, -0.2640113830566406, -0.24715423583984375, -0.23029708862304688, -0.21343994140625, -0.19658279418945312, -0.17972564697265625, -0.16286849975585938, -0.1460113525390625, -0.12915420532226562, -0.11229705810546875, -0.09543991088867188, -0.078582763671875, -0.061725616455078125, -0.04486846923828125, -0.028011322021484375, -0.0111541748046875, 0.005702972412109375, 0.02256011962890625, 0.039417266845703125, 0.0562744140625, 0.07313156127929688, 0.08998870849609375, 0.10684585571289062, 0.1237030029296875, 0.14056015014648438, 0.15741729736328125, 0.17427444458007812, 0.191131591796875, 0.20798873901367188, 0.22484588623046875, 0.24170303344726562, 0.2585601806640625, 0.2754173278808594, 0.29227447509765625, 0.3091316223144531, 0.32598876953125, 0.3428459167480469, 0.35970306396484375, 0.3765602111816406, 0.3934173583984375, 0.4102745056152344, 0.42713165283203125, 0.4439888000488281, 0.460845947265625, 0.4777030944824219, 0.49456024169921875, 0.5114173889160156, 0.5282745361328125, 0.5451316833496094, 0.5619888305664062, 0.5788459777832031, 0.595703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 5.0, 13.0, 9.0, 6.0, 14.0, 15.0, 22.0, 28.0, 30.0, 27.0, 32.0, 24.0, 36.0, 36.0, 35.0, 40.0, 44.0, 48.0, 43.0, 47.0, 45.0, 45.0, 34.0, 27.0, 35.0, 41.0, 31.0, 20.0, 23.0, 21.0, 23.0, 12.0, 13.0, 19.0, 10.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.143310546875, -0.13879013061523438, -0.13426971435546875, -0.12974929809570312, -0.1252288818359375, -0.12070846557617188, -0.11618804931640625, -0.11166763305664062, -0.107147216796875, -0.10262680053710938, -0.09810638427734375, -0.09358596801757812, -0.0890655517578125, -0.08454513549804688, -0.08002471923828125, -0.07550430297851562, -0.07098388671875, -0.06646347045898438, -0.06194305419921875, -0.057422637939453125, -0.0529022216796875, -0.048381805419921875, -0.04386138916015625, -0.039340972900390625, -0.034820556640625, -0.030300140380859375, -0.02577972412109375, -0.021259307861328125, -0.0167388916015625, -0.012218475341796875, -0.00769805908203125, -0.003177642822265625, 0.0013427734375, 0.005863189697265625, 0.01038360595703125, 0.014904022216796875, 0.0194244384765625, 0.023944854736328125, 0.02846527099609375, 0.032985687255859375, 0.037506103515625, 0.042026519775390625, 0.04654693603515625, 0.051067352294921875, 0.0555877685546875, 0.060108184814453125, 0.06462860107421875, 0.06914901733398438, 0.07366943359375, 0.07818984985351562, 0.08271026611328125, 0.08723068237304688, 0.0917510986328125, 0.09627151489257812, 0.10079193115234375, 0.10531234741210938, 0.109832763671875, 0.11435317993164062, 0.11887359619140625, 0.12339401245117188, 0.1279144287109375, 0.13243484497070312, 0.13695526123046875, 0.14147567749023438, 0.14599609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 15.0, 21.0, 23.0, 17.0, 46.0, 54.0, 105.0, 185.0, 282.0, 524.0, 1138.0, 2787.0, 10020.0, 177834.0, 828231.0, 20120.0, 4044.0, 1464.0, 700.0, 361.0, 215.0, 116.0, 89.0, 41.0, 27.0, 18.0, 17.0, 10.0, 14.0, 7.0, 5.0, 4.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4850730895996094, -0.47087860107421875, -0.4566841125488281, -0.4424896240234375, -0.4282951354980469, -0.41410064697265625, -0.3999061584472656, -0.385711669921875, -0.3715171813964844, -0.35732269287109375, -0.3431282043457031, -0.3289337158203125, -0.3147392272949219, -0.30054473876953125, -0.2863502502441406, -0.27215576171875, -0.2579612731933594, -0.24376678466796875, -0.22957229614257812, -0.2153778076171875, -0.20118331909179688, -0.18698883056640625, -0.17279434204101562, -0.158599853515625, -0.14440536499023438, -0.13021087646484375, -0.11601638793945312, -0.1018218994140625, -0.08762741088867188, -0.07343292236328125, -0.059238433837890625, -0.0450439453125, -0.030849456787109375, -0.01665496826171875, -0.002460479736328125, 0.0117340087890625, 0.025928497314453125, 0.04012298583984375, 0.054317474365234375, 0.068511962890625, 0.08270645141601562, 0.09690093994140625, 0.11109542846679688, 0.1252899169921875, 0.13948440551757812, 0.15367889404296875, 0.16787338256835938, 0.18206787109375, 0.19626235961914062, 0.21045684814453125, 0.22465133666992188, 0.2388458251953125, 0.2530403137207031, 0.26723480224609375, 0.2814292907714844, 0.295623779296875, 0.3098182678222656, 0.32401275634765625, 0.3382072448730469, 0.3524017333984375, 0.3665962219238281, 0.38079071044921875, 0.3949851989746094, 0.4091796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 4.0, 13.0, 10.0, 10.0, 17.0, 18.0, 26.0, 32.0, 48.0, 51.0, 90.0, 112.0, 72.0, 109.0, 74.0, 69.0, 57.0, 45.0, 29.0, 22.0, 21.0, 17.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0821578800678253e-05, -2.012588083744049e-05, -1.9430182874202728e-05, -1.8734484910964966e-05, -1.8038786947727203e-05, -1.734308898448944e-05, -1.664739102125168e-05, -1.5951693058013916e-05, -1.5255995094776154e-05, -1.4560297131538391e-05, -1.3864599168300629e-05, -1.3168901205062866e-05, -1.2473203241825104e-05, -1.1777505278587341e-05, -1.1081807315349579e-05, -1.0386109352111816e-05, -9.690411388874054e-06, -8.994713425636292e-06, -8.299015462398529e-06, -7.603317499160767e-06, -6.907619535923004e-06, -6.211921572685242e-06, -5.516223609447479e-06, -4.820525646209717e-06, -4.124827682971954e-06, -3.429129719734192e-06, -2.7334317564964294e-06, -2.037733793258667e-06, -1.3420358300209045e-06, -6.463378667831421e-07, 4.936009645462036e-08, 7.450580596923828e-07, 1.4407560229301453e-06, 2.1364539861679077e-06, 2.83215194940567e-06, 3.5278499126434326e-06, 4.223547875881195e-06, 4.9192458391189575e-06, 5.61494380235672e-06, 6.310641765594482e-06, 7.006339728832245e-06, 7.702037692070007e-06, 8.39773565530777e-06, 9.093433618545532e-06, 9.789131581783295e-06, 1.0484829545021057e-05, 1.118052750825882e-05, 1.1876225471496582e-05, 1.2571923434734344e-05, 1.3267621397972107e-05, 1.396331936120987e-05, 1.4659017324447632e-05, 1.5354715287685394e-05, 1.6050413250923157e-05, 1.674611121416092e-05, 1.744180917739868e-05, 1.8137507140636444e-05, 1.8833205103874207e-05, 1.952890306711197e-05, 2.022460103034973e-05, 2.0920298993587494e-05, 2.1615996956825256e-05, 2.231169492006302e-05, 2.300739288330078e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 14.0, 15.0, 16.0, 18.0, 24.0, 33.0, 49.0, 39.0, 85.0, 87.0, 145.0, 225.0, 291.0, 460.0, 666.0, 1163.0, 1932.0, 3266.0, 6414.0, 13741.0, 35500.0, 120110.0, 513000.0, 250222.0, 59656.0, 20930.0, 9142.0, 4615.0, 2451.0, 1441.0, 939.0, 555.0, 394.0, 255.0, 174.0, 139.0, 89.0, 71.0, 43.0, 34.0, 27.0, 21.0, 12.0, 12.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.17529296875, -0.17038726806640625, -0.1654815673828125, -0.16057586669921875, -0.155670166015625, -0.15076446533203125, -0.1458587646484375, -0.14095306396484375, -0.13604736328125, -0.13114166259765625, -0.1262359619140625, -0.12133026123046875, -0.116424560546875, -0.11151885986328125, -0.1066131591796875, -0.10170745849609375, -0.0968017578125, -0.09189605712890625, -0.0869903564453125, -0.08208465576171875, -0.077178955078125, -0.07227325439453125, -0.0673675537109375, -0.06246185302734375, -0.05755615234375, -0.05265045166015625, -0.0477447509765625, -0.04283905029296875, -0.037933349609375, -0.03302764892578125, -0.0281219482421875, -0.02321624755859375, -0.018310546875, -0.01340484619140625, -0.0084991455078125, -0.00359344482421875, 0.001312255859375, 0.00621795654296875, 0.0111236572265625, 0.01602935791015625, 0.02093505859375, 0.02584075927734375, 0.0307464599609375, 0.03565216064453125, 0.040557861328125, 0.04546356201171875, 0.0503692626953125, 0.05527496337890625, 0.0601806640625, 0.06508636474609375, 0.0699920654296875, 0.07489776611328125, 0.079803466796875, 0.08470916748046875, 0.0896148681640625, 0.09452056884765625, 0.09942626953125, 0.10433197021484375, 0.1092376708984375, 0.11414337158203125, 0.119049072265625, 0.12395477294921875, 0.1288604736328125, 0.13376617431640625, 0.138671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 10.0, 9.0, 8.0, 15.0, 25.0, 23.0, 25.0, 47.0, 48.0, 57.0, 79.0, 90.0, 81.0, 83.0, 69.0, 64.0, 55.0, 35.0, 38.0, 25.0, 20.0, 11.0, 18.0, 15.0, 6.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1342315673828125, -0.128570556640625, -0.1229095458984375, -0.11724853515625, -0.1115875244140625, -0.105926513671875, -0.1002655029296875, -0.0946044921875, -0.0889434814453125, -0.083282470703125, -0.0776214599609375, -0.07196044921875, -0.0662994384765625, -0.060638427734375, -0.0549774169921875, -0.04931640625, -0.0436553955078125, -0.037994384765625, -0.0323333740234375, -0.02667236328125, -0.0210113525390625, -0.015350341796875, -0.0096893310546875, -0.0040283203125, 0.0016326904296875, 0.007293701171875, 0.0129547119140625, 0.01861572265625, 0.0242767333984375, 0.029937744140625, 0.0355987548828125, 0.041259765625, 0.0469207763671875, 0.052581787109375, 0.0582427978515625, 0.06390380859375, 0.0695648193359375, 0.075225830078125, 0.0808868408203125, 0.0865478515625, 0.0922088623046875, 0.097869873046875, 0.1035308837890625, 0.10919189453125, 0.1148529052734375, 0.120513916015625, 0.1261749267578125, 0.1318359375, 0.1374969482421875, 0.143157958984375, 0.1488189697265625, 0.15447998046875, 0.1601409912109375, 0.165802001953125, 0.1714630126953125, 0.1771240234375, 0.1827850341796875, 0.188446044921875, 0.1941070556640625, 0.19976806640625, 0.2054290771484375, 0.211090087890625, 0.2167510986328125, 0.222412109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 11.0, 25.0, 37.0, 86.0, 296.0, 399.0, 91.0, 26.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4275641441345215, -3.30173921585083, -3.1759145259857178, -3.0500898361206055, -2.924264907836914, -2.7984399795532227, -2.6726152896881104, -2.546790599822998, -2.4209656715393066, -2.2951407432556152, -2.169316053390503, -2.0434913635253906, -1.9176664352416992, -1.7918416261672974, -1.6660168170928955, -1.5401920080184937, -1.4143671989440918, -1.28854238986969, -1.162717580795288, -1.0368927717208862, -0.9110679626464844, -0.7852431535720825, -0.6594183444976807, -0.5335935354232788, -0.40776872634887695, -0.2819439172744751, -0.15611910820007324, -0.030294299125671387, 0.09553050994873047, 0.22135531902313232, 0.3471801280975342, 0.47300493717193604, 0.5988302230834961, 0.724655032157898, 0.8504798412322998, 0.9763046503067017, 1.1021294593811035, 1.2279542684555054, 1.3537790775299072, 1.479603886604309, 1.605428695678711, 1.7312535047531128, 1.8570783138275146, 1.9829031229019165, 2.1087279319763184, 2.2345528602600098, 2.360377550125122, 2.4862022399902344, 2.612027168273926, 2.737852096557617, 2.8636767864227295, 2.989501476287842, 3.115326404571533, 3.2411513328552246, 3.366976022720337, 3.492800712585449, 3.6186256408691406, 3.744450569152832, 3.8702752590179443, 3.9960999488830566, 4.121924877166748, 4.2477498054504395, 4.373574256896973, 4.499399185180664, 4.6252241134643555]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 7.0, 7.0, 14.0, 15.0, 39.0, 56.0, 81.0, 120.0, 139.0, 139.0, 119.0, 73.0, 48.0, 36.0, 18.0, 17.0, 11.0, 12.0, 5.0, 2.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4463467597961426, -2.3524675369262695, -2.2585883140563965, -2.1647090911865234, -2.0708298683166504, -1.9769506454467773, -1.8830714225769043, -1.7891921997070312, -1.6953129768371582, -1.6014337539672852, -1.507554531097412, -1.413675308227539, -1.319796085357666, -1.225916862487793, -1.13203763961792, -1.0381584167480469, -0.9442793130874634, -0.8504000902175903, -0.7565208673477173, -0.6626416444778442, -0.5687624216079712, -0.47488322854042053, -0.3810040354728699, -0.2871248126029968, -0.19324558973312378, -0.09936637431383133, -0.005487158894538879, 0.08839204907417297, 0.18227127194404602, 0.27615049481391907, 0.3700296878814697, 0.4639089107513428, 0.5577881336212158, 0.6516673564910889, 0.7455465793609619, 0.839425802230835, 0.933305025100708, 1.027184247970581, 1.121063470840454, 1.2149426937103271, 1.3088219165802002, 1.4027011394500732, 1.4965803623199463, 1.5904595851898193, 1.6843388080596924, 1.7782180309295654, 1.8720972537994385, 1.9659764766693115, 2.0598554611206055, 2.1537346839904785, 2.2476139068603516, 2.3414931297302246, 2.4353723526000977, 2.5292515754699707, 2.6231307983398438, 2.717010021209717, 2.81088924407959, 2.904768466949463, 2.998647689819336, 3.092526912689209, 3.186406135559082, 3.280285358428955, 3.374164581298828, 3.468043804168701, 3.561923027038574]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 5.0, 13.0, 9.0, 7.0, 16.0, 14.0, 25.0, 36.0, 57.0, 176.0, 989.0, 19669.0, 4145720.0, 25608.0, 1476.0, 233.0, 81.0, 33.0, 20.0, 20.0, 14.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.107025146484375, -2.04022216796875, -1.973419189453125, -1.9066162109375, -1.839813232421875, -1.77301025390625, -1.706207275390625, -1.639404296875, -1.572601318359375, -1.50579833984375, -1.438995361328125, -1.3721923828125, -1.305389404296875, -1.23858642578125, -1.171783447265625, -1.10498046875, -1.038177490234375, -0.97137451171875, -0.904571533203125, -0.8377685546875, -0.770965576171875, -0.70416259765625, -0.637359619140625, -0.570556640625, -0.503753662109375, -0.43695068359375, -0.370147705078125, -0.3033447265625, -0.236541748046875, -0.16973876953125, -0.102935791015625, -0.0361328125, 0.030670166015625, 0.09747314453125, 0.164276123046875, 0.2310791015625, 0.297882080078125, 0.36468505859375, 0.431488037109375, 0.498291015625, 0.565093994140625, 0.63189697265625, 0.698699951171875, 0.7655029296875, 0.832305908203125, 0.89910888671875, 0.965911865234375, 1.03271484375, 1.099517822265625, 1.16632080078125, 1.233123779296875, 1.2999267578125, 1.366729736328125, 1.43353271484375, 1.500335693359375, 1.567138671875, 1.633941650390625, 1.70074462890625, 1.767547607421875, 1.8343505859375, 1.901153564453125, 1.96795654296875, 2.034759521484375, 2.1015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 12.0, 15.0, 21.0, 28.0, 60.0, 85.0, 132.0, 140.0, 160.0, 122.0, 72.0, 35.0, 25.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 6.0, 2.0, 5.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228729248046875, -0.02195572853088379, -0.021038532257080078, -0.020121335983276367, -0.019204139709472656, -0.018286943435668945, -0.017369747161865234, -0.016452550888061523, -0.015535354614257812, -0.014618158340454102, -0.01370096206665039, -0.01278376579284668, -0.011866569519042969, -0.010949373245239258, -0.010032176971435547, -0.009114980697631836, -0.008197784423828125, -0.007280588150024414, -0.006363391876220703, -0.005446195602416992, -0.004528999328613281, -0.0036118030548095703, -0.0026946067810058594, -0.0017774105072021484, -0.0008602142333984375, 5.698204040527344e-05, 0.0009741783142089844, 0.0018913745880126953, 0.0028085708618164062, 0.003725767135620117, 0.004642963409423828, 0.005560159683227539, 0.00647735595703125, 0.007394552230834961, 0.008311748504638672, 0.009228944778442383, 0.010146141052246094, 0.011063337326049805, 0.011980533599853516, 0.012897729873657227, 0.013814926147460938, 0.014732122421264648, 0.01564931869506836, 0.01656651496887207, 0.01748371124267578, 0.018400907516479492, 0.019318103790283203, 0.020235300064086914, 0.021152496337890625, 0.022069692611694336, 0.022986888885498047, 0.023904085159301758, 0.02482128143310547, 0.02573847770690918, 0.02665567398071289, 0.0275728702545166, 0.028490066528320312, 0.029407262802124023, 0.030324459075927734, 0.031241655349731445, 0.032158851623535156, 0.03307604789733887, 0.03399324417114258, 0.03491044044494629, 0.03582763671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 6.0, 30.0, 61.0, 246.0, 919.0, 6290.0, 277269.0, 3891578.0, 15369.0, 1649.0, 464.0, 175.0, 93.0, 48.0, 39.0, 22.0, 14.0, 6.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.2855033874511719, -0.25435638427734375, -0.22320938110351562, -0.1920623779296875, -0.16091537475585938, -0.12976837158203125, -0.09862136840820312, -0.067474365234375, -0.036327362060546875, -0.00518035888671875, 0.025966644287109375, 0.0571136474609375, 0.08826065063476562, 0.11940765380859375, 0.15055465698242188, 0.18170166015625, 0.21284866333007812, 0.24399566650390625, 0.2751426696777344, 0.3062896728515625, 0.3374366760253906, 0.36858367919921875, 0.3997306823730469, 0.430877685546875, 0.4620246887207031, 0.49317169189453125, 0.5243186950683594, 0.5554656982421875, 0.5866127014160156, 0.6177597045898438, 0.6489067077636719, 0.6800537109375, 0.7112007141113281, 0.7423477172851562, 0.7734947204589844, 0.8046417236328125, 0.8357887268066406, 0.8669357299804688, 0.8980827331542969, 0.929229736328125, 0.9603767395019531, 0.9915237426757812, 1.0226707458496094, 1.0538177490234375, 1.0849647521972656, 1.1161117553710938, 1.1472587585449219, 1.17840576171875, 1.2095527648925781, 1.2406997680664062, 1.2718467712402344, 1.3029937744140625, 1.3341407775878906, 1.3652877807617188, 1.3964347839355469, 1.427581787109375, 1.4587287902832031, 1.4898757934570312, 1.5210227966308594, 1.5521697998046875, 1.5833168029785156, 1.6144638061523438, 1.6456108093261719, 1.6767578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 3.0, 3.0, 9.0, 17.0, 14.0, 13.0, 15.0, 26.0, 48.0, 75.0, 173.0, 437.0, 1499.0, 953.0, 344.0, 152.0, 76.0, 61.0, 35.0, 22.0, 17.0, 16.0, 8.0, 4.0, 5.0, 7.0, 8.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04608154296875, -0.04467201232910156, -0.043262481689453125, -0.04185295104980469, -0.04044342041015625, -0.03903388977050781, -0.037624359130859375, -0.03621482849121094, -0.0348052978515625, -0.03339576721191406, -0.031986236572265625, -0.030576705932617188, -0.02916717529296875, -0.027757644653320312, -0.026348114013671875, -0.024938583374023438, -0.023529052734375, -0.022119522094726562, -0.020709991455078125, -0.019300460815429688, -0.01789093017578125, -0.016481399536132812, -0.015071868896484375, -0.013662338256835938, -0.0122528076171875, -0.010843276977539062, -0.009433746337890625, -0.008024215698242188, -0.00661468505859375, -0.0052051544189453125, -0.003795623779296875, -0.0023860931396484375, -0.0009765625, 0.0004329681396484375, 0.001842498779296875, 0.0032520294189453125, 0.00466156005859375, 0.0060710906982421875, 0.007480621337890625, 0.008890151977539062, 0.0102996826171875, 0.011709213256835938, 0.013118743896484375, 0.014528274536132812, 0.01593780517578125, 0.017347335815429688, 0.018756866455078125, 0.020166397094726562, 0.021575927734375, 0.022985458374023438, 0.024394989013671875, 0.025804519653320312, 0.02721405029296875, 0.028623580932617188, 0.030033111572265625, 0.03144264221191406, 0.0328521728515625, 0.03426170349121094, 0.035671234130859375, 0.03708076477050781, 0.03849029541015625, 0.03989982604980469, 0.041309356689453125, 0.04271888732910156, 0.04412841796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 454.0, 497.0, 43.0, 12.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39107492566108704, -0.2905176877975464, -0.18996047973632812, -0.08940324187278748, 0.011153966188430786, 0.11171117424964905, 0.21226844191551208, 0.31282564997673035, 0.4133828580379486, 0.5139400959014893, 0.6144973039627075, 0.7150545120239258, 0.815611720085144, 0.9161689281463623, 1.0167262554168701, 1.1172834634780884, 1.2178406715393066, 1.318397879600525, 1.4189550876617432, 1.519512414932251, 1.6200695037841797, 1.7206268310546875, 1.8211840391159058, 1.921741247177124, 2.0222983360290527, 2.1228556632995605, 2.2234127521514893, 2.323970079421997, 2.424527168273926, 2.5250844955444336, 2.6256418228149414, 2.72619891166687, 2.826756000518799, 2.9273133277893066, 3.0278704166412354, 3.128427743911743, 3.228984832763672, 3.3295421600341797, 3.4300994873046875, 3.530656576156616, 3.631213665008545, 3.7317709922790527, 3.8323280811309814, 3.9328854084014893, 4.033442497253418, 4.133999824523926, 4.234557151794434, 4.335114479064941, 4.435671806335449, 4.536229133605957, 4.636786460876465, 4.7373433113098145, 4.837900638580322, 4.93845796585083, 5.039015293121338, 5.1395721435546875, 5.240129470825195, 5.340686798095703, 5.441244125366211, 5.5418009757995605, 5.642358303070068, 5.742915630340576, 5.843472957611084, 5.944029808044434, 6.044587135314941]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 15.0, 17.0, 18.0, 18.0, 31.0, 29.0, 44.0, 46.0, 53.0, 71.0, 57.0, 81.0, 85.0, 53.0, 57.0, 63.0, 52.0, 33.0, 32.0, 21.0, 25.0, 15.0, 12.0, 11.0, 10.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3589369058609009, -0.3487369418144226, -0.33853697776794434, -0.3283369839191437, -0.3181370198726654, -0.30793705582618713, -0.29773709177970886, -0.2875371277332306, -0.27733713388442993, -0.26713716983795166, -0.2569372057914734, -0.24673722684383392, -0.23653724789619446, -0.2263372838497162, -0.21613731980323792, -0.20593735575675964, -0.19573739171028137, -0.1855374276638031, -0.17533744871616364, -0.16513748466968536, -0.1549375057220459, -0.14473754167556763, -0.13453757762908936, -0.12433760613203049, -0.11413763463497162, -0.10393766313791275, -0.09373769164085388, -0.08353772759437561, -0.07333775609731674, -0.06313778460025787, -0.052937816828489304, -0.042737849056720734, -0.032537877559661865, -0.022337907925248146, -0.012137938290834427, -0.0019379686564207077, 0.008262000977993011, 0.01846197247505188, 0.02866194024682045, 0.03886190801858902, 0.04906187951564789, 0.05926185101270676, 0.06946182250976562, 0.0796617865562439, 0.08986175805330276, 0.10006172955036163, 0.1102616935968399, 0.12046166509389877, 0.13066163659095764, 0.1408616006374359, 0.15106157958507538, 0.16126154363155365, 0.17146152257919312, 0.1816614866256714, 0.19186145067214966, 0.20206141471862793, 0.2122613936662674, 0.22246135771274567, 0.23266133666038513, 0.2428613007068634, 0.2530612647533417, 0.26326125860214233, 0.2734612226486206, 0.2836611866950989, 0.29386115074157715]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 19.0, 19.0, 25.0, 57.0, 60.0, 107.0, 163.0, 240.0, 375.0, 593.0, 959.0, 1631.0, 2619.0, 4768.0, 9097.0, 20058.0, 54205.0, 205515.0, 508677.0, 158629.0, 44866.0, 17134.0, 8070.0, 4320.0, 2432.0, 1450.0, 852.0, 543.0, 363.0, 248.0, 161.0, 93.0, 61.0, 42.0, 24.0, 19.0, 13.0, 10.0, 7.0, 14.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12605667114257812, -0.12162017822265625, -0.11718368530273438, -0.1127471923828125, -0.10831069946289062, -0.10387420654296875, -0.09943771362304688, -0.095001220703125, -0.09056472778320312, -0.08612823486328125, -0.08169174194335938, -0.0772552490234375, -0.07281875610351562, -0.06838226318359375, -0.06394577026367188, -0.05950927734375, -0.055072784423828125, -0.05063629150390625, -0.046199798583984375, -0.0417633056640625, -0.037326812744140625, -0.03289031982421875, -0.028453826904296875, -0.024017333984375, -0.019580841064453125, -0.01514434814453125, -0.010707855224609375, -0.0062713623046875, -0.001834869384765625, 0.00260162353515625, 0.007038116455078125, 0.011474609375, 0.015911102294921875, 0.02034759521484375, 0.024784088134765625, 0.0292205810546875, 0.033657073974609375, 0.03809356689453125, 0.042530059814453125, 0.046966552734375, 0.051403045654296875, 0.05583953857421875, 0.060276031494140625, 0.0647125244140625, 0.06914901733398438, 0.07358551025390625, 0.07802200317382812, 0.08245849609375, 0.08689498901367188, 0.09133148193359375, 0.09576797485351562, 0.1002044677734375, 0.10464096069335938, 0.10907745361328125, 0.11351394653320312, 0.117950439453125, 0.12238693237304688, 0.12682342529296875, 0.13125991821289062, 0.1356964111328125, 0.14013290405273438, 0.14456939697265625, 0.14900588989257812, 0.1534423828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 9.0, 6.0, 8.0, 12.0, 25.0, 32.0, 45.0, 62.0, 56.0, 78.0, 81.0, 86.0, 92.0, 72.0, 63.0, 58.0, 48.0, 37.0, 22.0, 23.0, 13.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.016754150390625, -0.016226768493652344, -0.015699386596679688, -0.015172004699707031, -0.014644622802734375, -0.014117240905761719, -0.013589859008789062, -0.013062477111816406, -0.01253509521484375, -0.012007713317871094, -0.011480331420898438, -0.010952949523925781, -0.010425567626953125, -0.009898185729980469, -0.009370803833007812, -0.008843421936035156, -0.0083160400390625, -0.007788658142089844, -0.0072612762451171875, -0.006733894348144531, -0.006206512451171875, -0.005679130554199219, -0.0051517486572265625, -0.004624366760253906, -0.00409698486328125, -0.0035696029663085938, -0.0030422210693359375, -0.0025148391723632812, -0.001987457275390625, -0.0014600753784179688, -0.0009326934814453125, -0.00040531158447265625, 0.0001220703125, 0.0006494522094726562, 0.0011768341064453125, 0.0017042160034179688, 0.002231597900390625, 0.0027589797973632812, 0.0032863616943359375, 0.0038137435913085938, 0.00434112548828125, 0.004868507385253906, 0.0053958892822265625, 0.005923271179199219, 0.006450653076171875, 0.006978034973144531, 0.0075054168701171875, 0.008032798767089844, 0.0085601806640625, 0.009087562561035156, 0.009614944458007812, 0.010142326354980469, 0.010669708251953125, 0.011197090148925781, 0.011724472045898438, 0.012251853942871094, 0.01277923583984375, 0.013306617736816406, 0.013833999633789062, 0.014361381530761719, 0.014888763427734375, 0.015416145324707031, 0.015943527221679688, 0.016470909118652344, 0.016998291015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 6.0, 2.0, 1.0, 7.0, 9.0, 13.0, 29.0, 126.0, 1434.0, 48227.0, 951374.0, 45702.0, 1374.0, 133.0, 30.0, 13.0, 8.0, 5.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67041015625, -0.65203857421875, -0.6336669921875, -0.61529541015625, -0.596923828125, -0.57855224609375, -0.5601806640625, -0.54180908203125, -0.5234375, -0.50506591796875, -0.4866943359375, -0.46832275390625, -0.449951171875, -0.43157958984375, -0.4132080078125, -0.39483642578125, -0.37646484375, -0.35809326171875, -0.3397216796875, -0.32135009765625, -0.302978515625, -0.28460693359375, -0.2662353515625, -0.24786376953125, -0.2294921875, -0.21112060546875, -0.1927490234375, -0.17437744140625, -0.156005859375, -0.13763427734375, -0.1192626953125, -0.10089111328125, -0.08251953125, -0.06414794921875, -0.0457763671875, -0.02740478515625, -0.009033203125, 0.00933837890625, 0.0277099609375, 0.04608154296875, 0.064453125, 0.08282470703125, 0.1011962890625, 0.11956787109375, 0.137939453125, 0.15631103515625, 0.1746826171875, 0.19305419921875, 0.21142578125, 0.22979736328125, 0.2481689453125, 0.26654052734375, 0.284912109375, 0.30328369140625, 0.3216552734375, 0.34002685546875, 0.3583984375, 0.37677001953125, 0.3951416015625, 0.41351318359375, 0.431884765625, 0.45025634765625, 0.4686279296875, 0.48699951171875, 0.50537109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 5.0, 6.0, 17.0, 15.0, 16.0, 17.0, 22.0, 15.0, 24.0, 30.0, 25.0, 28.0, 28.0, 33.0, 35.0, 36.0, 40.0, 47.0, 39.0, 48.0, 49.0, 44.0, 44.0, 43.0, 27.0, 38.0, 28.0, 27.0, 20.0, 19.0, 15.0, 17.0, 11.0, 15.0, 14.0, 5.0, 6.0, 6.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.07422637939453125, -0.0718536376953125, -0.06948089599609375, -0.067108154296875, -0.06473541259765625, -0.0623626708984375, -0.05998992919921875, -0.0576171875, -0.05524444580078125, -0.0528717041015625, -0.05049896240234375, -0.048126220703125, -0.04575347900390625, -0.0433807373046875, -0.04100799560546875, -0.03863525390625, -0.03626251220703125, -0.0338897705078125, -0.03151702880859375, -0.029144287109375, -0.02677154541015625, -0.0243988037109375, -0.02202606201171875, -0.0196533203125, -0.01728057861328125, -0.0149078369140625, -0.01253509521484375, -0.010162353515625, -0.00778961181640625, -0.0054168701171875, -0.00304412841796875, -0.00067138671875, 0.00170135498046875, 0.0040740966796875, 0.00644683837890625, 0.008819580078125, 0.01119232177734375, 0.0135650634765625, 0.01593780517578125, 0.018310546875, 0.02068328857421875, 0.0230560302734375, 0.02542877197265625, 0.027801513671875, 0.03017425537109375, 0.0325469970703125, 0.03491973876953125, 0.03729248046875, 0.03966522216796875, 0.0420379638671875, 0.04441070556640625, 0.046783447265625, 0.04915618896484375, 0.0515289306640625, 0.05390167236328125, 0.0562744140625, 0.05864715576171875, 0.0610198974609375, 0.06339263916015625, 0.065765380859375, 0.06813812255859375, 0.0705108642578125, 0.07288360595703125, 0.07525634765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 11.0, 26.0, 129.0, 1130.0, 1043186.0, 3757.0, 227.0, 58.0, 12.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.233642578125, -4.10400390625, -3.974365234375, -3.8447265625, -3.715087890625, -3.58544921875, -3.455810546875, -3.326171875, -3.196533203125, -3.06689453125, -2.937255859375, -2.8076171875, -2.677978515625, -2.54833984375, -2.418701171875, -2.2890625, -2.159423828125, -2.02978515625, -1.900146484375, -1.7705078125, -1.640869140625, -1.51123046875, -1.381591796875, -1.251953125, -1.122314453125, -0.99267578125, -0.863037109375, -0.7333984375, -0.603759765625, -0.47412109375, -0.344482421875, -0.21484375, -0.085205078125, 0.04443359375, 0.174072265625, 0.3037109375, 0.433349609375, 0.56298828125, 0.692626953125, 0.822265625, 0.951904296875, 1.08154296875, 1.211181640625, 1.3408203125, 1.470458984375, 1.60009765625, 1.729736328125, 1.859375, 1.989013671875, 2.11865234375, 2.248291015625, 2.3779296875, 2.507568359375, 2.63720703125, 2.766845703125, 2.896484375, 3.026123046875, 3.15576171875, 3.285400390625, 3.4150390625, 3.544677734375, 3.67431640625, 3.803955078125, 3.93359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 7.0, 6.0, 16.0, 15.0, 26.0, 31.0, 48.0, 114.0, 178.0, 206.0, 143.0, 67.0, 48.0, 25.0, 14.0, 21.0, 7.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46574592590332e-05, -5.194917321205139e-05, -4.924088716506958e-05, -4.653260111808777e-05, -4.382431507110596e-05, -4.1116029024124146e-05, -3.8407742977142334e-05, -3.569945693016052e-05, -3.299117088317871e-05, -3.02828848361969e-05, -2.7574598789215088e-05, -2.4866312742233276e-05, -2.2158026695251465e-05, -1.9449740648269653e-05, -1.6741454601287842e-05, -1.403316855430603e-05, -1.1324882507324219e-05, -8.616596460342407e-06, -5.908310413360596e-06, -3.200024366378784e-06, -4.917383193969727e-07, 2.216547727584839e-06, 4.92483377456665e-06, 7.633119821548462e-06, 1.0341405868530273e-05, 1.3049691915512085e-05, 1.5757977962493896e-05, 1.8466264009475708e-05, 2.117455005645752e-05, 2.388283610343933e-05, 2.6591122150421143e-05, 2.9299408197402954e-05, 3.2007694244384766e-05, 3.471598029136658e-05, 3.742426633834839e-05, 4.01325523853302e-05, 4.284083843231201e-05, 4.554912447929382e-05, 4.8257410526275635e-05, 5.0965696573257446e-05, 5.367398262023926e-05, 5.638226866722107e-05, 5.909055471420288e-05, 6.179884076118469e-05, 6.45071268081665e-05, 6.721541285514832e-05, 6.992369890213013e-05, 7.263198494911194e-05, 7.534027099609375e-05, 7.804855704307556e-05, 8.075684309005737e-05, 8.346512913703918e-05, 8.6173415184021e-05, 8.888170123100281e-05, 9.158998727798462e-05, 9.429827332496643e-05, 9.700655937194824e-05, 9.971484541893005e-05, 0.00010242313146591187, 0.00010513141751289368, 0.00010783970355987549, 0.0001105479896068573, 0.00011325627565383911, 0.00011596456170082092, 0.00011867284774780273]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 1.0, 12.0, 12.0, 25.0, 23.0, 40.0, 57.0, 84.0, 135.0, 284.0, 678.0, 1912.0, 7049.0, 122242.0, 889388.0, 20838.0, 3669.0, 1115.0, 427.0, 207.0, 106.0, 69.0, 48.0, 29.0, 27.0, 13.0, 11.0, 11.0, 15.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4163856506347656, -0.39990997314453125, -0.3834342956542969, -0.3669586181640625, -0.3504829406738281, -0.33400726318359375, -0.3175315856933594, -0.301055908203125, -0.2845802307128906, -0.26810455322265625, -0.2516288757324219, -0.2351531982421875, -0.21867752075195312, -0.20220184326171875, -0.18572616577148438, -0.16925048828125, -0.15277481079101562, -0.13629913330078125, -0.11982345581054688, -0.1033477783203125, -0.08687210083007812, -0.07039642333984375, -0.053920745849609375, -0.037445068359375, -0.020969390869140625, -0.00449371337890625, 0.011981964111328125, 0.0284576416015625, 0.044933319091796875, 0.06140899658203125, 0.07788467407226562, 0.0943603515625, 0.11083602905273438, 0.12731170654296875, 0.14378738403320312, 0.1602630615234375, 0.17673873901367188, 0.19321441650390625, 0.20969009399414062, 0.226165771484375, 0.24264144897460938, 0.25911712646484375, 0.2755928039550781, 0.2920684814453125, 0.3085441589355469, 0.32501983642578125, 0.3414955139160156, 0.35797119140625, 0.3744468688964844, 0.39092254638671875, 0.4073982238769531, 0.4238739013671875, 0.4403495788574219, 0.45682525634765625, 0.4733009338378906, 0.489776611328125, 0.5062522888183594, 0.5227279663085938, 0.5392036437988281, 0.5556793212890625, 0.5721549987792969, 0.5886306762695312, 0.6051063537597656, 0.62158203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 15.0, 42.0, 85.0, 146.0, 198.0, 181.0, 144.0, 86.0, 43.0, 22.0, 11.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14306640625, -0.136627197265625, -0.13018798828125, -0.123748779296875, -0.1173095703125, -0.110870361328125, -0.10443115234375, -0.097991943359375, -0.091552734375, -0.085113525390625, -0.07867431640625, -0.072235107421875, -0.0657958984375, -0.059356689453125, -0.05291748046875, -0.046478271484375, -0.0400390625, -0.033599853515625, -0.02716064453125, -0.020721435546875, -0.0142822265625, -0.007843017578125, -0.00140380859375, 0.005035400390625, 0.011474609375, 0.017913818359375, 0.02435302734375, 0.030792236328125, 0.0372314453125, 0.043670654296875, 0.05010986328125, 0.056549072265625, 0.06298828125, 0.069427490234375, 0.07586669921875, 0.082305908203125, 0.0887451171875, 0.095184326171875, 0.10162353515625, 0.108062744140625, 0.114501953125, 0.120941162109375, 0.12738037109375, 0.133819580078125, 0.1402587890625, 0.146697998046875, 0.15313720703125, 0.159576416015625, 0.166015625, 0.172454833984375, 0.17889404296875, 0.185333251953125, 0.1917724609375, 0.198211669921875, 0.20465087890625, 0.211090087890625, 0.217529296875, 0.223968505859375, 0.23040771484375, 0.236846923828125, 0.2432861328125, 0.249725341796875, 0.25616455078125, 0.262603759765625, 0.26904296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 15.0, 24.0, 75.0, 199.0, 323.0, 213.0, 76.0, 38.0, 20.0, 11.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9265696406364441, -0.8625232577323914, -0.7984769344329834, -0.7344305515289307, -0.6703841686248779, -0.60633784532547, -0.5422914624214172, -0.4782451093196869, -0.41419875621795654, -0.3501524031162262, -0.28610605001449585, -0.22205966711044312, -0.15801331400871277, -0.09396696090698242, -0.029920578002929688, 0.03412577509880066, 0.098172128200531, 0.16221848130226135, 0.2262648493051529, 0.29031121730804443, 0.3543575704097748, 0.4184039235115051, 0.48245030641555786, 0.5464966297149658, 0.6105430126190186, 0.6745893955230713, 0.7386357188224792, 0.802682101726532, 0.8667284250259399, 0.9307748079299927, 0.9948211908340454, 1.0588675737380981, 1.1229138374328613, 1.186960220336914, 1.2510066032409668, 1.3150529861450195, 1.3790992498397827, 1.4431456327438354, 1.5071920156478882, 1.571238398551941, 1.635284662246704, 1.6993310451507568, 1.7633774280548096, 1.8274238109588623, 1.8914700746536255, 1.9555164575576782, 2.0195627212524414, 2.083609104156494, 2.147655487060547, 2.2117018699645996, 2.2757482528686523, 2.339794635772705, 2.403841018676758, 2.4678874015808105, 2.5319337844848633, 2.595979928970337, 2.6600265502929688, 2.7240729331970215, 2.788119316101074, 2.852165699005127, 2.9162120819091797, 2.9802584648132324, 3.044304847717285, 3.108350992202759, 3.1723973751068115]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 9.0, 11.0, 13.0, 20.0, 29.0, 24.0, 42.0, 55.0, 62.0, 67.0, 79.0, 79.0, 72.0, 69.0, 82.0, 66.0, 43.0, 41.0, 32.0, 20.0, 15.0, 18.0, 6.0, 3.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9880886673927307, -0.959455668926239, -0.9308226704597473, -0.9021896123886108, -0.8735566139221191, -0.8449236154556274, -0.8162906169891357, -0.787657618522644, -0.7590246200561523, -0.7303916215896606, -0.701758623123169, -0.6731256246566772, -0.6444925665855408, -0.6158595681190491, -0.5872265696525574, -0.5585935711860657, -0.5299605131149292, -0.5013275146484375, -0.4726944863796234, -0.4440614879131317, -0.4154284596443176, -0.3867954611778259, -0.35816246271133423, -0.32952946424484253, -0.30089643597602844, -0.27226343750953674, -0.24363040924072266, -0.21499741077423096, -0.18636439740657806, -0.15773138403892517, -0.12909838557243347, -0.10046537220478058, -0.07183235883712769, -0.04319934919476509, -0.014566339552402496, 0.0140666663646698, 0.04269967973232269, 0.07133269309997559, 0.09996569156646729, 0.12859870493412018, 0.15723171830177307, 0.18586473166942596, 0.21449774503707886, 0.24313074350357056, 0.27176374197006226, 0.30039677023887634, 0.32902976870536804, 0.35766279697418213, 0.38629579544067383, 0.4149287939071655, 0.4435618221759796, 0.4721948206424713, 0.5008278489112854, 0.5294608473777771, 0.5580938458442688, 0.5867268443107605, 0.615359902381897, 0.6439929008483887, 0.6726258993148804, 0.7012588977813721, 0.7298919558525085, 0.7585249543190002, 0.7871579527854919, 0.8157909512519836, 0.8444239497184753]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 8.0, 10.0, 6.0, 4.0, 7.0, 23.0, 20.0, 26.0, 45.0, 92.0, 219.0, 1120.0, 14313.0, 4141087.0, 34933.0, 1842.0, 284.0, 88.0, 29.0, 26.0, 18.0, 10.0, 14.0, 8.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.0390625, -1.9862518310546875, -1.933441162109375, -1.8806304931640625, -1.82781982421875, -1.7750091552734375, -1.722198486328125, -1.6693878173828125, -1.6165771484375, -1.5637664794921875, -1.510955810546875, -1.4581451416015625, -1.40533447265625, -1.3525238037109375, -1.299713134765625, -1.2469024658203125, -1.194091796875, -1.1412811279296875, -1.088470458984375, -1.0356597900390625, -0.98284912109375, -0.9300384521484375, -0.877227783203125, -0.8244171142578125, -0.7716064453125, -0.7187957763671875, -0.665985107421875, -0.6131744384765625, -0.56036376953125, -0.5075531005859375, -0.454742431640625, -0.4019317626953125, -0.34912109375, -0.2963104248046875, -0.243499755859375, -0.1906890869140625, -0.13787841796875, -0.0850677490234375, -0.032257080078125, 0.0205535888671875, 0.0733642578125, 0.1261749267578125, 0.178985595703125, 0.2317962646484375, 0.28460693359375, 0.3374176025390625, 0.390228271484375, 0.4430389404296875, 0.495849609375, 0.5486602783203125, 0.601470947265625, 0.6542816162109375, 0.70709228515625, 0.7599029541015625, 0.812713623046875, 0.8655242919921875, 0.9183349609375, 0.9711456298828125, 1.023956298828125, 1.0767669677734375, 1.12957763671875, 1.1823883056640625, 1.235198974609375, 1.2880096435546875, 1.3408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 6.0, 6.0, 1.0, 2.0, 5.0, 9.0, 16.0, 15.0, 26.0, 22.0, 26.0, 33.0, 43.0, 49.0, 58.0, 69.0, 78.0, 78.0, 79.0, 69.0, 61.0, 50.0, 46.0, 42.0, 31.0, 14.0, 14.0, 14.0, 3.0, 7.0, 8.0, 7.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.0159454345703125, -0.015467166900634766, -0.014988899230957031, -0.014510631561279297, -0.014032363891601562, -0.013554096221923828, -0.013075828552246094, -0.01259756088256836, -0.012119293212890625, -0.01164102554321289, -0.011162757873535156, -0.010684490203857422, -0.010206222534179688, -0.009727954864501953, -0.009249687194824219, -0.008771419525146484, -0.00829315185546875, -0.007814884185791016, -0.007336616516113281, -0.006858348846435547, -0.0063800811767578125, -0.005901813507080078, -0.005423545837402344, -0.004945278167724609, -0.004467010498046875, -0.003988742828369141, -0.0035104751586914062, -0.003032207489013672, -0.0025539398193359375, -0.002075672149658203, -0.0015974044799804688, -0.0011191368103027344, -0.000640869140625, -0.00016260147094726562, 0.00031566619873046875, 0.0007939338684082031, 0.0012722015380859375, 0.0017504692077636719, 0.0022287368774414062, 0.0027070045471191406, 0.003185272216796875, 0.0036635398864746094, 0.004141807556152344, 0.004620075225830078, 0.0050983428955078125, 0.005576610565185547, 0.006054878234863281, 0.006533145904541016, 0.00701141357421875, 0.007489681243896484, 0.007967948913574219, 0.008446216583251953, 0.008924484252929688, 0.009402751922607422, 0.009881019592285156, 0.01035928726196289, 0.010837554931640625, 0.01131582260131836, 0.011794090270996094, 0.012272357940673828, 0.012750625610351562, 0.013228893280029297, 0.013707160949707031, 0.014185428619384766, 0.0146636962890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 16.0, 16.0, 41.0, 74.0, 246.0, 6416.0, 4172546.0, 14466.0, 288.0, 92.0, 36.0, 21.0, 12.0, 4.0, 8.0, 2.0, 1.0, 1.0], "bins": [-3.43359375, -3.3682785034179688, -3.3029632568359375, -3.2376480102539062, -3.172332763671875, -3.1070175170898438, -3.0417022705078125, -2.9763870239257812, -2.91107177734375, -2.8457565307617188, -2.7804412841796875, -2.7151260375976562, -2.649810791015625, -2.5844955444335938, -2.5191802978515625, -2.4538650512695312, -2.3885498046875, -2.3232345581054688, -2.2579193115234375, -2.1926040649414062, -2.127288818359375, -2.0619735717773438, -1.9966583251953125, -1.9313430786132812, -1.86602783203125, -1.8007125854492188, -1.7353973388671875, -1.6700820922851562, -1.604766845703125, -1.5394515991210938, -1.4741363525390625, -1.4088211059570312, -1.343505859375, -1.2781906127929688, -1.2128753662109375, -1.1475601196289062, -1.082244873046875, -1.0169296264648438, -0.9516143798828125, -0.8862991333007812, -0.82098388671875, -0.7556686401367188, -0.6903533935546875, -0.6250381469726562, -0.559722900390625, -0.49440765380859375, -0.4290924072265625, -0.36377716064453125, -0.2984619140625, -0.23314666748046875, -0.1678314208984375, -0.10251617431640625, -0.037200927734375, 0.02811431884765625, 0.0934295654296875, 0.15874481201171875, 0.22406005859375, 0.28937530517578125, 0.3546905517578125, 0.42000579833984375, 0.485321044921875, 0.5506362915039062, 0.6159515380859375, 0.6812667846679688, 0.74658203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 7.0, 9.0, 11.0, 26.0, 15.0, 20.0, 42.0, 41.0, 61.0, 88.0, 137.0, 213.0, 375.0, 1110.0, 946.0, 358.0, 194.0, 111.0, 76.0, 51.0, 35.0, 36.0, 15.0, 18.0, 12.0, 7.0, 9.0, 5.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.034000396728515625, -0.03278350830078125, -0.031566619873046875, -0.0303497314453125, -0.029132843017578125, -0.02791595458984375, -0.026699066162109375, -0.025482177734375, -0.024265289306640625, -0.02304840087890625, -0.021831512451171875, -0.0206146240234375, -0.019397735595703125, -0.01818084716796875, -0.016963958740234375, -0.0157470703125, -0.014530181884765625, -0.01331329345703125, -0.012096405029296875, -0.0108795166015625, -0.009662628173828125, -0.00844573974609375, -0.007228851318359375, -0.006011962890625, -0.004795074462890625, -0.00357818603515625, -0.002361297607421875, -0.0011444091796875, 7.2479248046875e-05, 0.00128936767578125, 0.002506256103515625, 0.00372314453125, 0.004940032958984375, 0.00615692138671875, 0.007373809814453125, 0.0085906982421875, 0.009807586669921875, 0.01102447509765625, 0.012241363525390625, 0.013458251953125, 0.014675140380859375, 0.01589202880859375, 0.017108917236328125, 0.0183258056640625, 0.019542694091796875, 0.02075958251953125, 0.021976470947265625, 0.023193359375, 0.024410247802734375, 0.02562713623046875, 0.026844024658203125, 0.0280609130859375, 0.029277801513671875, 0.03049468994140625, 0.031711578369140625, 0.032928466796875, 0.034145355224609375, 0.03536224365234375, 0.036579132080078125, 0.0377960205078125, 0.039012908935546875, 0.04022979736328125, 0.041446685791015625, 0.04266357421875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 82.0, 917.0, 14.0, 3.0, 3.0], "bins": [-8.331463813781738, -8.193377494812012, -8.055292129516602, -7.917205810546875, -7.779119968414307, -7.641034126281738, -7.50294828414917, -7.364862442016602, -7.226776123046875, -7.088690280914307, -6.950604438781738, -6.812518119812012, -6.674432277679443, -6.536346435546875, -6.398260593414307, -6.260174751281738, -6.122088432312012, -5.984002590179443, -5.845916748046875, -5.707830429077148, -5.56974458694458, -5.431658744812012, -5.293572902679443, -5.155487060546875, -5.017401218414307, -4.879315376281738, -4.74122953414917, -4.603143215179443, -4.465057373046875, -4.326971530914307, -4.188885688781738, -4.050799369812012, -3.9127135276794434, -3.774627685546875, -3.6365416049957275, -3.498455762863159, -3.3603696823120117, -3.2222838401794434, -3.084197998046875, -2.9461119174957275, -2.80802583694458, -2.6699399948120117, -2.5318539142608643, -2.393768072128296, -2.2556819915771484, -2.11759614944458, -1.9795101881027222, -1.8414242267608643, -1.7033382654190063, -1.5652523040771484, -1.4271663427352905, -1.2890803813934326, -1.1509945392608643, -1.0129084587097168, -0.8748226165771484, -0.7367366552352905, -0.5986506938934326, -0.4605647325515747, -0.3224788010120392, -0.18439286947250366, -0.04630690813064575, 0.09177905321121216, 0.2298649549484253, 0.3679509162902832, 0.5060368776321411]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 9.0, 14.0, 26.0, 39.0, 44.0, 78.0, 85.0, 90.0, 101.0, 104.0, 108.0, 76.0, 71.0, 47.0, 27.0, 20.0, 20.0, 13.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.48254889249801636, -0.4720497727394104, -0.46155062317848206, -0.4510515034198761, -0.44055235385894775, -0.4300532341003418, -0.41955408453941345, -0.4090549647808075, -0.39855581521987915, -0.3880566954612732, -0.37755754590034485, -0.3670584261417389, -0.35655927658081055, -0.3460601568222046, -0.33556100726127625, -0.3250618875026703, -0.31456273794174194, -0.304063618183136, -0.29356446862220764, -0.2830653488636017, -0.27256619930267334, -0.2620670795440674, -0.25156792998313904, -0.24106881022453308, -0.23056969046592712, -0.22007055580615997, -0.20957142114639282, -0.19907228648662567, -0.18857315182685852, -0.17807401716709137, -0.16757488250732422, -0.15707576274871826, -0.14657661318778992, -0.13607747852802277, -0.12557834386825562, -0.11507920920848846, -0.10458007454872131, -0.09408093988895416, -0.08358181267976761, -0.07308267802000046, -0.0625835433602333, -0.052084408700466156, -0.041585274040699005, -0.031086143106222153, -0.020587008446455002, -0.010087873786687851, 0.00041125714778900146, 0.010910391807556152, 0.021409526467323303, 0.031908661127090454, 0.042407795786857605, 0.05290692672133446, 0.0634060651063919, 0.07390519976615906, 0.08440432697534561, 0.09490346163511276, 0.10540259629487991, 0.11590173095464706, 0.12640085816383362, 0.13689999282360077, 0.14739912748336792, 0.15789826214313507, 0.16839739680290222, 0.17889653146266937, 0.18939566612243652]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 4.0, 7.0, 14.0, 11.0, 16.0, 10.0, 17.0, 22.0, 21.0, 26.0, 36.0, 29.0, 25.0, 33.0, 53.0, 42.0, 320.0, 524931.0, 522216.0, 293.0, 58.0, 47.0, 40.0, 31.0, 31.0, 43.0, 29.0, 26.0, 25.0, 16.0, 16.0, 9.0, 4.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.4755859375, -1.4334259033203125, -1.391265869140625, -1.3491058349609375, -1.30694580078125, -1.2647857666015625, -1.222625732421875, -1.1804656982421875, -1.1383056640625, -1.0961456298828125, -1.053985595703125, -1.0118255615234375, -0.96966552734375, -0.9275054931640625, -0.885345458984375, -0.8431854248046875, -0.801025390625, -0.7588653564453125, -0.716705322265625, -0.6745452880859375, -0.63238525390625, -0.5902252197265625, -0.548065185546875, -0.5059051513671875, -0.4637451171875, -0.4215850830078125, -0.379425048828125, -0.3372650146484375, -0.29510498046875, -0.2529449462890625, -0.210784912109375, -0.1686248779296875, -0.12646484375, -0.0843048095703125, -0.042144775390625, 1.52587890625e-05, 0.04217529296875, 0.0843353271484375, 0.126495361328125, 0.1686553955078125, 0.2108154296875, 0.2529754638671875, 0.295135498046875, 0.3372955322265625, 0.37945556640625, 0.4216156005859375, 0.463775634765625, 0.5059356689453125, 0.548095703125, 0.5902557373046875, 0.632415771484375, 0.6745758056640625, 0.71673583984375, 0.7588958740234375, 0.801055908203125, 0.8432159423828125, 0.8853759765625, 0.9275360107421875, 0.969696044921875, 1.0118560791015625, 1.05401611328125, 1.0961761474609375, 1.138336181640625, 1.1804962158203125, 1.22265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 22.0, 54.0, 69.0, 105.0, 174.0, 181.0, 166.0, 107.0, 80.0, 29.0, 11.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.060167551040649414, -0.05884218215942383, -0.05751681327819824, -0.056191444396972656, -0.05486607551574707, -0.053540706634521484, -0.0522153377532959, -0.05088996887207031, -0.04956459999084473, -0.04823923110961914, -0.046913862228393555, -0.04558849334716797, -0.04426312446594238, -0.0429377555847168, -0.04161238670349121, -0.040287017822265625, -0.03896164894104004, -0.03763628005981445, -0.03631091117858887, -0.03498554229736328, -0.033660173416137695, -0.03233480453491211, -0.031009435653686523, -0.029684066772460938, -0.02835869789123535, -0.027033329010009766, -0.02570796012878418, -0.024382591247558594, -0.023057222366333008, -0.021731853485107422, -0.020406484603881836, -0.01908111572265625, -0.017755746841430664, -0.016430377960205078, -0.015105009078979492, -0.013779640197753906, -0.01245427131652832, -0.011128902435302734, -0.009803533554077148, -0.008478164672851562, -0.0071527957916259766, -0.005827426910400391, -0.004502058029174805, -0.0031766891479492188, -0.0018513202667236328, -0.0005259513854980469, 0.0007994174957275391, 0.002124786376953125, 0.003450155258178711, 0.004775524139404297, 0.006100893020629883, 0.007426261901855469, 0.008751630783081055, 0.01007699966430664, 0.011402368545532227, 0.012727737426757812, 0.014053106307983398, 0.015378475189208984, 0.01670384407043457, 0.018029212951660156, 0.019354581832885742, 0.020679950714111328, 0.022005319595336914, 0.0233306884765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 7.0, 11.0, 13.0, 15.0, 27.0, 28.0, 43.0, 73.0, 83.0, 140.0, 235.0, 373.0, 729.0, 1561.0, 3777.0, 11252.0, 45385.0, 261930.0, 553102.0, 131210.0, 26099.0, 7189.0, 2658.0, 1110.0, 583.0, 303.0, 190.0, 118.0, 80.0, 60.0, 38.0, 28.0, 21.0, 17.0, 12.0, 6.0, 6.0, 7.0, 3.0, 5.0, 1.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3113975524902344, -0.30077362060546875, -0.2901496887207031, -0.2795257568359375, -0.2689018249511719, -0.25827789306640625, -0.24765396118164062, -0.237030029296875, -0.22640609741210938, -0.21578216552734375, -0.20515823364257812, -0.1945343017578125, -0.18391036987304688, -0.17328643798828125, -0.16266250610351562, -0.15203857421875, -0.14141464233398438, -0.13079071044921875, -0.12016677856445312, -0.1095428466796875, -0.09891891479492188, -0.08829498291015625, -0.07767105102539062, -0.067047119140625, -0.056423187255859375, -0.04579925537109375, -0.035175323486328125, -0.0245513916015625, -0.013927459716796875, -0.00330352783203125, 0.007320404052734375, 0.0179443359375, 0.028568267822265625, 0.03919219970703125, 0.049816131591796875, 0.0604400634765625, 0.07106399536132812, 0.08168792724609375, 0.09231185913085938, 0.102935791015625, 0.11355972290039062, 0.12418365478515625, 0.13480758666992188, 0.1454315185546875, 0.15605545043945312, 0.16667938232421875, 0.17730331420898438, 0.18792724609375, 0.19855117797851562, 0.20917510986328125, 0.21979904174804688, 0.2304229736328125, 0.24104690551757812, 0.25167083740234375, 0.2622947692871094, 0.272918701171875, 0.2835426330566406, 0.29416656494140625, 0.3047904968261719, 0.3154144287109375, 0.3260383605957031, 0.33666229248046875, 0.3472862243652344, 0.35791015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 7.0, 8.0, 12.0, 16.0, 23.0, 16.0, 36.0, 29.0, 29.0, 46.0, 44.0, 48.0, 52.0, 46.0, 39.0, 60.0, 39.0, 43.0, 41.0, 46.0, 33.0, 46.0, 31.0, 32.0, 19.0, 29.0, 29.0, 17.0, 18.0, 8.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0997314453125, -0.09676265716552734, -0.09379386901855469, -0.09082508087158203, -0.08785629272460938, -0.08488750457763672, -0.08191871643066406, -0.0789499282836914, -0.07598114013671875, -0.0730123519897461, -0.07004356384277344, -0.06707477569580078, -0.06410598754882812, -0.06113719940185547, -0.05816841125488281, -0.055199623107910156, -0.0522308349609375, -0.049262046813964844, -0.04629325866699219, -0.04332447052001953, -0.040355682373046875, -0.03738689422607422, -0.03441810607910156, -0.031449317932128906, -0.02848052978515625, -0.025511741638183594, -0.022542953491210938, -0.01957416534423828, -0.016605377197265625, -0.013636589050292969, -0.010667800903320312, -0.007699012756347656, -0.004730224609375, -0.0017614364624023438, 0.0012073516845703125, 0.004176139831542969, 0.007144927978515625, 0.010113716125488281, 0.013082504272460938, 0.016051292419433594, 0.01902008056640625, 0.021988868713378906, 0.024957656860351562, 0.02792644500732422, 0.030895233154296875, 0.03386402130126953, 0.03683280944824219, 0.039801597595214844, 0.0427703857421875, 0.045739173889160156, 0.04870796203613281, 0.05167675018310547, 0.054645538330078125, 0.05761432647705078, 0.06058311462402344, 0.0635519027709961, 0.06652069091796875, 0.0694894790649414, 0.07245826721191406, 0.07542705535888672, 0.07839584350585938, 0.08136463165283203, 0.08433341979980469, 0.08730220794677734, 0.09027099609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 17.0, 24.0, 42.0, 73.0, 116.0, 197.0, 366.0, 772.0, 1905.0, 6375.0, 39463.0, 755856.0, 222416.0, 15137.0, 3339.0, 1192.0, 544.0, 281.0, 154.0, 83.0, 42.0, 35.0, 20.0, 22.0, 10.0, 11.0, 11.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6158676147460938, -0.5964813232421875, -0.5770950317382812, -0.557708740234375, -0.5383224487304688, -0.5189361572265625, -0.49954986572265625, -0.48016357421875, -0.46077728271484375, -0.4413909912109375, -0.42200469970703125, -0.402618408203125, -0.38323211669921875, -0.3638458251953125, -0.34445953369140625, -0.3250732421875, -0.30568695068359375, -0.2863006591796875, -0.26691436767578125, -0.247528076171875, -0.22814178466796875, -0.2087554931640625, -0.18936920166015625, -0.16998291015625, -0.15059661865234375, -0.1312103271484375, -0.11182403564453125, -0.092437744140625, -0.07305145263671875, -0.0536651611328125, -0.03427886962890625, -0.014892578125, 0.00449371337890625, 0.0238800048828125, 0.04326629638671875, 0.062652587890625, 0.08203887939453125, 0.1014251708984375, 0.12081146240234375, 0.14019775390625, 0.15958404541015625, 0.1789703369140625, 0.19835662841796875, 0.217742919921875, 0.23712921142578125, 0.2565155029296875, 0.27590179443359375, 0.2952880859375, 0.31467437744140625, 0.3340606689453125, 0.35344696044921875, 0.372833251953125, 0.39221954345703125, 0.4116058349609375, 0.43099212646484375, 0.45037841796875, 0.46976470947265625, 0.4891510009765625, 0.5085372924804688, 0.527923583984375, 0.5473098754882812, 0.5666961669921875, 0.5860824584960938, 0.60546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 16.0, 11.0, 24.0, 47.0, 62.0, 92.0, 147.0, 142.0, 143.0, 101.0, 54.0, 47.0, 29.0, 17.0, 12.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.729364395141602e-05, -6.534717977046967e-05, -6.340071558952332e-05, -6.145425140857697e-05, -5.9507787227630615e-05, -5.7561323046684265e-05, -5.5614858865737915e-05, -5.3668394684791565e-05, -5.1721930503845215e-05, -4.9775466322898865e-05, -4.7829002141952515e-05, -4.5882537961006165e-05, -4.3936073780059814e-05, -4.1989609599113464e-05, -4.0043145418167114e-05, -3.8096681237220764e-05, -3.6150217056274414e-05, -3.4203752875328064e-05, -3.2257288694381714e-05, -3.0310824513435364e-05, -2.8364360332489014e-05, -2.6417896151542664e-05, -2.4471431970596313e-05, -2.2524967789649963e-05, -2.0578503608703613e-05, -1.8632039427757263e-05, -1.6685575246810913e-05, -1.4739111065864563e-05, -1.2792646884918213e-05, -1.0846182703971863e-05, -8.899718523025513e-06, -6.953254342079163e-06, -5.0067901611328125e-06, -3.0603259801864624e-06, -1.1138617992401123e-06, 8.326023817062378e-07, 2.779066562652588e-06, 4.725530743598938e-06, 6.671994924545288e-06, 8.618459105491638e-06, 1.0564923286437988e-05, 1.2511387467384338e-05, 1.4457851648330688e-05, 1.640431582927704e-05, 1.835078001022339e-05, 2.029724419116974e-05, 2.224370837211609e-05, 2.419017255306244e-05, 2.613663673400879e-05, 2.808310091495514e-05, 3.002956509590149e-05, 3.197602927684784e-05, 3.392249345779419e-05, 3.586895763874054e-05, 3.781542181968689e-05, 3.976188600063324e-05, 4.170835018157959e-05, 4.365481436252594e-05, 4.560127854347229e-05, 4.754774272441864e-05, 4.949420690536499e-05, 5.144067108631134e-05, 5.338713526725769e-05, 5.533359944820404e-05, 5.728006362915039e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 14.0, 19.0, 30.0, 55.0, 74.0, 126.0, 237.0, 505.0, 1290.0, 4370.0, 22390.0, 767667.0, 233863.0, 13037.0, 3052.0, 929.0, 367.0, 202.0, 104.0, 71.0, 31.0, 41.0, 21.0, 12.0, 12.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8730621337890625, -0.842803955078125, -0.8125457763671875, -0.78228759765625, -0.7520294189453125, -0.721771240234375, -0.6915130615234375, -0.6612548828125, -0.6309967041015625, -0.600738525390625, -0.5704803466796875, -0.54022216796875, -0.5099639892578125, -0.479705810546875, -0.4494476318359375, -0.419189453125, -0.3889312744140625, -0.358673095703125, -0.3284149169921875, -0.29815673828125, -0.2678985595703125, -0.237640380859375, -0.2073822021484375, -0.1771240234375, -0.1468658447265625, -0.116607666015625, -0.0863494873046875, -0.05609130859375, -0.0258331298828125, 0.004425048828125, 0.0346832275390625, 0.06494140625, 0.0951995849609375, 0.125457763671875, 0.1557159423828125, 0.18597412109375, 0.2162322998046875, 0.246490478515625, 0.2767486572265625, 0.3070068359375, 0.3372650146484375, 0.367523193359375, 0.3977813720703125, 0.42803955078125, 0.4582977294921875, 0.488555908203125, 0.5188140869140625, 0.549072265625, 0.5793304443359375, 0.609588623046875, 0.6398468017578125, 0.67010498046875, 0.7003631591796875, 0.730621337890625, 0.7608795166015625, 0.7911376953125, 0.8213958740234375, 0.851654052734375, 0.8819122314453125, 0.91217041015625, 0.9424285888671875, 0.972686767578125, 1.0029449462890625, 1.033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 9.0, 12.0, 20.0, 43.0, 89.0, 183.0, 226.0, 185.0, 105.0, 46.0, 19.0, 14.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5168685913085938, -0.5044403076171875, -0.49201202392578125, -0.479583740234375, -0.46715545654296875, -0.4547271728515625, -0.44229888916015625, -0.42987060546875, -0.41744232177734375, -0.4050140380859375, -0.39258575439453125, -0.380157470703125, -0.36772918701171875, -0.3553009033203125, -0.34287261962890625, -0.3304443359375, -0.31801605224609375, -0.3055877685546875, -0.29315948486328125, -0.280731201171875, -0.26830291748046875, -0.2558746337890625, -0.24344635009765625, -0.23101806640625, -0.21858978271484375, -0.2061614990234375, -0.19373321533203125, -0.181304931640625, -0.16887664794921875, -0.1564483642578125, -0.14402008056640625, -0.131591796875, -0.11916351318359375, -0.1067352294921875, -0.09430694580078125, -0.081878662109375, -0.06945037841796875, -0.0570220947265625, -0.04459381103515625, -0.03216552734375, -0.01973724365234375, -0.0073089599609375, 0.00511932373046875, 0.017547607421875, 0.02997589111328125, 0.0424041748046875, 0.05483245849609375, 0.0672607421875, 0.07968902587890625, 0.0921173095703125, 0.10454559326171875, 0.116973876953125, 0.12940216064453125, 0.1418304443359375, 0.15425872802734375, 0.16668701171875, 0.17911529541015625, 0.1915435791015625, 0.20397186279296875, 0.216400146484375, 0.22882843017578125, 0.2412567138671875, 0.25368499755859375, 0.26611328125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 31.0, 423.0, 492.0, 48.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.483553886413574, -4.139206409454346, -3.794858932495117, -3.4505116939544678, -3.1061642169952393, -2.7618167400360107, -2.4174695014953613, -2.073122024536133, -1.7287745475769043, -1.3844270706176758, -1.0400797128677368, -0.6957323551177979, -0.35138487815856934, -0.00703740119934082, 0.3373098373413086, 0.6816573143005371, 1.0260047912597656, 1.3703522682189941, 1.714699625968933, 2.059046983718872, 2.4033944606781006, 2.747741937637329, 3.0920891761779785, 3.436436653137207, 3.7807841300964355, 4.125131607055664, 4.469479084014893, 4.813826560974121, 5.158173561096191, 5.502521514892578, 5.846868515014648, 6.191215991973877, 6.535564422607422, 6.87991189956665, 7.224259376525879, 7.568606376647949, 7.912954330444336, 8.257301330566406, 8.601648330688477, 8.945996284484863, 9.29034423828125, 9.63469123840332, 9.979039192199707, 10.323386192321777, 10.667734146118164, 11.012081146240234, 11.356428146362305, 11.700776100158691, 12.045123100280762, 12.389470100402832, 12.733818054199219, 13.078165054321289, 13.422513008117676, 13.766860008239746, 14.111207962036133, 14.455554962158203, 14.799901962280273, 15.144248962402344, 15.48859691619873, 15.8329439163208, 16.177291870117188, 16.521638870239258, 16.865985870361328, 17.21033477783203, 17.5546817779541]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 20.0, 32.0, 43.0, 67.0, 87.0, 113.0, 128.0, 98.0, 126.0, 109.0, 57.0, 41.0, 35.0, 16.0, 11.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1933109760284424, -1.135461688041687, -1.077612280845642, -1.0197629928588867, -0.9619137048721313, -0.9040643572807312, -0.846215009689331, -0.7883657217025757, -0.7305164337158203, -0.6726670861244202, -0.6148177981376648, -0.5569684505462646, -0.4991191625595093, -0.44126981496810913, -0.38342049717903137, -0.3255711793899536, -0.26772183179855347, -0.2098725140094757, -0.15202319622039795, -0.094173863530159, -0.03632454574108124, 0.021524786949157715, 0.07937410473823547, 0.13722342252731323, 0.195072740316391, 0.25292205810546875, 0.3107713758945465, 0.36862069368362427, 0.4264700412750244, 0.4843193590641022, 0.5421686768531799, 0.6000180244445801, 0.6578673124313354, 0.7157166600227356, 0.773565948009491, 0.8314152956008911, 0.8892645835876465, 0.9471139311790466, 1.0049632787704468, 1.0628125667572021, 1.1206618547439575, 1.178511142730713, 1.2363605499267578, 1.2942098379135132, 1.3520591259002686, 1.4099085330963135, 1.4677578210830688, 1.5256071090698242, 1.5834565162658691, 1.6413058042526245, 1.6991552114486694, 1.7570044994354248, 1.8148537874221802, 1.8727030754089355, 1.9305524826049805, 1.9884017705917358, 2.046251058578491, 2.104100465774536, 2.161949634552002, 2.219799041748047, 2.277648448944092, 2.3354976177215576, 2.3933470249176025, 2.4511961936950684, 2.5090456008911133]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 14.0, 8.0, 11.0, 16.0, 23.0, 21.0, 41.0, 39.0, 62.0, 73.0, 152.0, 314.0, 1346.0, 2509924.0, 1679724.0, 1730.0, 343.0, 135.0, 75.0, 66.0, 38.0, 31.0, 26.0, 20.0, 12.0, 12.0, 5.0, 2.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.5559539794921875, -3.471282958984375, -3.3866119384765625, -3.30194091796875, -3.2172698974609375, -3.132598876953125, -3.0479278564453125, -2.9632568359375, -2.8785858154296875, -2.793914794921875, -2.7092437744140625, -2.62457275390625, -2.5399017333984375, -2.455230712890625, -2.3705596923828125, -2.285888671875, -2.2012176513671875, -2.116546630859375, -2.0318756103515625, -1.94720458984375, -1.8625335693359375, -1.777862548828125, -1.6931915283203125, -1.6085205078125, -1.5238494873046875, -1.439178466796875, -1.3545074462890625, -1.26983642578125, -1.1851654052734375, -1.100494384765625, -1.0158233642578125, -0.93115234375, -0.8464813232421875, -0.761810302734375, -0.6771392822265625, -0.59246826171875, -0.5077972412109375, -0.423126220703125, -0.3384552001953125, -0.2537841796875, -0.1691131591796875, -0.084442138671875, 0.0002288818359375, 0.08489990234375, 0.1695709228515625, 0.254241943359375, 0.3389129638671875, 0.423583984375, 0.5082550048828125, 0.592926025390625, 0.6775970458984375, 0.76226806640625, 0.8469390869140625, 0.931610107421875, 1.0162811279296875, 1.1009521484375, 1.1856231689453125, 1.270294189453125, 1.3549652099609375, 1.43963623046875, 1.5243072509765625, 1.608978271484375, 1.6936492919921875, 1.7783203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 15.0, 14.0, 28.0, 31.0, 57.0, 52.0, 63.0, 79.0, 86.0, 106.0, 88.0, 66.0, 82.0, 72.0, 43.0, 32.0, 25.0, 16.0, 9.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.039382219314575195, -0.03835916519165039, -0.037336111068725586, -0.03631305694580078, -0.03529000282287598, -0.03426694869995117, -0.03324389457702637, -0.03222084045410156, -0.031197786331176758, -0.030174732208251953, -0.02915167808532715, -0.028128623962402344, -0.02710556983947754, -0.026082515716552734, -0.02505946159362793, -0.024036407470703125, -0.02301335334777832, -0.021990299224853516, -0.02096724510192871, -0.019944190979003906, -0.0189211368560791, -0.017898082733154297, -0.016875028610229492, -0.015851974487304688, -0.014828920364379883, -0.013805866241455078, -0.012782812118530273, -0.011759757995605469, -0.010736703872680664, -0.00971364974975586, -0.008690595626831055, -0.00766754150390625, -0.006644487380981445, -0.005621433258056641, -0.004598379135131836, -0.0035753250122070312, -0.0025522708892822266, -0.0015292167663574219, -0.0005061626434326172, 0.0005168914794921875, 0.0015399456024169922, 0.002562999725341797, 0.0035860538482666016, 0.004609107971191406, 0.005632162094116211, 0.006655216217041016, 0.00767827033996582, 0.008701324462890625, 0.00972437858581543, 0.010747432708740234, 0.011770486831665039, 0.012793540954589844, 0.013816595077514648, 0.014839649200439453, 0.015862703323364258, 0.016885757446289062, 0.017908811569213867, 0.018931865692138672, 0.019954919815063477, 0.02097797393798828, 0.022001028060913086, 0.02302408218383789, 0.024047136306762695, 0.0250701904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 5.0, 9.0, 15.0, 9.0, 14.0, 31.0, 29.0, 58.0, 69.0, 106.0, 110.0, 112.0, 188.0, 1013.0, 4175694.0, 15661.0, 426.0, 152.0, 135.0, 139.0, 78.0, 78.0, 46.0, 45.0, 22.0, 19.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.078125, -7.83880615234375, -7.5994873046875, -7.36016845703125, -7.120849609375, -6.88153076171875, -6.6422119140625, -6.40289306640625, -6.16357421875, -5.92425537109375, -5.6849365234375, -5.44561767578125, -5.206298828125, -4.96697998046875, -4.7276611328125, -4.48834228515625, -4.2490234375, -4.00970458984375, -3.7703857421875, -3.53106689453125, -3.291748046875, -3.05242919921875, -2.8131103515625, -2.57379150390625, -2.33447265625, -2.09515380859375, -1.8558349609375, -1.61651611328125, -1.377197265625, -1.13787841796875, -0.8985595703125, -0.65924072265625, -0.419921875, -0.18060302734375, 0.0587158203125, 0.29803466796875, 0.537353515625, 0.77667236328125, 1.0159912109375, 1.25531005859375, 1.49462890625, 1.73394775390625, 1.9732666015625, 2.21258544921875, 2.451904296875, 2.69122314453125, 2.9305419921875, 3.16986083984375, 3.4091796875, 3.64849853515625, 3.8878173828125, 4.12713623046875, 4.366455078125, 4.60577392578125, 4.8450927734375, 5.08441162109375, 5.32373046875, 5.56304931640625, 5.8023681640625, 6.04168701171875, 6.281005859375, 6.52032470703125, 6.7596435546875, 6.99896240234375, 7.23828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 4.0, 15.0, 31.0, 61.0, 114.0, 369.0, 2141.0, 964.0, 213.0, 92.0, 36.0, 18.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17652320861816406, -0.16994094848632812, -0.1633586883544922, -0.15677642822265625, -0.1501941680908203, -0.14361190795898438, -0.13702964782714844, -0.1304473876953125, -0.12386512756347656, -0.11728286743164062, -0.11070060729980469, -0.10411834716796875, -0.09753608703613281, -0.09095382690429688, -0.08437156677246094, -0.077789306640625, -0.07120704650878906, -0.06462478637695312, -0.05804252624511719, -0.05146026611328125, -0.04487800598144531, -0.038295745849609375, -0.03171348571777344, -0.0251312255859375, -0.018548965454101562, -0.011966705322265625, -0.0053844451904296875, 0.00119781494140625, 0.0077800750732421875, 0.014362335205078125, 0.020944595336914062, 0.02752685546875, 0.03410911560058594, 0.040691375732421875, 0.04727363586425781, 0.05385589599609375, 0.06043815612792969, 0.06702041625976562, 0.07360267639160156, 0.0801849365234375, 0.08676719665527344, 0.09334945678710938, 0.09993171691894531, 0.10651397705078125, 0.11309623718261719, 0.11967849731445312, 0.12626075744628906, 0.132843017578125, 0.13942527770996094, 0.14600753784179688, 0.1525897979736328, 0.15917205810546875, 0.1657543182373047, 0.17233657836914062, 0.17891883850097656, 0.1855010986328125, 0.19208335876464844, 0.19866561889648438, 0.2052478790283203, 0.21183013916015625, 0.2184123992919922, 0.22499465942382812, 0.23157691955566406, 0.2381591796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 7.0, 1.0, 10.0, 11.0, 32.0, 88.0, 241.0, 430.0, 111.0, 46.0, 16.0, 7.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1266584396362305, -4.938282012939453, -4.749905586242676, -4.561529159545898, -4.373152732849121, -4.184776306152344, -3.9963996410369873, -3.80802321434021, -3.6196467876434326, -3.4312703609466553, -3.242893934249878, -3.0545172691345215, -2.866140842437744, -2.677764415740967, -2.4893879890441895, -2.301011562347412, -2.1126351356506348, -1.9242587089538574, -1.73588228225708, -1.5475057363510132, -1.3591293096542358, -1.1707528829574585, -0.9823763370513916, -0.7939999103546143, -0.6056234836578369, -0.4172470271587372, -0.22887057065963745, -0.04049408435821533, 0.147882342338562, 0.33625876903533936, 0.5246353149414062, 0.7130117416381836, 0.9013881683349609, 1.0897645950317383, 1.2781410217285156, 1.4665175676345825, 1.6548939943313599, 1.8432704210281372, 2.031646966934204, 2.2200233936309814, 2.408399820327759, 2.596776247024536, 2.7851526737213135, 2.97352933883667, 3.1619057655334473, 3.3502821922302246, 3.538658618927002, 3.7270350456237793, 3.9154114723205566, 4.103787899017334, 4.292164325714111, 4.480540752410889, 4.668917179107666, 4.857293605804443, 5.045670509338379, 5.234046936035156, 5.422423362731934, 5.610799789428711, 5.799176216125488, 5.987552642822266, 6.175929069519043, 6.36430549621582, 6.552681922912598, 6.741058349609375, 6.929434776306152]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 9.0, 6.0, 9.0, 8.0, 27.0, 31.0, 35.0, 67.0, 67.0, 108.0, 74.0, 103.0, 74.0, 91.0, 72.0, 62.0, 44.0, 47.0, 26.0, 23.0, 12.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6516462564468384, -0.6281753182411194, -0.6047043800354004, -0.5812334418296814, -0.5577625036239624, -0.5342915654182434, -0.5108206272125244, -0.48734965920448303, -0.46387872099876404, -0.44040778279304504, -0.41693684458732605, -0.39346587657928467, -0.3699949383735657, -0.3465240001678467, -0.3230530619621277, -0.2995821237564087, -0.2761111855506897, -0.2526402473449707, -0.2291693091392517, -0.20569835603237152, -0.18222741782665253, -0.15875647962093353, -0.13528552651405334, -0.11181458830833435, -0.08834365010261536, -0.06487271189689636, -0.04140176624059677, -0.01793082058429718, 0.005540117621421814, 0.029011055827140808, 0.052482008934020996, 0.07595294713973999, 0.09942394495010376, 0.12289488315582275, 0.14636582136154175, 0.16983677446842194, 0.19330771267414093, 0.21677865087985992, 0.2402496039867401, 0.2637205421924591, 0.2871914803981781, 0.3106624186038971, 0.3341333568096161, 0.35760432481765747, 0.38107526302337646, 0.40454620122909546, 0.42801713943481445, 0.45148807764053345, 0.47495901584625244, 0.49842995405197144, 0.5219008922576904, 0.5453718304634094, 0.5688427686691284, 0.5923137068748474, 0.6157846450805664, 0.6392556428909302, 0.6627265214920044, 0.6861974596977234, 0.7096683979034424, 0.7331393361091614, 0.7566102743148804, 0.7800812125205994, 0.8035521507263184, 0.8270231485366821, 0.8504940867424011]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 21.0, 20.0, 28.0, 50.0, 72.0, 93.0, 169.0, 349.0, 723.0, 1944.0, 7747.0, 68450.0, 862624.0, 93101.0, 9262.0, 2100.0, 818.0, 356.0, 205.0, 109.0, 84.0, 60.0, 36.0, 20.0, 14.0, 25.0, 10.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37109375, -2.290863037109375, -2.21063232421875, -2.130401611328125, -2.0501708984375, -1.969940185546875, -1.88970947265625, -1.809478759765625, -1.729248046875, -1.649017333984375, -1.56878662109375, -1.488555908203125, -1.4083251953125, -1.328094482421875, -1.24786376953125, -1.167633056640625, -1.08740234375, -1.007171630859375, -0.92694091796875, -0.846710205078125, -0.7664794921875, -0.686248779296875, -0.60601806640625, -0.525787353515625, -0.445556640625, -0.365325927734375, -0.28509521484375, -0.204864501953125, -0.1246337890625, -0.044403076171875, 0.03582763671875, 0.116058349609375, 0.1962890625, 0.276519775390625, 0.35675048828125, 0.436981201171875, 0.5172119140625, 0.597442626953125, 0.67767333984375, 0.757904052734375, 0.838134765625, 0.918365478515625, 0.99859619140625, 1.078826904296875, 1.1590576171875, 1.239288330078125, 1.31951904296875, 1.399749755859375, 1.47998046875, 1.560211181640625, 1.64044189453125, 1.720672607421875, 1.8009033203125, 1.881134033203125, 1.96136474609375, 2.041595458984375, 2.121826171875, 2.202056884765625, 2.28228759765625, 2.362518310546875, 2.4427490234375, 2.522979736328125, 2.60321044921875, 2.683441162109375, 2.763671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 13.0, 12.0, 18.0, 20.0, 35.0, 46.0, 50.0, 67.0, 65.0, 95.0, 85.0, 79.0, 66.0, 79.0, 69.0, 51.0, 35.0, 27.0, 35.0, 10.0, 15.0, 11.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0496826171875, -0.048462629318237305, -0.04724264144897461, -0.046022653579711914, -0.04480266571044922, -0.04358267784118652, -0.04236268997192383, -0.04114270210266113, -0.03992271423339844, -0.03870272636413574, -0.03748273849487305, -0.03626275062561035, -0.035042762756347656, -0.03382277488708496, -0.032602787017822266, -0.03138279914855957, -0.030162811279296875, -0.02894282341003418, -0.027722835540771484, -0.02650284767150879, -0.025282859802246094, -0.0240628719329834, -0.022842884063720703, -0.021622896194458008, -0.020402908325195312, -0.019182920455932617, -0.017962932586669922, -0.016742944717407227, -0.015522956848144531, -0.014302968978881836, -0.01308298110961914, -0.011862993240356445, -0.01064300537109375, -0.009423017501831055, -0.00820302963256836, -0.006983041763305664, -0.005763053894042969, -0.0045430660247802734, -0.003323078155517578, -0.002103090286254883, -0.0008831024169921875, 0.0003368854522705078, 0.0015568733215332031, 0.0027768611907958984, 0.003996849060058594, 0.005216836929321289, 0.006436824798583984, 0.00765681266784668, 0.008876800537109375, 0.01009678840637207, 0.011316776275634766, 0.012536764144897461, 0.013756752014160156, 0.014976739883422852, 0.016196727752685547, 0.017416715621948242, 0.018636703491210938, 0.019856691360473633, 0.021076679229736328, 0.022296667098999023, 0.02351665496826172, 0.024736642837524414, 0.02595663070678711, 0.027176618576049805, 0.0283966064453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 19.0, 13.0, 21.0, 26.0, 33.0, 56.0, 103.0, 131.0, 225.0, 353.0, 696.0, 1355.0, 3382.0, 11059.0, 47556.0, 423201.0, 488064.0, 53521.0, 11940.0, 3666.0, 1443.0, 662.0, 375.0, 240.0, 137.0, 85.0, 64.0, 38.0, 24.0, 26.0, 7.0, 14.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.869140625, -0.838134765625, -0.80712890625, -0.776123046875, -0.7451171875, -0.714111328125, -0.68310546875, -0.652099609375, -0.62109375, -0.590087890625, -0.55908203125, -0.528076171875, -0.4970703125, -0.466064453125, -0.43505859375, -0.404052734375, -0.373046875, -0.342041015625, -0.31103515625, -0.280029296875, -0.2490234375, -0.218017578125, -0.18701171875, -0.156005859375, -0.125, -0.093994140625, -0.06298828125, -0.031982421875, -0.0009765625, 0.030029296875, 0.06103515625, 0.092041015625, 0.123046875, 0.154052734375, 0.18505859375, 0.216064453125, 0.2470703125, 0.278076171875, 0.30908203125, 0.340087890625, 0.37109375, 0.402099609375, 0.43310546875, 0.464111328125, 0.4951171875, 0.526123046875, 0.55712890625, 0.588134765625, 0.619140625, 0.650146484375, 0.68115234375, 0.712158203125, 0.7431640625, 0.774169921875, 0.80517578125, 0.836181640625, 0.8671875, 0.898193359375, 0.92919921875, 0.960205078125, 0.9912109375, 1.022216796875, 1.05322265625, 1.084228515625, 1.115234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 9.0, 14.0, 8.0, 13.0, 16.0, 25.0, 20.0, 26.0, 18.0, 29.0, 36.0, 24.0, 38.0, 39.0, 32.0, 38.0, 50.0, 44.0, 45.0, 45.0, 51.0, 42.0, 36.0, 32.0, 41.0, 25.0, 16.0, 28.0, 22.0, 14.0, 18.0, 21.0, 16.0, 7.0, 7.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1612548828125, -0.1566791534423828, -0.15210342407226562, -0.14752769470214844, -0.14295196533203125, -0.13837623596191406, -0.13380050659179688, -0.1292247772216797, -0.1246490478515625, -0.12007331848144531, -0.11549758911132812, -0.11092185974121094, -0.10634613037109375, -0.10177040100097656, -0.09719467163085938, -0.09261894226074219, -0.088043212890625, -0.08346748352050781, -0.07889175415039062, -0.07431602478027344, -0.06974029541015625, -0.06516456604003906, -0.060588836669921875, -0.05601310729980469, -0.0514373779296875, -0.04686164855957031, -0.042285919189453125, -0.03771018981933594, -0.03313446044921875, -0.028558731079101562, -0.023983001708984375, -0.019407272338867188, -0.01483154296875, -0.010255813598632812, -0.005680084228515625, -0.0011043548583984375, 0.00347137451171875, 0.008047103881835938, 0.012622833251953125, 0.017198562622070312, 0.0217742919921875, 0.026350021362304688, 0.030925750732421875, 0.03550148010253906, 0.04007720947265625, 0.04465293884277344, 0.049228668212890625, 0.05380439758300781, 0.058380126953125, 0.06295585632324219, 0.06753158569335938, 0.07210731506347656, 0.07668304443359375, 0.08125877380371094, 0.08583450317382812, 0.09041023254394531, 0.0949859619140625, 0.09956169128417969, 0.10413742065429688, 0.10871315002441406, 0.11328887939453125, 0.11786460876464844, 0.12244033813476562, 0.1270160675048828, 0.131591796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 13.0, 19.0, 26.0, 38.0, 57.0, 91.0, 207.0, 354.0, 758.0, 2105.0, 9938.0, 183246.0, 822921.0, 22922.0, 3619.0, 1149.0, 450.0, 246.0, 141.0, 79.0, 43.0, 35.0, 18.0, 17.0, 14.0, 12.0, 8.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1868896484375, -1.146240234375, -1.1055908203125, -1.06494140625, -1.0242919921875, -0.983642578125, -0.9429931640625, -0.90234375, -0.8616943359375, -0.821044921875, -0.7803955078125, -0.73974609375, -0.6990966796875, -0.658447265625, -0.6177978515625, -0.5771484375, -0.5364990234375, -0.495849609375, -0.4552001953125, -0.41455078125, -0.3739013671875, -0.333251953125, -0.2926025390625, -0.251953125, -0.2113037109375, -0.170654296875, -0.1300048828125, -0.08935546875, -0.0487060546875, -0.008056640625, 0.0325927734375, 0.0732421875, 0.1138916015625, 0.154541015625, 0.1951904296875, 0.23583984375, 0.2764892578125, 0.317138671875, 0.3577880859375, 0.3984375, 0.4390869140625, 0.479736328125, 0.5203857421875, 0.56103515625, 0.6016845703125, 0.642333984375, 0.6829833984375, 0.7236328125, 0.7642822265625, 0.804931640625, 0.8455810546875, 0.88623046875, 0.9268798828125, 0.967529296875, 1.0081787109375, 1.048828125, 1.0894775390625, 1.130126953125, 1.1707763671875, 1.21142578125, 1.2520751953125, 1.292724609375, 1.3333740234375, 1.3740234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 13.0, 23.0, 29.0, 66.0, 120.0, 218.0, 225.0, 139.0, 79.0, 40.0, 24.0, 14.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001766681671142578, -0.000171637162566185, -0.00016660615801811218, -0.00016157515347003937, -0.00015654414892196655, -0.00015151314437389374, -0.00014648213982582092, -0.0001414511352777481, -0.0001364201307296753, -0.00013138912618160248, -0.00012635812163352966, -0.00012132711708545685, -0.00011629611253738403, -0.00011126510798931122, -0.0001062341034412384, -0.00010120309889316559, -9.617209434509277e-05, -9.114108979701996e-05, -8.611008524894714e-05, -8.107908070087433e-05, -7.604807615280151e-05, -7.10170716047287e-05, -6.598606705665588e-05, -6.095506250858307e-05, -5.5924057960510254e-05, -5.089305341243744e-05, -4.5862048864364624e-05, -4.083104431629181e-05, -3.5800039768218994e-05, -3.076903522014618e-05, -2.5738030672073364e-05, -2.070702612400055e-05, -1.5676021575927734e-05, -1.064501702785492e-05, -5.6140124797821045e-06, -5.830079317092896e-07, 4.447996616363525e-06, 9.47900116443634e-06, 1.4510005712509155e-05, 1.954101026058197e-05, 2.4572014808654785e-05, 2.96030193567276e-05, 3.4634023904800415e-05, 3.966502845287323e-05, 4.4696033000946045e-05, 4.972703754901886e-05, 5.4758042097091675e-05, 5.978904664516449e-05, 6.48200511932373e-05, 6.985105574131012e-05, 7.488206028938293e-05, 7.991306483745575e-05, 8.494406938552856e-05, 8.997507393360138e-05, 9.50060784816742e-05, 0.00010003708302974701, 0.00010506808757781982, 0.00011009909212589264, 0.00011513009667396545, 0.00012016110122203827, 0.00012519210577011108, 0.0001302231103181839, 0.00013525411486625671, 0.00014028511941432953, 0.00014531612396240234]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 14.0, 16.0, 24.0, 20.0, 40.0, 54.0, 77.0, 115.0, 179.0, 371.0, 717.0, 1518.0, 3562.0, 11073.0, 55042.0, 680097.0, 258017.0, 25941.0, 6642.0, 2518.0, 1117.0, 548.0, 290.0, 187.0, 99.0, 52.0, 59.0, 33.0, 23.0, 13.0, 11.0, 13.0, 11.0, 5.0, 2.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7548828125, -0.7318649291992188, -0.7088470458984375, -0.6858291625976562, -0.662811279296875, -0.6397933959960938, -0.6167755126953125, -0.5937576293945312, -0.57073974609375, -0.5477218627929688, -0.5247039794921875, -0.5016860961914062, -0.478668212890625, -0.45565032958984375, -0.4326324462890625, -0.40961456298828125, -0.3865966796875, -0.36357879638671875, -0.3405609130859375, -0.31754302978515625, -0.294525146484375, -0.27150726318359375, -0.2484893798828125, -0.22547149658203125, -0.20245361328125, -0.17943572998046875, -0.1564178466796875, -0.13339996337890625, -0.110382080078125, -0.08736419677734375, -0.0643463134765625, -0.04132843017578125, -0.018310546875, 0.00470733642578125, 0.0277252197265625, 0.05074310302734375, 0.073760986328125, 0.09677886962890625, 0.1197967529296875, 0.14281463623046875, 0.16583251953125, 0.18885040283203125, 0.2118682861328125, 0.23488616943359375, 0.257904052734375, 0.28092193603515625, 0.3039398193359375, 0.32695770263671875, 0.3499755859375, 0.37299346923828125, 0.3960113525390625, 0.41902923583984375, 0.442047119140625, 0.46506500244140625, 0.4880828857421875, 0.5111007690429688, 0.53411865234375, 0.5571365356445312, 0.5801544189453125, 0.6031723022460938, 0.626190185546875, 0.6492080688476562, 0.6722259521484375, 0.6952438354492188, 0.71826171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 11.0, 18.0, 21.0, 36.0, 57.0, 52.0, 79.0, 110.0, 115.0, 125.0, 98.0, 57.0, 59.0, 38.0, 28.0, 12.0, 16.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3506660461425781, -0.34024810791015625, -0.3298301696777344, -0.3194122314453125, -0.3089942932128906, -0.29857635498046875, -0.2881584167480469, -0.277740478515625, -0.2673225402832031, -0.25690460205078125, -0.24648666381835938, -0.2360687255859375, -0.22565078735351562, -0.21523284912109375, -0.20481491088867188, -0.19439697265625, -0.18397903442382812, -0.17356109619140625, -0.16314315795898438, -0.1527252197265625, -0.14230728149414062, -0.13188934326171875, -0.12147140502929688, -0.111053466796875, -0.10063552856445312, -0.09021759033203125, -0.07979965209960938, -0.0693817138671875, -0.058963775634765625, -0.04854583740234375, -0.038127899169921875, -0.0277099609375, -0.017292022705078125, -0.00687408447265625, 0.003543853759765625, 0.0139617919921875, 0.024379730224609375, 0.03479766845703125, 0.045215606689453125, 0.055633544921875, 0.06605148315429688, 0.07646942138671875, 0.08688735961914062, 0.0973052978515625, 0.10772323608398438, 0.11814117431640625, 0.12855911254882812, 0.13897705078125, 0.14939498901367188, 0.15981292724609375, 0.17023086547851562, 0.1806488037109375, 0.19106674194335938, 0.20148468017578125, 0.21190261840820312, 0.222320556640625, 0.23273849487304688, 0.24315643310546875, 0.2535743713378906, 0.2639923095703125, 0.2744102478027344, 0.28482818603515625, 0.2952461242675781, 0.3056640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 10.0, 25.0, 51.0, 136.0, 201.0, 257.0, 165.0, 85.0, 35.0, 10.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.294405460357666, -6.098361968994141, -5.902318477630615, -5.706274509429932, -5.510231018066406, -5.314187526702881, -5.1181440353393555, -4.922100067138672, -4.7260565757751465, -4.530013084411621, -4.333969593048096, -4.137925624847412, -3.9418821334838867, -3.7458386421203613, -3.549795150756836, -3.3537514209747314, -3.157707929611206, -2.9616644382476807, -2.765620708465576, -2.569577217102051, -2.3735334873199463, -2.177489995956421, -1.981446385383606, -1.785402774810791, -1.589359164237976, -1.3933155536651611, -1.1972719430923462, -1.0012283325195312, -0.8051847815513611, -0.6091411709785461, -0.413097620010376, -0.21705400943756104, -0.021010398864746094, 0.17503319680690765, 0.3710767924785614, 0.567120373249054, 0.7631639838218689, 0.9592075943946838, 1.155251145362854, 1.351294755935669, 1.5473383665084839, 1.7433819770812988, 1.9394255876541138, 2.1354691982269287, 2.331512689590454, 2.5275564193725586, 2.723599910736084, 2.9196434020996094, 3.115687131881714, 3.3117306232452393, 3.5077743530273438, 3.703817844390869, 3.8998615741729736, 4.095905303955078, 4.2919487953186035, 4.487992286682129, 4.684035778045654, 4.88007926940918, 5.076122760772705, 5.272166728973389, 5.468210220336914, 5.6642537117004395, 5.860297203063965, 6.056341171264648, 6.252384662628174]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 5.0, 5.0, 11.0, 19.0, 14.0, 26.0, 34.0, 38.0, 40.0, 46.0, 44.0, 44.0, 61.0, 51.0, 70.0, 48.0, 66.0, 61.0, 48.0, 47.0, 38.0, 40.0, 28.0, 29.0, 11.0, 18.0, 10.0, 9.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0267624855041504, -1.972910761833191, -1.919059157371521, -1.8652074337005615, -1.811355710029602, -1.7575039863586426, -1.7036523818969727, -1.6498006582260132, -1.5959489345550537, -1.5420972108840942, -1.4882456064224243, -1.4343938827514648, -1.3805421590805054, -1.326690435409546, -1.272838830947876, -1.2189871072769165, -1.165135383605957, -1.1112836599349976, -1.0574320554733276, -1.0035803318023682, -0.9497286081314087, -0.895876944065094, -0.8420252799987793, -0.7881735563278198, -0.7343219518661499, -0.6804702877998352, -0.6266185641288757, -0.572766900062561, -0.5189151763916016, -0.46506351232528687, -0.4112118184566498, -0.3573601245880127, -0.3035084009170532, -0.24965670704841614, -0.19580501317977905, -0.14195333421230316, -0.08810164034366608, -0.034249961376190186, 0.0196017324924469, 0.07345342636108398, 0.12730512022972107, 0.18115681409835815, 0.23500850796699524, 0.2888602018356323, 0.342711865901947, 0.3965635597705841, 0.4504152536392212, 0.5042669773101807, 0.5581186413764954, 0.6119703054428101, 0.6658220291137695, 0.7196736931800842, 0.7735254168510437, 0.8273770809173584, 0.8812288045883179, 0.9350804686546326, 0.9889321327209473, 1.0427838563919067, 1.0966354608535767, 1.1504871845245361, 1.2043389081954956, 1.258190631866455, 1.312042236328125, 1.3658939599990845, 1.419745683670044]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 3.0, 5.0, 7.0, 6.0, 13.0, 9.0, 14.0, 16.0, 15.0, 24.0, 29.0, 49.0, 58.0, 116.0, 193.0, 288.0, 604.0, 1438.0, 5103.0, 26938.0, 477181.0, 3623094.0, 47116.0, 8260.0, 2104.0, 723.0, 357.0, 195.0, 112.0, 60.0, 43.0, 22.0, 18.0, 13.0, 9.0, 11.0, 10.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.981292724609375, -1.91766357421875, -1.854034423828125, -1.7904052734375, -1.726776123046875, -1.66314697265625, -1.599517822265625, -1.535888671875, -1.472259521484375, -1.40863037109375, -1.345001220703125, -1.2813720703125, -1.217742919921875, -1.15411376953125, -1.090484619140625, -1.02685546875, -0.963226318359375, -0.89959716796875, -0.835968017578125, -0.7723388671875, -0.708709716796875, -0.64508056640625, -0.581451416015625, -0.517822265625, -0.454193115234375, -0.39056396484375, -0.326934814453125, -0.2633056640625, -0.199676513671875, -0.13604736328125, -0.072418212890625, -0.0087890625, 0.054840087890625, 0.11846923828125, 0.182098388671875, 0.2457275390625, 0.309356689453125, 0.37298583984375, 0.436614990234375, 0.500244140625, 0.563873291015625, 0.62750244140625, 0.691131591796875, 0.7547607421875, 0.818389892578125, 0.88201904296875, 0.945648193359375, 1.00927734375, 1.072906494140625, 1.13653564453125, 1.200164794921875, 1.2637939453125, 1.327423095703125, 1.39105224609375, 1.454681396484375, 1.518310546875, 1.581939697265625, 1.64556884765625, 1.709197998046875, 1.7728271484375, 1.836456298828125, 1.90008544921875, 1.963714599609375, 2.02734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 15.0, 19.0, 21.0, 27.0, 30.0, 37.0, 40.0, 43.0, 62.0, 68.0, 67.0, 90.0, 70.0, 61.0, 60.0, 44.0, 53.0, 37.0, 31.0, 27.0, 20.0, 19.0, 9.0, 9.0, 2.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.057281494140625, -0.05589771270751953, -0.05451393127441406, -0.053130149841308594, -0.051746368408203125, -0.050362586975097656, -0.04897880554199219, -0.04759502410888672, -0.04621124267578125, -0.04482746124267578, -0.04344367980957031, -0.042059898376464844, -0.040676116943359375, -0.039292335510253906, -0.03790855407714844, -0.03652477264404297, -0.0351409912109375, -0.03375720977783203, -0.03237342834472656, -0.030989646911621094, -0.029605865478515625, -0.028222084045410156, -0.026838302612304688, -0.02545452117919922, -0.02407073974609375, -0.02268695831298828, -0.021303176879882812, -0.019919395446777344, -0.018535614013671875, -0.017151832580566406, -0.015768051147460938, -0.014384269714355469, -0.01300048828125, -0.011616706848144531, -0.010232925415039062, -0.008849143981933594, -0.007465362548828125, -0.006081581115722656, -0.0046977996826171875, -0.0033140182495117188, -0.00193023681640625, -0.0005464553833007812, 0.0008373260498046875, 0.0022211074829101562, 0.003604888916015625, 0.004988670349121094, 0.0063724517822265625, 0.007756233215332031, 0.0091400146484375, 0.010523796081542969, 0.011907577514648438, 0.013291358947753906, 0.014675140380859375, 0.016058921813964844, 0.017442703247070312, 0.01882648468017578, 0.02021026611328125, 0.02159404754638672, 0.022977828979492188, 0.024361610412597656, 0.025745391845703125, 0.027129173278808594, 0.028512954711914062, 0.02989673614501953, 0.031280517578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 17.0, 15.0, 40.0, 58.0, 125.0, 252.0, 641.0, 2270.0, 159447.0, 4025877.0, 4166.0, 790.0, 262.0, 119.0, 69.0, 54.0, 29.0, 18.0, 9.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3446044921875, -6.126708984375, -5.9088134765625, -5.69091796875, -5.4730224609375, -5.255126953125, -5.0372314453125, -4.8193359375, -4.6014404296875, -4.383544921875, -4.1656494140625, -3.94775390625, -3.7298583984375, -3.511962890625, -3.2940673828125, -3.076171875, -2.8582763671875, -2.640380859375, -2.4224853515625, -2.20458984375, -1.9866943359375, -1.768798828125, -1.5509033203125, -1.3330078125, -1.1151123046875, -0.897216796875, -0.6793212890625, -0.46142578125, -0.2435302734375, -0.025634765625, 0.1922607421875, 0.41015625, 0.6280517578125, 0.845947265625, 1.0638427734375, 1.28173828125, 1.4996337890625, 1.717529296875, 1.9354248046875, 2.1533203125, 2.3712158203125, 2.589111328125, 2.8070068359375, 3.02490234375, 3.2427978515625, 3.460693359375, 3.6785888671875, 3.896484375, 4.1143798828125, 4.332275390625, 4.5501708984375, 4.76806640625, 4.9859619140625, 5.203857421875, 5.4217529296875, 5.6396484375, 5.8575439453125, 6.075439453125, 6.2933349609375, 6.51123046875, 6.7291259765625, 6.947021484375, 7.1649169921875, 7.3828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 13.0, 29.0, 46.0, 104.0, 395.0, 2576.0, 603.0, 168.0, 59.0, 30.0, 14.0, 12.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6302337646484375, -0.615447998046875, -0.6006622314453125, -0.58587646484375, -0.5710906982421875, -0.556304931640625, -0.5415191650390625, -0.5267333984375, -0.5119476318359375, -0.497161865234375, -0.4823760986328125, -0.46759033203125, -0.4528045654296875, -0.438018798828125, -0.4232330322265625, -0.408447265625, -0.3936614990234375, -0.378875732421875, -0.3640899658203125, -0.34930419921875, -0.3345184326171875, -0.319732666015625, -0.3049468994140625, -0.2901611328125, -0.2753753662109375, -0.260589599609375, -0.2458038330078125, -0.23101806640625, -0.2162322998046875, -0.201446533203125, -0.1866607666015625, -0.171875, -0.1570892333984375, -0.142303466796875, -0.1275177001953125, -0.11273193359375, -0.0979461669921875, -0.083160400390625, -0.0683746337890625, -0.0535888671875, -0.0388031005859375, -0.024017333984375, -0.0092315673828125, 0.00555419921875, 0.0203399658203125, 0.035125732421875, 0.0499114990234375, 0.064697265625, 0.0794830322265625, 0.094268798828125, 0.1090545654296875, 0.12384033203125, 0.1386260986328125, 0.153411865234375, 0.1681976318359375, 0.1829833984375, 0.1977691650390625, 0.212554931640625, 0.2273406982421875, 0.24212646484375, 0.2569122314453125, 0.271697998046875, 0.2864837646484375, 0.30126953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 21.0, 29.0, 51.0, 91.0, 175.0, 233.0, 172.0, 95.0, 44.0, 20.0, 20.0, 8.0, 6.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8442435264587402, -2.7480037212371826, -2.651763916015625, -2.5555241107940674, -2.4592843055725098, -2.363044500350952, -2.2668046951293945, -2.170564889907837, -2.0743250846862793, -1.9780852794647217, -1.881845474243164, -1.7856056690216064, -1.6893658638000488, -1.5931260585784912, -1.4968862533569336, -1.400646448135376, -1.3044066429138184, -1.2081668376922607, -1.1119270324707031, -1.0156872272491455, -0.9194474220275879, -0.8232076168060303, -0.7269678115844727, -0.630728006362915, -0.5344882011413574, -0.4382483959197998, -0.3420085906982422, -0.24576878547668457, -0.14952898025512695, -0.053289175033569336, 0.04295063018798828, 0.1391904354095459, 0.23543024063110352, 0.33167004585266113, 0.42790985107421875, 0.5241496562957764, 0.620389461517334, 0.7166292667388916, 0.8128690719604492, 0.9091088771820068, 1.0053486824035645, 1.101588487625122, 1.1978282928466797, 1.2940680980682373, 1.390307903289795, 1.4865477085113525, 1.5827875137329102, 1.6790273189544678, 1.7752671241760254, 1.871506929397583, 1.9677467346191406, 2.0639865398406982, 2.160226345062256, 2.2564661502838135, 2.352705955505371, 2.4489457607269287, 2.5451855659484863, 2.641425371170044, 2.7376651763916016, 2.833904981613159, 2.930144786834717, 3.0263845920562744, 3.122624397277832, 3.2188642024993896, 3.3151040077209473]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 11.0, 15.0, 13.0, 34.0, 33.0, 51.0, 58.0, 67.0, 101.0, 93.0, 98.0, 72.0, 79.0, 68.0, 44.0, 48.0, 34.0, 26.0, 18.0, 9.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.323563575744629, -1.2810187339782715, -1.2384737730026245, -1.1959288120269775, -1.1533839702606201, -1.1108391284942627, -1.0682941675186157, -1.0257492065429688, -0.9832043647766113, -0.9406594634056091, -0.8981145620346069, -0.8555696606636047, -0.8130247592926025, -0.7704798579216003, -0.7279349565505981, -0.685390055179596, -0.6428451538085938, -0.6003002524375916, -0.5577553510665894, -0.5152104496955872, -0.47266554832458496, -0.43012064695358276, -0.38757574558258057, -0.34503084421157837, -0.30248594284057617, -0.259941041469574, -0.21739614009857178, -0.17485123872756958, -0.13230633735656738, -0.08976143598556519, -0.04721653461456299, -0.004671633243560791, 0.037873148918151855, 0.08041805028915405, 0.12296295166015625, 0.16550785303115845, 0.20805275440216064, 0.25059765577316284, 0.29314255714416504, 0.33568745851516724, 0.37823235988616943, 0.42077726125717163, 0.46332216262817383, 0.505867063999176, 0.5484119653701782, 0.5909568667411804, 0.6335017681121826, 0.6760466694831848, 0.718591570854187, 0.7611364722251892, 0.8036813735961914, 0.8462262749671936, 0.8887711763381958, 0.931316077709198, 0.9738609790802002, 1.0164058208465576, 1.0589507818222046, 1.1014957427978516, 1.144040584564209, 1.1865854263305664, 1.2291303873062134, 1.2716753482818604, 1.3142201900482178, 1.3567650318145752, 1.3993099927902222]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 13.0, 11.0, 21.0, 23.0, 38.0, 38.0, 60.0, 93.0, 108.0, 160.0, 238.0, 344.0, 741.0, 1722.0, 5014.0, 21411.0, 139342.0, 723542.0, 127380.0, 19826.0, 4858.0, 1661.0, 735.0, 423.0, 255.0, 154.0, 110.0, 63.0, 48.0, 30.0, 22.0, 21.0, 12.0, 5.0, 7.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.798370361328125, -1.73736572265625, -1.676361083984375, -1.6153564453125, -1.554351806640625, -1.49334716796875, -1.432342529296875, -1.371337890625, -1.310333251953125, -1.24932861328125, -1.188323974609375, -1.1273193359375, -1.066314697265625, -1.00531005859375, -0.944305419921875, -0.88330078125, -0.822296142578125, -0.76129150390625, -0.700286865234375, -0.6392822265625, -0.578277587890625, -0.51727294921875, -0.456268310546875, -0.395263671875, -0.334259033203125, -0.27325439453125, -0.212249755859375, -0.1512451171875, -0.090240478515625, -0.02923583984375, 0.031768798828125, 0.0927734375, 0.153778076171875, 0.21478271484375, 0.275787353515625, 0.3367919921875, 0.397796630859375, 0.45880126953125, 0.519805908203125, 0.580810546875, 0.641815185546875, 0.70281982421875, 0.763824462890625, 0.8248291015625, 0.885833740234375, 0.94683837890625, 1.007843017578125, 1.06884765625, 1.129852294921875, 1.19085693359375, 1.251861572265625, 1.3128662109375, 1.373870849609375, 1.43487548828125, 1.495880126953125, 1.556884765625, 1.617889404296875, 1.67889404296875, 1.739898681640625, 1.8009033203125, 1.861907958984375, 1.92291259765625, 1.983917236328125, 2.044921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 15.0, 7.0, 10.0, 17.0, 18.0, 28.0, 26.0, 36.0, 60.0, 60.0, 73.0, 85.0, 89.0, 80.0, 80.0, 72.0, 55.0, 47.0, 45.0, 24.0, 19.0, 13.0, 14.0, 5.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07904052734375, -0.0765371322631836, -0.07403373718261719, -0.07153034210205078, -0.06902694702148438, -0.06652355194091797, -0.06402015686035156, -0.061516761779785156, -0.05901336669921875, -0.056509971618652344, -0.05400657653808594, -0.05150318145751953, -0.048999786376953125, -0.04649639129638672, -0.04399299621582031, -0.041489601135253906, -0.0389862060546875, -0.036482810974121094, -0.03397941589355469, -0.03147602081298828, -0.028972625732421875, -0.02646923065185547, -0.023965835571289062, -0.021462440490722656, -0.01895904541015625, -0.016455650329589844, -0.013952255249023438, -0.011448860168457031, -0.008945465087890625, -0.006442070007324219, -0.0039386749267578125, -0.0014352798461914062, 0.001068115234375, 0.0035715103149414062, 0.0060749053955078125, 0.008578300476074219, 0.011081695556640625, 0.013585090637207031, 0.016088485717773438, 0.018591880798339844, 0.02109527587890625, 0.023598670959472656, 0.026102066040039062, 0.02860546112060547, 0.031108856201171875, 0.03361225128173828, 0.03611564636230469, 0.038619041442871094, 0.0411224365234375, 0.043625831604003906, 0.04612922668457031, 0.04863262176513672, 0.051136016845703125, 0.05363941192626953, 0.05614280700683594, 0.058646202087402344, 0.06114959716796875, 0.06365299224853516, 0.06615638732910156, 0.06865978240966797, 0.07116317749023438, 0.07366657257080078, 0.07616996765136719, 0.0786733627319336, 0.0811767578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 10.0, 8.0, 16.0, 24.0, 30.0, 51.0, 54.0, 72.0, 111.0, 148.0, 266.0, 401.0, 645.0, 1199.0, 2417.0, 5273.0, 13206.0, 42803.0, 198217.0, 556766.0, 167223.0, 37734.0, 11907.0, 4816.0, 2206.0, 1135.0, 641.0, 360.0, 218.0, 165.0, 111.0, 72.0, 53.0, 42.0, 31.0, 25.0, 17.0, 16.0, 9.0, 8.0, 8.0, 4.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0], "bins": [-1.0361328125, -1.0069046020507812, -0.9776763916015625, -0.9484481811523438, -0.919219970703125, -0.8899917602539062, -0.8607635498046875, -0.8315353393554688, -0.80230712890625, -0.7730789184570312, -0.7438507080078125, -0.7146224975585938, -0.685394287109375, -0.6561660766601562, -0.6269378662109375, -0.5977096557617188, -0.5684814453125, -0.5392532348632812, -0.5100250244140625, -0.48079681396484375, -0.451568603515625, -0.42234039306640625, -0.3931121826171875, -0.36388397216796875, -0.33465576171875, -0.30542755126953125, -0.2761993408203125, -0.24697113037109375, -0.217742919921875, -0.18851470947265625, -0.1592864990234375, -0.13005828857421875, -0.100830078125, -0.07160186767578125, -0.0423736572265625, -0.01314544677734375, 0.016082763671875, 0.04531097412109375, 0.0745391845703125, 0.10376739501953125, 0.13299560546875, 0.16222381591796875, 0.1914520263671875, 0.22068023681640625, 0.249908447265625, 0.27913665771484375, 0.3083648681640625, 0.33759307861328125, 0.3668212890625, 0.39604949951171875, 0.4252777099609375, 0.45450592041015625, 0.483734130859375, 0.5129623413085938, 0.5421905517578125, 0.5714187622070312, 0.60064697265625, 0.6298751831054688, 0.6591033935546875, 0.6883316040039062, 0.717559814453125, 0.7467880249023438, 0.7760162353515625, 0.8052444458007812, 0.83447265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 4.0, 9.0, 6.0, 13.0, 13.0, 24.0, 22.0, 31.0, 28.0, 39.0, 37.0, 51.0, 59.0, 66.0, 46.0, 59.0, 61.0, 62.0, 61.0, 49.0, 37.0, 33.0, 36.0, 28.0, 22.0, 22.0, 9.0, 12.0, 18.0, 9.0, 4.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.25943756103515625, -0.2488555908203125, -0.23827362060546875, -0.227691650390625, -0.21710968017578125, -0.2065277099609375, -0.19594573974609375, -0.18536376953125, -0.17478179931640625, -0.1641998291015625, -0.15361785888671875, -0.143035888671875, -0.13245391845703125, -0.1218719482421875, -0.11128997802734375, -0.1007080078125, -0.09012603759765625, -0.0795440673828125, -0.06896209716796875, -0.058380126953125, -0.04779815673828125, -0.0372161865234375, -0.02663421630859375, -0.01605224609375, -0.00547027587890625, 0.0051116943359375, 0.01569366455078125, 0.026275634765625, 0.03685760498046875, 0.0474395751953125, 0.05802154541015625, 0.068603515625, 0.07918548583984375, 0.0897674560546875, 0.10034942626953125, 0.110931396484375, 0.12151336669921875, 0.1320953369140625, 0.14267730712890625, 0.15325927734375, 0.16384124755859375, 0.1744232177734375, 0.18500518798828125, 0.195587158203125, 0.20616912841796875, 0.2167510986328125, 0.22733306884765625, 0.2379150390625, 0.24849700927734375, 0.2590789794921875, 0.26966094970703125, 0.280242919921875, 0.29082489013671875, 0.3014068603515625, 0.31198883056640625, 0.32257080078125, 0.33315277099609375, 0.3437347412109375, 0.35431671142578125, 0.364898681640625, 0.37548065185546875, 0.3860626220703125, 0.39664459228515625, 0.4072265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 5.0, 4.0, 5.0, 6.0, 7.0, 12.0, 9.0, 10.0, 13.0, 19.0, 27.0, 35.0, 44.0, 75.0, 133.0, 269.0, 511.0, 1061.0, 2334.0, 5621.0, 21086.0, 343644.0, 630201.0, 31059.0, 7006.0, 2754.0, 1246.0, 600.0, 289.0, 165.0, 87.0, 48.0, 33.0, 28.0, 23.0, 14.0, 17.0, 8.0, 12.0, 10.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8917617797851562, -0.8621368408203125, -0.8325119018554688, -0.802886962890625, -0.7732620239257812, -0.7436370849609375, -0.7140121459960938, -0.68438720703125, -0.6547622680664062, -0.6251373291015625, -0.5955123901367188, -0.565887451171875, -0.5362625122070312, -0.5066375732421875, -0.47701263427734375, -0.4473876953125, -0.41776275634765625, -0.3881378173828125, -0.35851287841796875, -0.328887939453125, -0.29926300048828125, -0.2696380615234375, -0.24001312255859375, -0.21038818359375, -0.18076324462890625, -0.1511383056640625, -0.12151336669921875, -0.091888427734375, -0.06226348876953125, -0.0326385498046875, -0.00301361083984375, 0.026611328125, 0.05623626708984375, 0.0858612060546875, 0.11548614501953125, 0.145111083984375, 0.17473602294921875, 0.2043609619140625, 0.23398590087890625, 0.26361083984375, 0.29323577880859375, 0.3228607177734375, 0.35248565673828125, 0.382110595703125, 0.41173553466796875, 0.4413604736328125, 0.47098541259765625, 0.5006103515625, 0.5302352905273438, 0.5598602294921875, 0.5894851684570312, 0.619110107421875, 0.6487350463867188, 0.6783599853515625, 0.7079849243164062, 0.73760986328125, 0.7672348022460938, 0.7968597412109375, 0.8264846801757812, 0.856109619140625, 0.8857345581054688, 0.9153594970703125, 0.9449844360351562, 0.974609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 11.0, 16.0, 16.0, 26.0, 42.0, 52.0, 83.0, 114.0, 145.0, 134.0, 93.0, 67.0, 61.0, 26.0, 26.0, 17.0, 15.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620189666748047e-05, -9.298045188188553e-05, -8.975900709629059e-05, -8.653756231069565e-05, -8.331611752510071e-05, -8.009467273950577e-05, -7.687322795391083e-05, -7.365178316831589e-05, -7.043033838272095e-05, -6.720889359712601e-05, -6.398744881153107e-05, -6.076600402593613e-05, -5.7544559240341187e-05, -5.4323114454746246e-05, -5.1101669669151306e-05, -4.7880224883556366e-05, -4.4658780097961426e-05, -4.1437335312366486e-05, -3.8215890526771545e-05, -3.4994445741176605e-05, -3.1773000955581665e-05, -2.8551556169986725e-05, -2.5330111384391785e-05, -2.2108666598796844e-05, -1.8887221813201904e-05, -1.5665777027606964e-05, -1.2444332242012024e-05, -9.222887456417084e-06, -6.0014426708221436e-06, -2.7799978852272034e-06, 4.414469003677368e-07, 3.662891685962677e-06, 6.884336471557617e-06, 1.0105781257152557e-05, 1.3327226042747498e-05, 1.6548670828342438e-05, 1.9770115613937378e-05, 2.2991560399532318e-05, 2.6213005185127258e-05, 2.94344499707222e-05, 3.265589475631714e-05, 3.587733954191208e-05, 3.909878432750702e-05, 4.232022911310196e-05, 4.55416738986969e-05, 4.876311868429184e-05, 5.198456346988678e-05, 5.520600825548172e-05, 5.842745304107666e-05, 6.16488978266716e-05, 6.487034261226654e-05, 6.809178739786148e-05, 7.131323218345642e-05, 7.453467696905136e-05, 7.77561217546463e-05, 8.097756654024124e-05, 8.419901132583618e-05, 8.742045611143112e-05, 9.064190089702606e-05, 9.3863345682621e-05, 9.708479046821594e-05, 0.00010030623525381088, 0.00010352768003940582, 0.00010674912482500076, 0.0001099705696105957]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 3.0, 7.0, 6.0, 10.0, 16.0, 13.0, 23.0, 38.0, 52.0, 87.0, 145.0, 238.0, 462.0, 879.0, 1784.0, 3996.0, 12051.0, 84723.0, 858443.0, 67261.0, 10858.0, 3898.0, 1733.0, 758.0, 419.0, 225.0, 152.0, 74.0, 55.0, 40.0, 16.0, 16.0, 17.0, 8.0, 12.0, 6.0, 1.0, 11.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9677734375, -0.9388504028320312, -0.9099273681640625, -0.8810043334960938, -0.852081298828125, -0.8231582641601562, -0.7942352294921875, -0.7653121948242188, -0.73638916015625, -0.7074661254882812, -0.6785430908203125, -0.6496200561523438, -0.620697021484375, -0.5917739868164062, -0.5628509521484375, -0.5339279174804688, -0.5050048828125, -0.47608184814453125, -0.4471588134765625, -0.41823577880859375, -0.389312744140625, -0.36038970947265625, -0.3314666748046875, -0.30254364013671875, -0.27362060546875, -0.24469757080078125, -0.2157745361328125, -0.18685150146484375, -0.157928466796875, -0.12900543212890625, -0.1000823974609375, -0.07115936279296875, -0.042236328125, -0.01331329345703125, 0.0156097412109375, 0.04453277587890625, 0.073455810546875, 0.10237884521484375, 0.1313018798828125, 0.16022491455078125, 0.18914794921875, 0.21807098388671875, 0.2469940185546875, 0.27591705322265625, 0.304840087890625, 0.33376312255859375, 0.3626861572265625, 0.39160919189453125, 0.4205322265625, 0.44945526123046875, 0.4783782958984375, 0.5073013305664062, 0.536224365234375, 0.5651473999023438, 0.5940704345703125, 0.6229934692382812, 0.65191650390625, 0.6808395385742188, 0.7097625732421875, 0.7386856079101562, 0.767608642578125, 0.7965316772460938, 0.8254547119140625, 0.8543777465820312, 0.88330078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 5.0, 3.0, 12.0, 16.0, 30.0, 46.0, 89.0, 134.0, 163.0, 180.0, 128.0, 85.0, 33.0, 20.0, 18.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5918960571289062, -0.5744171142578125, -0.5569381713867188, -0.539459228515625, -0.5219802856445312, -0.5045013427734375, -0.48702239990234375, -0.46954345703125, -0.45206451416015625, -0.4345855712890625, -0.41710662841796875, -0.399627685546875, -0.38214874267578125, -0.3646697998046875, -0.34719085693359375, -0.3297119140625, -0.31223297119140625, -0.2947540283203125, -0.27727508544921875, -0.259796142578125, -0.24231719970703125, -0.2248382568359375, -0.20735931396484375, -0.18988037109375, -0.17240142822265625, -0.1549224853515625, -0.13744354248046875, -0.119964599609375, -0.10248565673828125, -0.0850067138671875, -0.06752777099609375, -0.050048828125, -0.03256988525390625, -0.0150909423828125, 0.00238800048828125, 0.019866943359375, 0.03734588623046875, 0.0548248291015625, 0.07230377197265625, 0.08978271484375, 0.10726165771484375, 0.1247406005859375, 0.14221954345703125, 0.159698486328125, 0.17717742919921875, 0.1946563720703125, 0.21213531494140625, 0.2296142578125, 0.24709320068359375, 0.2645721435546875, 0.28205108642578125, 0.299530029296875, 0.31700897216796875, 0.3344879150390625, 0.35196685791015625, 0.36944580078125, 0.38692474365234375, 0.4044036865234375, 0.42188262939453125, 0.439361572265625, 0.45684051513671875, 0.4743194580078125, 0.49179840087890625, 0.50927734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 8.0, 20.0, 57.0, 132.0, 281.0, 283.0, 135.0, 47.0, 15.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.259020805358887, -4.906360149383545, -4.553699493408203, -4.201038360595703, -3.8483779430389404, -3.4957172870635986, -3.1430563926696777, -2.790395736694336, -2.437735080718994, -2.0850744247436523, -1.732413649559021, -1.3797528743743896, -1.0270922183990479, -0.674431562423706, -0.32177066802978516, 0.03088998794555664, 0.38355064392089844, 0.736211359500885, 1.0888720750808716, 1.441532850265503, 1.7941935062408447, 2.1468541622161865, 2.4995150566101074, 2.852175712585449, 3.204836368560791, 3.557497024536133, 3.9101576805114746, 4.262818336486816, 4.615479469299316, 4.9681396484375, 5.32080078125, 5.673461437225342, 6.026123046875, 6.378783702850342, 6.731444358825684, 7.084105491638184, 7.436765670776367, 7.789426803588867, 8.142087936401367, 8.49474811553955, 8.847408294677734, 9.200069427490234, 9.552729606628418, 9.905390739440918, 10.258050918579102, 10.610712051391602, 10.963373184204102, 11.316033363342285, 11.668694496154785, 12.021355628967285, 12.374015808105469, 12.726676940917969, 13.079337120056152, 13.431998252868652, 13.784658432006836, 14.137319564819336, 14.489980697631836, 14.842641830444336, 15.19530200958252, 15.54796314239502, 15.900623321533203, 16.253284454345703, 16.605945587158203, 16.958606719970703, 17.31126594543457]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 10.0, 4.0, 7.0, 8.0, 11.0, 16.0, 15.0, 17.0, 20.0, 25.0, 34.0, 35.0, 45.0, 55.0, 37.0, 47.0, 53.0, 48.0, 53.0, 39.0, 39.0, 43.0, 42.0, 32.0, 43.0, 30.0, 33.0, 27.0, 23.0, 25.0, 14.0, 13.0, 11.0, 11.0, 13.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9902983903884888, -1.9242666959762573, -1.8582348823547363, -1.7922031879425049, -1.7261714935302734, -1.6601396799087524, -1.594107985496521, -1.528076171875, -1.4620444774627686, -1.396012783050537, -1.3299809694290161, -1.2639492750167847, -1.1979174613952637, -1.1318857669830322, -1.0658540725708008, -0.9998223185539246, -0.9337905645370483, -0.8677588105201721, -0.8017270565032959, -0.7356953620910645, -0.6696636080741882, -0.603631854057312, -0.5376001596450806, -0.47156840562820435, -0.4055366516113281, -0.3395048975944519, -0.27347317337989807, -0.20744143426418304, -0.14140969514846802, -0.0753779411315918, -0.009346216917037964, 0.05668550729751587, 0.12271714210510254, 0.18874888122081757, 0.2547806203365326, 0.3208123445510864, 0.38684409856796265, 0.45287585258483887, 0.5189075469970703, 0.5849393010139465, 0.6509710550308228, 0.717002809047699, 0.7830345630645752, 0.8490662574768066, 0.9150980114936829, 0.9811297655105591, 1.0471614599227905, 1.1131932735443115, 1.179224967956543, 1.2452566623687744, 1.3112884759902954, 1.3773201704025269, 1.4433519840240479, 1.5093836784362793, 1.5754153728485107, 1.6414470672607422, 1.7074788808822632, 1.7735105752944946, 1.8395423889160156, 1.905574083328247, 1.9716057777404785, 2.037637710571289, 2.1036694049835205, 2.169701099395752, 2.2357327938079834]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 19.0, 22.0, 27.0, 32.0, 47.0, 77.0, 101.0, 188.0, 352.0, 687.0, 1592.0, 4478.0, 16597.0, 145355.0, 3937263.0, 69617.0, 11785.0, 3504.0, 1202.0, 515.0, 290.0, 156.0, 101.0, 63.0, 44.0, 36.0, 25.0, 24.0, 7.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.27734375, -2.2129669189453125, -2.148590087890625, -2.0842132568359375, -2.01983642578125, -1.9554595947265625, -1.891082763671875, -1.8267059326171875, -1.7623291015625, -1.6979522705078125, -1.633575439453125, -1.5691986083984375, -1.50482177734375, -1.4404449462890625, -1.376068115234375, -1.3116912841796875, -1.247314453125, -1.1829376220703125, -1.118560791015625, -1.0541839599609375, -0.98980712890625, -0.9254302978515625, -0.861053466796875, -0.7966766357421875, -0.7322998046875, -0.6679229736328125, -0.603546142578125, -0.5391693115234375, -0.47479248046875, -0.4104156494140625, -0.346038818359375, -0.2816619873046875, -0.21728515625, -0.1529083251953125, -0.088531494140625, -0.0241546630859375, 0.04022216796875, 0.1045989990234375, 0.168975830078125, 0.2333526611328125, 0.2977294921875, 0.3621063232421875, 0.426483154296875, 0.4908599853515625, 0.55523681640625, 0.6196136474609375, 0.683990478515625, 0.7483673095703125, 0.812744140625, 0.8771209716796875, 0.941497802734375, 1.0058746337890625, 1.07025146484375, 1.1346282958984375, 1.199005126953125, 1.2633819580078125, 1.3277587890625, 1.3921356201171875, 1.456512451171875, 1.5208892822265625, 1.58526611328125, 1.6496429443359375, 1.714019775390625, 1.7783966064453125, 1.8427734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 12.0, 12.0, 9.0, 18.0, 21.0, 34.0, 30.0, 47.0, 50.0, 56.0, 70.0, 76.0, 74.0, 68.0, 64.0, 78.0, 49.0, 49.0, 46.0, 26.0, 28.0, 24.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07724857330322266, -0.07472419738769531, -0.07219982147216797, -0.06967544555664062, -0.06715106964111328, -0.06462669372558594, -0.062102317810058594, -0.05957794189453125, -0.057053565979003906, -0.05452919006347656, -0.05200481414794922, -0.049480438232421875, -0.04695606231689453, -0.04443168640136719, -0.041907310485839844, -0.0393829345703125, -0.036858558654785156, -0.03433418273925781, -0.03180980682373047, -0.029285430908203125, -0.02676105499267578, -0.024236679077148438, -0.021712303161621094, -0.01918792724609375, -0.016663551330566406, -0.014139175415039062, -0.011614799499511719, -0.009090423583984375, -0.006566047668457031, -0.0040416717529296875, -0.0015172958374023438, 0.001007080078125, 0.0035314559936523438, 0.0060558319091796875, 0.008580207824707031, 0.011104583740234375, 0.013628959655761719, 0.016153335571289062, 0.018677711486816406, 0.02120208740234375, 0.023726463317871094, 0.026250839233398438, 0.02877521514892578, 0.031299591064453125, 0.03382396697998047, 0.03634834289550781, 0.038872718811035156, 0.0413970947265625, 0.043921470642089844, 0.04644584655761719, 0.04897022247314453, 0.051494598388671875, 0.05401897430419922, 0.05654335021972656, 0.059067726135253906, 0.06159210205078125, 0.0641164779663086, 0.06664085388183594, 0.06916522979736328, 0.07168960571289062, 0.07421398162841797, 0.07673835754394531, 0.07926273345947266, 0.081787109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 13.0, 18.0, 37.0, 64.0, 83.0, 146.0, 225.0, 506.0, 1123.0, 4778.0, 43184.0, 4038933.0, 94837.0, 7418.0, 1609.0, 535.0, 301.0, 156.0, 133.0, 69.0, 31.0, 29.0, 20.0, 10.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.683685302734375, -1.59783935546875, -1.511993408203125, -1.4261474609375, -1.340301513671875, -1.25445556640625, -1.168609619140625, -1.082763671875, -0.996917724609375, -0.91107177734375, -0.825225830078125, -0.7393798828125, -0.653533935546875, -0.56768798828125, -0.481842041015625, -0.39599609375, -0.310150146484375, -0.22430419921875, -0.138458251953125, -0.0526123046875, 0.033233642578125, 0.11907958984375, 0.204925537109375, 0.290771484375, 0.376617431640625, 0.46246337890625, 0.548309326171875, 0.6341552734375, 0.720001220703125, 0.80584716796875, 0.891693115234375, 0.9775390625, 1.063385009765625, 1.14923095703125, 1.235076904296875, 1.3209228515625, 1.406768798828125, 1.49261474609375, 1.578460693359375, 1.664306640625, 1.750152587890625, 1.83599853515625, 1.921844482421875, 2.0076904296875, 2.093536376953125, 2.17938232421875, 2.265228271484375, 2.35107421875, 2.436920166015625, 2.52276611328125, 2.608612060546875, 2.6944580078125, 2.780303955078125, 2.86614990234375, 2.951995849609375, 3.037841796875, 3.123687744140625, 3.20953369140625, 3.295379638671875, 3.3812255859375, 3.467071533203125, 3.55291748046875, 3.638763427734375, 3.724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 9.0, 15.0, 15.0, 55.0, 128.0, 357.0, 2417.0, 764.0, 155.0, 76.0, 33.0, 16.0, 12.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265869140625, -0.24998092651367188, -0.23409271240234375, -0.21820449829101562, -0.2023162841796875, -0.18642807006835938, -0.17053985595703125, -0.15465164184570312, -0.138763427734375, -0.12287521362304688, -0.10698699951171875, -0.09109878540039062, -0.0752105712890625, -0.059322357177734375, -0.04343414306640625, -0.027545928955078125, -0.01165771484375, 0.004230499267578125, 0.02011871337890625, 0.036006927490234375, 0.0518951416015625, 0.06778335571289062, 0.08367156982421875, 0.09955978393554688, 0.115447998046875, 0.13133621215820312, 0.14722442626953125, 0.16311264038085938, 0.1790008544921875, 0.19488906860351562, 0.21077728271484375, 0.22666549682617188, 0.2425537109375, 0.2584419250488281, 0.27433013916015625, 0.2902183532714844, 0.3061065673828125, 0.3219947814941406, 0.33788299560546875, 0.3537712097167969, 0.369659423828125, 0.3855476379394531, 0.40143585205078125, 0.4173240661621094, 0.4332122802734375, 0.4491004943847656, 0.46498870849609375, 0.4808769226074219, 0.49676513671875, 0.5126533508300781, 0.5285415649414062, 0.5444297790527344, 0.5603179931640625, 0.5762062072753906, 0.5920944213867188, 0.6079826354980469, 0.623870849609375, 0.6397590637207031, 0.6556472778320312, 0.6715354919433594, 0.6874237060546875, 0.7033119201660156, 0.7192001342773438, 0.7350883483886719, 0.7509765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 22.0, 188.0, 610.0, 165.0, 15.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.36672592163086, -12.106424331665039, -11.846122741699219, -11.585821151733398, -11.325519561767578, -11.065218925476074, -10.804917335510254, -10.544615745544434, -10.284314155578613, -10.024012565612793, -9.763710975646973, -9.503409385681152, -9.243108749389648, -8.982807159423828, -8.722505569458008, -8.462203979492188, -8.201902389526367, -7.941600799560547, -7.681299209594727, -7.4209980964660645, -7.160696506500244, -6.900394916534424, -6.640093803405762, -6.379792213439941, -6.119490623474121, -5.859189033508301, -5.5988874435424805, -5.338586330413818, -5.078284740447998, -4.817983150482178, -4.557682037353516, -4.297380447387695, -4.037079811096191, -3.776778221130371, -3.51647686958313, -3.2561755180358887, -2.9958739280700684, -2.735572338104248, -2.475270986557007, -2.2149696350097656, -1.9546680450439453, -1.6943665742874146, -1.4340651035308838, -1.173763632774353, -0.9134621620178223, -0.6531606912612915, -0.39285922050476074, -0.13255774974822998, 0.12774372100830078, 0.38804519176483154, 0.6483466625213623, 0.9086481332778931, 1.1689496040344238, 1.4292510747909546, 1.6895525455474854, 1.9498540163040161, 2.210155487060547, 2.470457077026367, 2.7307584285736084, 2.9910597801208496, 3.25136137008667, 3.5116629600524902, 3.7719643115997314, 4.032265663146973, 4.292567253112793]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 12.0, 8.0, 16.0, 23.0, 31.0, 40.0, 46.0, 59.0, 81.0, 77.0, 85.0, 91.0, 91.0, 70.0, 72.0, 64.0, 39.0, 31.0, 20.0, 20.0, 13.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0033044815063477, -1.9571845531463623, -1.911064624786377, -1.864944577217102, -1.8188246488571167, -1.7727047204971313, -1.7265846729278564, -1.680464744567871, -1.6343448162078857, -1.5882248878479004, -1.542104959487915, -1.4959849119186401, -1.4498649835586548, -1.4037450551986694, -1.3576250076293945, -1.3115050792694092, -1.2653851509094238, -1.2192652225494385, -1.1731452941894531, -1.1270252466201782, -1.0809053182601929, -1.0347853899002075, -0.9886654019355774, -0.9425454139709473, -0.8964254856109619, -0.8503055572509766, -0.8041855692863464, -0.7580655813217163, -0.711945652961731, -0.6658257246017456, -0.6197057366371155, -0.5735857486724854, -0.5274658203125, -0.48134586215019226, -0.4352259039878845, -0.3891059458255768, -0.34298598766326904, -0.2968660295009613, -0.25074607133865356, -0.20462611317634583, -0.15850615501403809, -0.11238619685173035, -0.06626623868942261, -0.020146280527114868, 0.02597367763519287, 0.07209363579750061, 0.11821359395980835, 0.1643335521221161, 0.21045351028442383, 0.25657346844673157, 0.3026934266090393, 0.34881338477134705, 0.3949333429336548, 0.4410533010959625, 0.48717325925827026, 0.5332932472229004, 0.5794131755828857, 0.6255331039428711, 0.6716530919075012, 0.7177730798721313, 0.7638930082321167, 0.810012936592102, 0.8561329245567322, 0.9022529125213623, 0.9483728408813477]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 13.0, 13.0, 25.0, 45.0, 105.0, 125.0, 258.0, 506.0, 1029.0, 2966.0, 15705.0, 222424.0, 742703.0, 53195.0, 6299.0, 1718.0, 674.0, 300.0, 173.0, 90.0, 71.0, 34.0, 19.0, 15.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.5792694091796875, -1.501312255859375, -1.4233551025390625, -1.34539794921875, -1.2674407958984375, -1.189483642578125, -1.1115264892578125, -1.0335693359375, -0.9556121826171875, -0.877655029296875, -0.7996978759765625, -0.72174072265625, -0.6437835693359375, -0.565826416015625, -0.4878692626953125, -0.409912109375, -0.3319549560546875, -0.253997802734375, -0.1760406494140625, -0.09808349609375, -0.0201263427734375, 0.057830810546875, 0.1357879638671875, 0.2137451171875, 0.2917022705078125, 0.369659423828125, 0.4476165771484375, 0.52557373046875, 0.6035308837890625, 0.681488037109375, 0.7594451904296875, 0.83740234375, 0.9153594970703125, 0.993316650390625, 1.0712738037109375, 1.14923095703125, 1.2271881103515625, 1.305145263671875, 1.3831024169921875, 1.4610595703125, 1.5390167236328125, 1.616973876953125, 1.6949310302734375, 1.77288818359375, 1.8508453369140625, 1.928802490234375, 2.0067596435546875, 2.084716796875, 2.1626739501953125, 2.240631103515625, 2.3185882568359375, 2.39654541015625, 2.4745025634765625, 2.552459716796875, 2.6304168701171875, 2.7083740234375, 2.7863311767578125, 2.864288330078125, 2.9422454833984375, 3.02020263671875, 3.0981597900390625, 3.176116943359375, 3.2540740966796875, 3.33203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 11.0, 11.0, 24.0, 33.0, 37.0, 46.0, 40.0, 52.0, 68.0, 68.0, 64.0, 59.0, 66.0, 76.0, 52.0, 60.0, 46.0, 49.0, 36.0, 17.0, 29.0, 12.0, 15.0, 7.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.1166067123413086, -0.11364555358886719, -0.11068439483642578, -0.10772323608398438, -0.10476207733154297, -0.10180091857910156, -0.09883975982666016, -0.09587860107421875, -0.09291744232177734, -0.08995628356933594, -0.08699512481689453, -0.08403396606445312, -0.08107280731201172, -0.07811164855957031, -0.0751504898071289, -0.0721893310546875, -0.0692281723022461, -0.06626701354980469, -0.06330585479736328, -0.060344696044921875, -0.05738353729248047, -0.05442237854003906, -0.051461219787597656, -0.04850006103515625, -0.045538902282714844, -0.04257774353027344, -0.03961658477783203, -0.036655426025390625, -0.03369426727294922, -0.030733108520507812, -0.027771949768066406, -0.024810791015625, -0.021849632263183594, -0.018888473510742188, -0.01592731475830078, -0.012966156005859375, -0.010004997253417969, -0.0070438385009765625, -0.004082679748535156, -0.00112152099609375, 0.0018396377563476562, 0.0048007965087890625, 0.007761955261230469, 0.010723114013671875, 0.013684272766113281, 0.016645431518554688, 0.019606590270996094, 0.0225677490234375, 0.025528907775878906, 0.028490066528320312, 0.03145122528076172, 0.034412384033203125, 0.03737354278564453, 0.04033470153808594, 0.043295860290527344, 0.04625701904296875, 0.049218177795410156, 0.05217933654785156, 0.05514049530029297, 0.058101654052734375, 0.06106281280517578, 0.06402397155761719, 0.0669851303100586, 0.0699462890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 10.0, 13.0, 12.0, 30.0, 32.0, 44.0, 59.0, 138.0, 271.0, 455.0, 906.0, 2155.0, 6676.0, 30094.0, 282497.0, 637434.0, 69850.0, 11819.0, 3429.0, 1220.0, 621.0, 312.0, 169.0, 114.0, 52.0, 38.0, 37.0, 17.0, 10.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8408203125, -1.788543701171875, -1.73626708984375, -1.683990478515625, -1.6317138671875, -1.579437255859375, -1.52716064453125, -1.474884033203125, -1.422607421875, -1.370330810546875, -1.31805419921875, -1.265777587890625, -1.2135009765625, -1.161224365234375, -1.10894775390625, -1.056671142578125, -1.00439453125, -0.952117919921875, -0.89984130859375, -0.847564697265625, -0.7952880859375, -0.743011474609375, -0.69073486328125, -0.638458251953125, -0.586181640625, -0.533905029296875, -0.48162841796875, -0.429351806640625, -0.3770751953125, -0.324798583984375, -0.27252197265625, -0.220245361328125, -0.16796875, -0.115692138671875, -0.06341552734375, -0.011138916015625, 0.0411376953125, 0.093414306640625, 0.14569091796875, 0.197967529296875, 0.250244140625, 0.302520751953125, 0.35479736328125, 0.407073974609375, 0.4593505859375, 0.511627197265625, 0.56390380859375, 0.616180419921875, 0.66845703125, 0.720733642578125, 0.77301025390625, 0.825286865234375, 0.8775634765625, 0.929840087890625, 0.98211669921875, 1.034393310546875, 1.086669921875, 1.138946533203125, 1.19122314453125, 1.243499755859375, 1.2957763671875, 1.348052978515625, 1.40032958984375, 1.452606201171875, 1.5048828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 7.0, 9.0, 9.0, 7.0, 18.0, 18.0, 22.0, 20.0, 31.0, 26.0, 26.0, 20.0, 46.0, 49.0, 47.0, 45.0, 53.0, 38.0, 39.0, 43.0, 59.0, 54.0, 31.0, 51.0, 28.0, 31.0, 24.0, 23.0, 15.0, 24.0, 24.0, 11.0, 18.0, 10.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3369140625, -0.3252067565917969, -0.31349945068359375, -0.3017921447753906, -0.2900848388671875, -0.2783775329589844, -0.26667022705078125, -0.2549629211425781, -0.243255615234375, -0.23154830932617188, -0.21984100341796875, -0.20813369750976562, -0.1964263916015625, -0.18471908569335938, -0.17301177978515625, -0.16130447387695312, -0.14959716796875, -0.13788986206054688, -0.12618255615234375, -0.11447525024414062, -0.1027679443359375, -0.09106063842773438, -0.07935333251953125, -0.06764602661132812, -0.055938720703125, -0.044231414794921875, -0.03252410888671875, -0.020816802978515625, -0.0091094970703125, 0.002597808837890625, 0.01430511474609375, 0.026012420654296875, 0.0377197265625, 0.049427032470703125, 0.06113433837890625, 0.07284164428710938, 0.0845489501953125, 0.09625625610351562, 0.10796356201171875, 0.11967086791992188, 0.131378173828125, 0.14308547973632812, 0.15479278564453125, 0.16650009155273438, 0.1782073974609375, 0.18991470336914062, 0.20162200927734375, 0.21332931518554688, 0.22503662109375, 0.23674392700195312, 0.24845123291015625, 0.2601585388183594, 0.2718658447265625, 0.2835731506347656, 0.29528045654296875, 0.3069877624511719, 0.318695068359375, 0.3304023742675781, 0.34210968017578125, 0.3538169860839844, 0.3655242919921875, 0.3772315979003906, 0.38893890380859375, 0.4006462097167969, 0.412353515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 10.0, 14.0, 20.0, 15.0, 32.0, 50.0, 82.0, 192.0, 471.0, 989.0, 2354.0, 6979.0, 48642.0, 830110.0, 141664.0, 11168.0, 3242.0, 1326.0, 566.0, 285.0, 121.0, 62.0, 38.0, 37.0, 16.0, 8.0, 14.0, 7.0, 3.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9551849365234375, -0.925018310546875, -0.8948516845703125, -0.86468505859375, -0.8345184326171875, -0.804351806640625, -0.7741851806640625, -0.7440185546875, -0.7138519287109375, -0.683685302734375, -0.6535186767578125, -0.62335205078125, -0.5931854248046875, -0.563018798828125, -0.5328521728515625, -0.502685546875, -0.4725189208984375, -0.442352294921875, -0.4121856689453125, -0.38201904296875, -0.3518524169921875, -0.321685791015625, -0.2915191650390625, -0.2613525390625, -0.2311859130859375, -0.201019287109375, -0.1708526611328125, -0.14068603515625, -0.1105194091796875, -0.080352783203125, -0.0501861572265625, -0.02001953125, 0.0101470947265625, 0.040313720703125, 0.0704803466796875, 0.10064697265625, 0.1308135986328125, 0.160980224609375, 0.1911468505859375, 0.2213134765625, 0.2514801025390625, 0.281646728515625, 0.3118133544921875, 0.34197998046875, 0.3721466064453125, 0.402313232421875, 0.4324798583984375, 0.462646484375, 0.4928131103515625, 0.522979736328125, 0.5531463623046875, 0.58331298828125, 0.6134796142578125, 0.643646240234375, 0.6738128662109375, 0.7039794921875, 0.7341461181640625, 0.764312744140625, 0.7944793701171875, 0.82464599609375, 0.8548126220703125, 0.884979248046875, 0.9151458740234375, 0.9453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 36.0, 52.0, 128.0, 198.0, 257.0, 145.0, 68.0, 37.0, 16.0, 16.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000125885009765625, -0.00011967122554779053, -0.00011345744132995605, -0.00010724365711212158, -0.00010102987289428711, -9.481608867645264e-05, -8.860230445861816e-05, -8.238852024078369e-05, -7.617473602294922e-05, -6.996095180511475e-05, -6.374716758728027e-05, -5.75333833694458e-05, -5.131959915161133e-05, -4.5105814933776855e-05, -3.889203071594238e-05, -3.267824649810791e-05, -2.6464462280273438e-05, -2.0250678062438965e-05, -1.4036893844604492e-05, -7.82310962677002e-06, -1.6093254089355469e-06, 4.604458808898926e-06, 1.0818243026733398e-05, 1.703202724456787e-05, 2.3245811462402344e-05, 2.9459595680236816e-05, 3.567337989807129e-05, 4.188716411590576e-05, 4.8100948333740234e-05, 5.431473255157471e-05, 6.052851676940918e-05, 6.674230098724365e-05, 7.295608520507812e-05, 7.91698694229126e-05, 8.538365364074707e-05, 9.159743785858154e-05, 9.781122207641602e-05, 0.00010402500629425049, 0.00011023879051208496, 0.00011645257472991943, 0.0001226663589477539, 0.00012888014316558838, 0.00013509392738342285, 0.00014130771160125732, 0.0001475214958190918, 0.00015373528003692627, 0.00015994906425476074, 0.00016616284847259521, 0.0001723766326904297, 0.00017859041690826416, 0.00018480420112609863, 0.0001910179853439331, 0.00019723176956176758, 0.00020344555377960205, 0.00020965933799743652, 0.000215873122215271, 0.00022208690643310547, 0.00022830069065093994, 0.00023451447486877441, 0.0002407282590866089, 0.00024694204330444336, 0.00025315582752227783, 0.0002593696117401123, 0.0002655833959579468, 0.00027179718017578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 1.0, 4.0, 11.0, 10.0, 17.0, 29.0, 31.0, 44.0, 58.0, 108.0, 148.0, 296.0, 513.0, 1029.0, 2301.0, 6371.0, 34281.0, 662494.0, 313312.0, 19214.0, 4528.0, 1783.0, 829.0, 476.0, 238.0, 137.0, 93.0, 64.0, 45.0, 29.0, 14.0, 12.0, 8.0, 10.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.0302734375, -1.0037612915039062, -0.9772491455078125, -0.9507369995117188, -0.924224853515625, -0.8977127075195312, -0.8712005615234375, -0.8446884155273438, -0.81817626953125, -0.7916641235351562, -0.7651519775390625, -0.7386398315429688, -0.712127685546875, -0.6856155395507812, -0.6591033935546875, -0.6325912475585938, -0.6060791015625, -0.5795669555664062, -0.5530548095703125, -0.5265426635742188, -0.500030517578125, -0.47351837158203125, -0.4470062255859375, -0.42049407958984375, -0.39398193359375, -0.36746978759765625, -0.3409576416015625, -0.31444549560546875, -0.287933349609375, -0.26142120361328125, -0.2349090576171875, -0.20839691162109375, -0.181884765625, -0.15537261962890625, -0.1288604736328125, -0.10234832763671875, -0.075836181640625, -0.04932403564453125, -0.0228118896484375, 0.00370025634765625, 0.03021240234375, 0.05672454833984375, 0.0832366943359375, 0.10974884033203125, 0.136260986328125, 0.16277313232421875, 0.1892852783203125, 0.21579742431640625, 0.2423095703125, 0.26882171630859375, 0.2953338623046875, 0.32184600830078125, 0.348358154296875, 0.37487030029296875, 0.4013824462890625, 0.42789459228515625, 0.45440673828125, 0.48091888427734375, 0.5074310302734375, 0.5339431762695312, 0.560455322265625, 0.5869674682617188, 0.6134796142578125, 0.6399917602539062, 0.66650390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 13.0, 25.0, 31.0, 47.0, 60.0, 103.0, 103.0, 114.0, 139.0, 105.0, 71.0, 76.0, 32.0, 20.0, 17.0, 4.0, 5.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5825843811035156, -0.5680007934570312, -0.5534172058105469, -0.5388336181640625, -0.5242500305175781, -0.5096664428710938, -0.4950828552246094, -0.480499267578125, -0.4659156799316406, -0.45133209228515625, -0.4367485046386719, -0.4221649169921875, -0.4075813293457031, -0.39299774169921875, -0.3784141540527344, -0.36383056640625, -0.3492469787597656, -0.33466339111328125, -0.3200798034667969, -0.3054962158203125, -0.2909126281738281, -0.27632904052734375, -0.2617454528808594, -0.247161865234375, -0.23257827758789062, -0.21799468994140625, -0.20341110229492188, -0.1888275146484375, -0.17424392700195312, -0.15966033935546875, -0.14507675170898438, -0.1304931640625, -0.11590957641601562, -0.10132598876953125, -0.08674240112304688, -0.0721588134765625, -0.057575225830078125, -0.04299163818359375, -0.028408050537109375, -0.013824462890625, 0.000759124755859375, 0.01534271240234375, 0.029926300048828125, 0.0445098876953125, 0.059093475341796875, 0.07367706298828125, 0.08826065063476562, 0.10284423828125, 0.11742782592773438, 0.13201141357421875, 0.14659500122070312, 0.1611785888671875, 0.17576217651367188, 0.19034576416015625, 0.20492935180664062, 0.219512939453125, 0.23409652709960938, 0.24868011474609375, 0.2632637023925781, 0.2778472900390625, 0.2924308776855469, 0.30701446533203125, 0.3215980529785156, 0.336181640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 13.0, 22.0, 39.0, 67.0, 116.0, 185.0, 232.0, 143.0, 89.0, 46.0, 14.0, 15.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.83360767364502, -11.560700416564941, -11.28779411315918, -11.014886856079102, -10.741979598999023, -10.469073295593262, -10.196166038513184, -9.923258781433105, -9.650352478027344, -9.377445220947266, -9.104538917541504, -8.831631660461426, -8.558724403381348, -8.285818099975586, -8.012910842895508, -7.740004062652588, -7.46709680557251, -7.19419002532959, -6.921282768249512, -6.648375988006592, -6.375469207763672, -6.102561950683594, -5.829655170440674, -5.556748390197754, -5.283841133117676, -5.010934352874756, -4.738027095794678, -4.465120315551758, -4.192213535308838, -3.919306516647339, -3.64639949798584, -3.37349271774292, -3.100586414337158, -2.827679395675659, -2.5547726154327393, -2.2818655967712402, -2.0089588165283203, -1.7360517978668213, -1.4631447792053223, -1.1902378797531128, -0.9173309803009033, -0.6444240808486938, -0.3715171217918396, -0.09861016273498535, 0.17429673671722412, 0.4472036361694336, 0.7201106548309326, 0.9930175542831421, 1.2659244537353516, 1.538831353187561, 1.8117382526397705, 2.0846452713012695, 2.3575520515441895, 2.6304590702056885, 2.9033660888671875, 3.1762728691101074, 3.4491798877716064, 3.7220869064331055, 3.9949936866760254, 4.267900466918945, 4.540807723999023, 4.813714504241943, 5.086621284484863, 5.359528541564941, 5.632435321807861]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 8.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 25.0, 24.0, 34.0, 31.0, 29.0, 50.0, 35.0, 54.0, 45.0, 59.0, 44.0, 54.0, 55.0, 49.0, 62.0, 50.0, 28.0, 32.0, 27.0, 38.0, 24.0, 15.0, 9.0, 11.0, 16.0, 10.0, 8.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6021432876586914, -2.5201263427734375, -2.4381091594696045, -2.3560922145843506, -2.2740750312805176, -2.1920580863952637, -2.1100409030914307, -2.0280239582061768, -1.9460068941116333, -1.8639898300170898, -1.7819727659225464, -1.699955701828003, -1.617938756942749, -1.535921573638916, -1.453904628753662, -1.3718875646591187, -1.2898705005645752, -1.2078534364700317, -1.1258363723754883, -1.0438193082809448, -0.9618023037910461, -0.8797852396965027, -0.797768235206604, -0.7157511711120605, -0.6337341070175171, -0.5517170429229736, -0.46970000863075256, -0.3876829743385315, -0.30566591024398804, -0.22364884614944458, -0.1416318118572235, -0.05961477756500244, 0.022402524948120117, 0.10441957414150238, 0.18643662333488464, 0.2684536576271057, 0.35047072172164917, 0.4324877858161926, 0.5145047903060913, 0.5965218544006348, 0.6785389184951782, 0.7605559825897217, 0.8425730466842651, 0.9245900511741638, 1.0066070556640625, 1.0886242389678955, 1.1706411838531494, 1.2526582479476929, 1.3346753120422363, 1.4166923761367798, 1.4987094402313232, 1.5807265043258667, 1.6627435684204102, 1.744760513305664, 1.8267775774002075, 1.908794641494751, 1.9908117055892944, 2.072828769683838, 2.154845714569092, 2.236862897872925, 2.3188798427581787, 2.4008970260620117, 2.4829139709472656, 2.5649309158325195, 2.6469480991363525]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 17.0, 19.0, 15.0, 27.0, 26.0, 60.0, 81.0, 119.0, 178.0, 299.0, 579.0, 1105.0, 3141.0, 11729.0, 63684.0, 3061058.0, 990725.0, 47668.0, 9106.0, 2583.0, 958.0, 469.0, 230.0, 128.0, 86.0, 51.0, 29.0, 31.0, 16.0, 12.0, 10.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9697265625, -1.9098968505859375, -1.850067138671875, -1.7902374267578125, -1.73040771484375, -1.6705780029296875, -1.610748291015625, -1.5509185791015625, -1.4910888671875, -1.4312591552734375, -1.371429443359375, -1.3115997314453125, -1.25177001953125, -1.1919403076171875, -1.132110595703125, -1.0722808837890625, -1.012451171875, -0.9526214599609375, -0.892791748046875, -0.8329620361328125, -0.77313232421875, -0.7133026123046875, -0.653472900390625, -0.5936431884765625, -0.5338134765625, -0.4739837646484375, -0.414154052734375, -0.3543243408203125, -0.29449462890625, -0.2346649169921875, -0.174835205078125, -0.1150054931640625, -0.05517578125, 0.0046539306640625, 0.064483642578125, 0.1243133544921875, 0.18414306640625, 0.2439727783203125, 0.303802490234375, 0.3636322021484375, 0.4234619140625, 0.4832916259765625, 0.543121337890625, 0.6029510498046875, 0.66278076171875, 0.7226104736328125, 0.782440185546875, 0.8422698974609375, 0.902099609375, 0.9619293212890625, 1.021759033203125, 1.0815887451171875, 1.14141845703125, 1.2012481689453125, 1.261077880859375, 1.3209075927734375, 1.3807373046875, 1.4405670166015625, 1.500396728515625, 1.5602264404296875, 1.62005615234375, 1.6798858642578125, 1.739715576171875, 1.7995452880859375, 1.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 15.0, 12.0, 19.0, 23.0, 35.0, 33.0, 36.0, 46.0, 64.0, 54.0, 56.0, 43.0, 58.0, 58.0, 69.0, 62.0, 60.0, 59.0, 30.0, 45.0, 24.0, 19.0, 19.0, 13.0, 12.0, 11.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10686588287353516, -0.10392951965332031, -0.10099315643310547, -0.09805679321289062, -0.09512042999267578, -0.09218406677246094, -0.0892477035522461, -0.08631134033203125, -0.0833749771118164, -0.08043861389160156, -0.07750225067138672, -0.07456588745117188, -0.07162952423095703, -0.06869316101074219, -0.06575679779052734, -0.0628204345703125, -0.059884071350097656, -0.05694770812988281, -0.05401134490966797, -0.051074981689453125, -0.04813861846923828, -0.04520225524902344, -0.042265892028808594, -0.03932952880859375, -0.036393165588378906, -0.03345680236816406, -0.03052043914794922, -0.027584075927734375, -0.02464771270751953, -0.021711349487304688, -0.018774986267089844, -0.015838623046875, -0.012902259826660156, -0.009965896606445312, -0.007029533386230469, -0.004093170166015625, -0.0011568069458007812, 0.0017795562744140625, 0.004715919494628906, 0.00765228271484375, 0.010588645935058594, 0.013525009155273438, 0.01646137237548828, 0.019397735595703125, 0.02233409881591797, 0.025270462036132812, 0.028206825256347656, 0.0311431884765625, 0.034079551696777344, 0.03701591491699219, 0.03995227813720703, 0.042888641357421875, 0.04582500457763672, 0.04876136779785156, 0.051697731018066406, 0.05463409423828125, 0.057570457458496094, 0.06050682067871094, 0.06344318389892578, 0.06637954711914062, 0.06931591033935547, 0.07225227355957031, 0.07518863677978516, 0.078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 14.0, 20.0, 42.0, 45.0, 67.0, 148.0, 294.0, 798.0, 3467.0, 55880.0, 4114792.0, 15699.0, 1936.0, 535.0, 215.0, 126.0, 77.0, 48.0, 24.0, 18.0, 13.0, 5.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.15582275390625, -4.9600830078125, -4.76434326171875, -4.568603515625, -4.37286376953125, -4.1771240234375, -3.98138427734375, -3.78564453125, -3.58990478515625, -3.3941650390625, -3.19842529296875, -3.002685546875, -2.80694580078125, -2.6112060546875, -2.41546630859375, -2.2197265625, -2.02398681640625, -1.8282470703125, -1.63250732421875, -1.436767578125, -1.24102783203125, -1.0452880859375, -0.84954833984375, -0.65380859375, -0.45806884765625, -0.2623291015625, -0.06658935546875, 0.129150390625, 0.32489013671875, 0.5206298828125, 0.71636962890625, 0.912109375, 1.10784912109375, 1.3035888671875, 1.49932861328125, 1.695068359375, 1.89080810546875, 2.0865478515625, 2.28228759765625, 2.47802734375, 2.67376708984375, 2.8695068359375, 3.06524658203125, 3.260986328125, 3.45672607421875, 3.6524658203125, 3.84820556640625, 4.0439453125, 4.23968505859375, 4.4354248046875, 4.63116455078125, 4.826904296875, 5.02264404296875, 5.2183837890625, 5.41412353515625, 5.60986328125, 5.80560302734375, 6.0013427734375, 6.19708251953125, 6.392822265625, 6.58856201171875, 6.7843017578125, 6.98004150390625, 7.17578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 12.0, 20.0, 35.0, 92.0, 247.0, 1228.0, 1968.0, 301.0, 96.0, 42.0, 20.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7277984619140625, -0.694854736328125, -0.6619110107421875, -0.62896728515625, -0.5960235595703125, -0.563079833984375, -0.5301361083984375, -0.4971923828125, -0.4642486572265625, -0.431304931640625, -0.3983612060546875, -0.36541748046875, -0.3324737548828125, -0.299530029296875, -0.2665863037109375, -0.233642578125, -0.2006988525390625, -0.167755126953125, -0.1348114013671875, -0.10186767578125, -0.0689239501953125, -0.035980224609375, -0.0030364990234375, 0.0299072265625, 0.0628509521484375, 0.095794677734375, 0.1287384033203125, 0.16168212890625, 0.1946258544921875, 0.227569580078125, 0.2605133056640625, 0.29345703125, 0.3264007568359375, 0.359344482421875, 0.3922882080078125, 0.42523193359375, 0.4581756591796875, 0.491119384765625, 0.5240631103515625, 0.5570068359375, 0.5899505615234375, 0.622894287109375, 0.6558380126953125, 0.68878173828125, 0.7217254638671875, 0.754669189453125, 0.7876129150390625, 0.820556640625, 0.8535003662109375, 0.886444091796875, 0.9193878173828125, 0.95233154296875, 0.9852752685546875, 1.018218994140625, 1.0511627197265625, 1.0841064453125, 1.1170501708984375, 1.149993896484375, 1.1829376220703125, 1.21588134765625, 1.2488250732421875, 1.281768798828125, 1.3147125244140625, 1.34765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 16.0, 30.0, 108.0, 275.0, 333.0, 151.0, 61.0, 14.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.704033851623535, -9.428254127502441, -9.152475357055664, -8.87669563293457, -8.600915908813477, -8.3251371383667, -8.049357414245605, -7.77357816696167, -7.497798919677734, -7.222019672393799, -6.946239948272705, -6.6704607009887695, -6.394681453704834, -6.118902206420898, -5.843122482299805, -5.567343235015869, -5.291563510894775, -5.01578426361084, -4.740004539489746, -4.4642252922058105, -4.188446044921875, -3.9126665592193604, -3.6368870735168457, -3.36110782623291, -3.0853283405303955, -2.809548854827881, -2.5337696075439453, -2.2579901218414307, -1.9822107553482056, -1.7064313888549805, -1.4306519031524658, -1.1548725366592407, -0.8790936470031738, -0.6033142805099487, -0.32753485441207886, -0.051755428314208984, 0.2240239381790161, 0.4998033046722412, 0.7755827903747559, 1.051362156867981, 1.327141523361206, 1.6029208898544312, 1.8787002563476562, 2.154479742050171, 2.4302592277526855, 2.706038475036621, 2.9818179607391357, 3.2575974464416504, 3.533376693725586, 3.8091561794281006, 4.084935665130615, 4.360714912414551, 4.636494159698486, 4.912273406982422, 5.188053131103516, 5.463832378387451, 5.739611625671387, 6.015390872955322, 6.291170597076416, 6.566949844360352, 6.842729091644287, 7.118508338928223, 7.394288063049316, 7.670067310333252, 7.945847034454346]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 20.0, 23.0, 27.0, 54.0, 64.0, 72.0, 77.0, 81.0, 104.0, 85.0, 68.0, 54.0, 72.0, 41.0, 31.0, 27.0, 22.0, 19.0, 14.0, 7.0, 0.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5929620265960693, -2.514258623123169, -2.4355552196502686, -2.356851816177368, -2.2781484127044678, -2.1994450092315674, -2.120741605758667, -2.0420382022857666, -1.9633347988128662, -1.8846313953399658, -1.8059279918670654, -1.727224588394165, -1.6485211849212646, -1.5698177814483643, -1.4911143779754639, -1.4124109745025635, -1.333707571029663, -1.2550041675567627, -1.1763007640838623, -1.097597360610962, -1.0188939571380615, -0.9401905536651611, -0.8614871501922607, -0.7827837467193604, -0.70408034324646, -0.6253769397735596, -0.5466735363006592, -0.4679701328277588, -0.3892667293548584, -0.310563325881958, -0.23185992240905762, -0.15315651893615723, -0.07445335388183594, 0.004250049591064453, 0.08295345306396484, 0.16165685653686523, 0.24036026000976562, 0.319063663482666, 0.3977670669555664, 0.4764704704284668, 0.5551738739013672, 0.6338772773742676, 0.712580680847168, 0.7912840843200684, 0.8699874877929688, 0.9486908912658691, 1.0273942947387695, 1.10609769821167, 1.1848011016845703, 1.2635045051574707, 1.342207908630371, 1.4209113121032715, 1.4996147155761719, 1.5783181190490723, 1.6570215225219727, 1.735724925994873, 1.8144283294677734, 1.8931317329406738, 1.9718351364135742, 2.0505385398864746, 2.129241943359375, 2.2079453468322754, 2.286648750305176, 2.365352153778076, 2.4440555572509766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 10.0, 10.0, 21.0, 26.0, 39.0, 50.0, 86.0, 120.0, 169.0, 276.0, 520.0, 1048.0, 2332.0, 8187.0, 56842.0, 520817.0, 405612.0, 41617.0, 6451.0, 2091.0, 898.0, 449.0, 287.0, 189.0, 125.0, 70.0, 52.0, 44.0, 22.0, 24.0, 12.0, 12.0, 14.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9638824462890625, -1.902374267578125, -1.8408660888671875, -1.77935791015625, -1.7178497314453125, -1.656341552734375, -1.5948333740234375, -1.5333251953125, -1.4718170166015625, -1.410308837890625, -1.3488006591796875, -1.28729248046875, -1.2257843017578125, -1.164276123046875, -1.1027679443359375, -1.041259765625, -0.9797515869140625, -0.918243408203125, -0.8567352294921875, -0.79522705078125, -0.7337188720703125, -0.672210693359375, -0.6107025146484375, -0.5491943359375, -0.4876861572265625, -0.426177978515625, -0.3646697998046875, -0.30316162109375, -0.2416534423828125, -0.180145263671875, -0.1186370849609375, -0.05712890625, 0.0043792724609375, 0.065887451171875, 0.1273956298828125, 0.18890380859375, 0.2504119873046875, 0.311920166015625, 0.3734283447265625, 0.4349365234375, 0.4964447021484375, 0.557952880859375, 0.6194610595703125, 0.68096923828125, 0.7424774169921875, 0.803985595703125, 0.8654937744140625, 0.927001953125, 0.9885101318359375, 1.050018310546875, 1.1115264892578125, 1.17303466796875, 1.2345428466796875, 1.296051025390625, 1.3575592041015625, 1.4190673828125, 1.4805755615234375, 1.542083740234375, 1.6035919189453125, 1.66510009765625, 1.7266082763671875, 1.788116455078125, 1.8496246337890625, 1.9111328125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 20.0, 32.0, 52.0, 84.0, 123.0, 131.0, 125.0, 142.0, 106.0, 81.0, 42.0, 21.0, 14.0, 16.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2802734375, -0.2723426818847656, -0.26441192626953125, -0.2564811706542969, -0.2485504150390625, -0.24061965942382812, -0.23268890380859375, -0.22475814819335938, -0.216827392578125, -0.20889663696289062, -0.20096588134765625, -0.19303512573242188, -0.1851043701171875, -0.17717361450195312, -0.16924285888671875, -0.16131210327148438, -0.15338134765625, -0.14545059204101562, -0.13751983642578125, -0.12958908081054688, -0.1216583251953125, -0.11372756958007812, -0.10579681396484375, -0.09786605834960938, -0.089935302734375, -0.08200454711914062, -0.07407379150390625, -0.06614303588867188, -0.0582122802734375, -0.050281524658203125, -0.04235076904296875, -0.034420013427734375, -0.0264892578125, -0.018558502197265625, -0.01062774658203125, -0.002696990966796875, 0.0052337646484375, 0.013164520263671875, 0.02109527587890625, 0.029026031494140625, 0.036956787109375, 0.044887542724609375, 0.05281829833984375, 0.060749053955078125, 0.0686798095703125, 0.07661056518554688, 0.08454132080078125, 0.09247207641601562, 0.10040283203125, 0.10833358764648438, 0.11626434326171875, 0.12419509887695312, 0.1321258544921875, 0.14005661010742188, 0.14798736572265625, 0.15591812133789062, 0.163848876953125, 0.17177963256835938, 0.17971038818359375, 0.18764114379882812, 0.1955718994140625, 0.20350265502929688, 0.21143341064453125, 0.21936416625976562, 0.227294921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 9.0, 25.0, 20.0, 34.0, 56.0, 88.0, 130.0, 183.0, 303.0, 531.0, 921.0, 1958.0, 3888.0, 8701.0, 21403.0, 56743.0, 159134.0, 351285.0, 274526.0, 104130.0, 37391.0, 14739.0, 6087.0, 2851.0, 1440.0, 767.0, 447.0, 254.0, 152.0, 101.0, 73.0, 43.0, 38.0, 18.0, 19.0, 13.0, 4.0, 7.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.509246826171875, -0.48870849609375, -0.468170166015625, -0.4476318359375, -0.427093505859375, -0.40655517578125, -0.386016845703125, -0.365478515625, -0.344940185546875, -0.32440185546875, -0.303863525390625, -0.2833251953125, -0.262786865234375, -0.24224853515625, -0.221710205078125, -0.201171875, -0.180633544921875, -0.16009521484375, -0.139556884765625, -0.1190185546875, -0.098480224609375, -0.07794189453125, -0.057403564453125, -0.036865234375, -0.016326904296875, 0.00421142578125, 0.024749755859375, 0.0452880859375, 0.065826416015625, 0.08636474609375, 0.106903076171875, 0.12744140625, 0.147979736328125, 0.16851806640625, 0.189056396484375, 0.2095947265625, 0.230133056640625, 0.25067138671875, 0.271209716796875, 0.291748046875, 0.312286376953125, 0.33282470703125, 0.353363037109375, 0.3739013671875, 0.394439697265625, 0.41497802734375, 0.435516357421875, 0.4560546875, 0.476593017578125, 0.49713134765625, 0.517669677734375, 0.5382080078125, 0.558746337890625, 0.57928466796875, 0.599822998046875, 0.620361328125, 0.640899658203125, 0.66143798828125, 0.681976318359375, 0.7025146484375, 0.723052978515625, 0.74359130859375, 0.764129638671875, 0.78466796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 9.0, 6.0, 13.0, 18.0, 12.0, 16.0, 17.0, 28.0, 36.0, 32.0, 44.0, 31.0, 38.0, 42.0, 48.0, 53.0, 52.0, 41.0, 58.0, 47.0, 50.0, 39.0, 36.0, 26.0, 29.0, 24.0, 30.0, 25.0, 11.0, 16.0, 8.0, 12.0, 13.0, 10.0, 8.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4697265625, -0.4561195373535156, -0.44251251220703125, -0.4289054870605469, -0.4152984619140625, -0.4016914367675781, -0.38808441162109375, -0.3744773864746094, -0.360870361328125, -0.3472633361816406, -0.33365631103515625, -0.3200492858886719, -0.3064422607421875, -0.2928352355957031, -0.27922821044921875, -0.2656211853027344, -0.25201416015625, -0.23840713500976562, -0.22480010986328125, -0.21119308471679688, -0.1975860595703125, -0.18397903442382812, -0.17037200927734375, -0.15676498413085938, -0.143157958984375, -0.12955093383789062, -0.11594390869140625, -0.10233688354492188, -0.0887298583984375, -0.07512283325195312, -0.06151580810546875, -0.047908782958984375, -0.0343017578125, -0.020694732666015625, -0.00708770751953125, 0.006519317626953125, 0.0201263427734375, 0.033733367919921875, 0.04734039306640625, 0.060947418212890625, 0.074554443359375, 0.08816146850585938, 0.10176849365234375, 0.11537551879882812, 0.1289825439453125, 0.14258956909179688, 0.15619659423828125, 0.16980361938476562, 0.18341064453125, 0.19701766967773438, 0.21062469482421875, 0.22423171997070312, 0.2378387451171875, 0.2514457702636719, 0.26505279541015625, 0.2786598205566406, 0.292266845703125, 0.3058738708496094, 0.31948089599609375, 0.3330879211425781, 0.3466949462890625, 0.3603019714355469, 0.37390899658203125, 0.3875160217285156, 0.401123046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 7.0, 17.0, 25.0, 36.0, 60.0, 97.0, 151.0, 257.0, 571.0, 1144.0, 2934.0, 9246.0, 48157.0, 613841.0, 333385.0, 27838.0, 6558.0, 2232.0, 944.0, 462.0, 216.0, 125.0, 68.0, 56.0, 34.0, 23.0, 13.0, 16.0, 8.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.87451171875, -0.84942626953125, -0.8243408203125, -0.79925537109375, -0.774169921875, -0.74908447265625, -0.7239990234375, -0.69891357421875, -0.673828125, -0.64874267578125, -0.6236572265625, -0.59857177734375, -0.573486328125, -0.54840087890625, -0.5233154296875, -0.49822998046875, -0.47314453125, -0.44805908203125, -0.4229736328125, -0.39788818359375, -0.372802734375, -0.34771728515625, -0.3226318359375, -0.29754638671875, -0.2724609375, -0.24737548828125, -0.2222900390625, -0.19720458984375, -0.172119140625, -0.14703369140625, -0.1219482421875, -0.09686279296875, -0.07177734375, -0.04669189453125, -0.0216064453125, 0.00347900390625, 0.028564453125, 0.05364990234375, 0.0787353515625, 0.10382080078125, 0.12890625, 0.15399169921875, 0.1790771484375, 0.20416259765625, 0.229248046875, 0.25433349609375, 0.2794189453125, 0.30450439453125, 0.32958984375, 0.35467529296875, 0.3797607421875, 0.40484619140625, 0.429931640625, 0.45501708984375, 0.4801025390625, 0.50518798828125, 0.5302734375, 0.55535888671875, 0.5804443359375, 0.60552978515625, 0.630615234375, 0.65570068359375, 0.6807861328125, 0.70587158203125, 0.73095703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 4.0, 10.0, 11.0, 26.0, 31.0, 37.0, 63.0, 75.0, 85.0, 113.0, 105.0, 87.0, 89.0, 64.0, 36.0, 43.0, 28.0, 20.0, 13.0, 13.0, 9.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081031799316406e-05, -6.774440407752991e-05, -6.467849016189575e-05, -6.16125762462616e-05, -5.854666233062744e-05, -5.5480748414993286e-05, -5.241483449935913e-05, -4.9348920583724976e-05, -4.628300666809082e-05, -4.3217092752456665e-05, -4.015117883682251e-05, -3.7085264921188354e-05, -3.40193510055542e-05, -3.0953437089920044e-05, -2.788752317428589e-05, -2.4821609258651733e-05, -2.1755695343017578e-05, -1.8689781427383423e-05, -1.5623867511749268e-05, -1.2557953596115112e-05, -9.492039680480957e-06, -6.426125764846802e-06, -3.3602118492126465e-06, -2.942979335784912e-07, 2.771615982055664e-06, 5.837529897689819e-06, 8.903443813323975e-06, 1.196935772895813e-05, 1.5035271644592285e-05, 1.810118556022644e-05, 2.1167099475860596e-05, 2.423301339149475e-05, 2.7298927307128906e-05, 3.036484122276306e-05, 3.343075513839722e-05, 3.649666905403137e-05, 3.956258296966553e-05, 4.262849688529968e-05, 4.569441080093384e-05, 4.876032471656799e-05, 5.182623863220215e-05, 5.4892152547836304e-05, 5.795806646347046e-05, 6.1023980379104614e-05, 6.408989429473877e-05, 6.715580821037292e-05, 7.022172212600708e-05, 7.328763604164124e-05, 7.635354995727539e-05, 7.941946387290955e-05, 8.24853777885437e-05, 8.555129170417786e-05, 8.861720561981201e-05, 9.168311953544617e-05, 9.474903345108032e-05, 9.781494736671448e-05, 0.00010088086128234863, 0.00010394677519798279, 0.00010701268911361694, 0.0001100786030292511, 0.00011314451694488525, 0.00011621043086051941, 0.00011927634477615356, 0.00012234225869178772, 0.00012540817260742188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 14.0, 20.0, 21.0, 56.0, 72.0, 131.0, 288.0, 603.0, 1257.0, 3144.0, 10333.0, 56121.0, 638806.0, 299222.0, 27818.0, 6501.0, 2230.0, 965.0, 434.0, 235.0, 113.0, 59.0, 41.0, 19.0, 18.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75927734375, -0.73614501953125, -0.7130126953125, -0.68988037109375, -0.666748046875, -0.64361572265625, -0.6204833984375, -0.59735107421875, -0.57421875, -0.55108642578125, -0.5279541015625, -0.50482177734375, -0.481689453125, -0.45855712890625, -0.4354248046875, -0.41229248046875, -0.38916015625, -0.36602783203125, -0.3428955078125, -0.31976318359375, -0.296630859375, -0.27349853515625, -0.2503662109375, -0.22723388671875, -0.2041015625, -0.18096923828125, -0.1578369140625, -0.13470458984375, -0.111572265625, -0.08843994140625, -0.0653076171875, -0.04217529296875, -0.01904296875, 0.00408935546875, 0.0272216796875, 0.05035400390625, 0.073486328125, 0.09661865234375, 0.1197509765625, 0.14288330078125, 0.166015625, 0.18914794921875, 0.2122802734375, 0.23541259765625, 0.258544921875, 0.28167724609375, 0.3048095703125, 0.32794189453125, 0.35107421875, 0.37420654296875, 0.3973388671875, 0.42047119140625, 0.443603515625, 0.46673583984375, 0.4898681640625, 0.51300048828125, 0.5361328125, 0.55926513671875, 0.5823974609375, 0.60552978515625, 0.628662109375, 0.65179443359375, 0.6749267578125, 0.69805908203125, 0.72119140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 16.0, 19.0, 21.0, 41.0, 66.0, 92.0, 93.0, 104.0, 100.0, 83.0, 94.0, 72.0, 58.0, 37.0, 15.0, 15.0, 8.0, 14.0, 3.0, 5.0, 10.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.36565399169921875, -0.3521575927734375, -0.33866119384765625, -0.325164794921875, -0.31166839599609375, -0.2981719970703125, -0.28467559814453125, -0.27117919921875, -0.25768280029296875, -0.2441864013671875, -0.23069000244140625, -0.217193603515625, -0.20369720458984375, -0.1902008056640625, -0.17670440673828125, -0.1632080078125, -0.14971160888671875, -0.1362152099609375, -0.12271881103515625, -0.109222412109375, -0.09572601318359375, -0.0822296142578125, -0.06873321533203125, -0.05523681640625, -0.04174041748046875, -0.0282440185546875, -0.01474761962890625, -0.001251220703125, 0.01224517822265625, 0.0257415771484375, 0.03923797607421875, 0.052734375, 0.06623077392578125, 0.0797271728515625, 0.09322357177734375, 0.106719970703125, 0.12021636962890625, 0.1337127685546875, 0.14720916748046875, 0.16070556640625, 0.17420196533203125, 0.1876983642578125, 0.20119476318359375, 0.214691162109375, 0.22818756103515625, 0.2416839599609375, 0.25518035888671875, 0.2686767578125, 0.28217315673828125, 0.2956695556640625, 0.30916595458984375, 0.322662353515625, 0.33615875244140625, 0.3496551513671875, 0.36315155029296875, 0.37664794921875, 0.39014434814453125, 0.4036407470703125, 0.41713714599609375, 0.430633544921875, 0.44412994384765625, 0.4576263427734375, 0.47112274169921875, 0.484619140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 27.0, 67.0, 141.0, 252.0, 246.0, 136.0, 59.0, 34.0, 18.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.599502563476562, -13.259078979492188, -12.918655395507812, -12.578231811523438, -12.237807273864746, -11.897383689880371, -11.556960105895996, -11.216536521911621, -10.87611198425293, -10.535688400268555, -10.19526481628418, -9.854841232299805, -9.514416694641113, -9.173993110656738, -8.833569526672363, -8.493145942687988, -8.152722358703613, -7.812298774719238, -7.471874713897705, -7.13145112991333, -6.791027069091797, -6.450603485107422, -6.110179901123047, -5.769756317138672, -5.429332256317139, -5.088908672332764, -4.7484846115112305, -4.4080610275268555, -4.0676374435424805, -3.7272133827209473, -3.3867897987365723, -3.046365976333618, -2.705942153930664, -2.36551833152771, -2.025094509124756, -1.6846709251403809, -1.3442471027374268, -1.0038232803344727, -0.6633996963500977, -0.32297587394714355, 0.017447948455810547, 0.3578717112541199, 0.6982954740524292, 1.0387191772460938, 1.3791429996490479, 1.719566822052002, 2.059990406036377, 2.400414228439331, 2.740838050842285, 3.0812618732452393, 3.4216856956481934, 3.7621092796325684, 4.102533340454102, 4.442956924438477, 4.783380508422852, 5.123804092407227, 5.46422815322876, 5.804651737213135, 6.145075798034668, 6.485499382019043, 6.825922966003418, 7.166347026824951, 7.506770610809326, 7.847194671630859, 8.187618255615234]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 14.0, 12.0, 15.0, 19.0, 24.0, 24.0, 33.0, 46.0, 51.0, 45.0, 41.0, 54.0, 50.0, 72.0, 51.0, 53.0, 59.0, 63.0, 41.0, 39.0, 40.0, 32.0, 19.0, 22.0, 24.0, 11.0, 8.0, 5.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2581593990325928, -3.1566693782806396, -3.0551791191101074, -2.9536890983581543, -2.852199077606201, -2.750709056854248, -2.649218797683716, -2.5477287769317627, -2.4462385177612305, -2.3447484970092773, -2.243258237838745, -2.141768217086792, -2.040278196334839, -1.9387880563735962, -1.8372979164123535, -1.7358078956604004, -1.6343178749084473, -1.5328277349472046, -1.4313377141952515, -1.3298475742340088, -1.2283575534820557, -1.126867413520813, -1.0253772735595703, -0.9238871932029724, -0.8223971128463745, -0.7209070324897766, -0.6194169521331787, -0.517926812171936, -0.41643673181533813, -0.31494665145874023, -0.21345651149749756, -0.11196643114089966, -0.01047658920288086, 0.09101350605487823, 0.19250360131263733, 0.2939937114715576, 0.3954837918281555, 0.4969738721847534, 0.5984640121459961, 0.699954092502594, 0.8014441728591919, 0.9029342532157898, 1.0044243335723877, 1.1059144735336304, 1.207404613494873, 1.3088946342468262, 1.4103847742080688, 1.5118749141693115, 1.6133649349212646, 1.7148550748825073, 1.8163450956344604, 1.9178352355957031, 2.0193252563476562, 2.1208152770996094, 2.2223055362701416, 2.3237955570220947, 2.425285816192627, 2.52677583694458, 2.6282660961151123, 2.7297561168670654, 2.8312461376190186, 2.932736396789551, 3.034226417541504, 3.135716438293457, 3.23720645904541]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 10.0, 12.0, 21.0, 19.0, 18.0, 33.0, 39.0, 62.0, 75.0, 124.0, 167.0, 282.0, 609.0, 1645.0, 7255.0, 56019.0, 4001550.0, 111733.0, 10507.0, 2358.0, 759.0, 406.0, 230.0, 111.0, 84.0, 50.0, 27.0, 17.0, 13.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.56622314453125, -2.4898681640625, -2.41351318359375, -2.337158203125, -2.26080322265625, -2.1844482421875, -2.10809326171875, -2.03173828125, -1.95538330078125, -1.8790283203125, -1.80267333984375, -1.726318359375, -1.64996337890625, -1.5736083984375, -1.49725341796875, -1.4208984375, -1.34454345703125, -1.2681884765625, -1.19183349609375, -1.115478515625, -1.03912353515625, -0.9627685546875, -0.88641357421875, -0.81005859375, -0.73370361328125, -0.6573486328125, -0.58099365234375, -0.504638671875, -0.42828369140625, -0.3519287109375, -0.27557373046875, -0.19921875, -0.12286376953125, -0.0465087890625, 0.02984619140625, 0.106201171875, 0.18255615234375, 0.2589111328125, 0.33526611328125, 0.41162109375, 0.48797607421875, 0.5643310546875, 0.64068603515625, 0.717041015625, 0.79339599609375, 0.8697509765625, 0.94610595703125, 1.0224609375, 1.09881591796875, 1.1751708984375, 1.25152587890625, 1.327880859375, 1.40423583984375, 1.4805908203125, 1.55694580078125, 1.63330078125, 1.70965576171875, 1.7860107421875, 1.86236572265625, 1.938720703125, 2.01507568359375, 2.0914306640625, 2.16778564453125, 2.244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 18.0, 30.0, 43.0, 75.0, 93.0, 117.0, 130.0, 124.0, 114.0, 97.0, 56.0, 41.0, 27.0, 21.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.2743644714355469, -0.26650238037109375, -0.2586402893066406, -0.2507781982421875, -0.24291610717773438, -0.23505401611328125, -0.22719192504882812, -0.219329833984375, -0.21146774291992188, -0.20360565185546875, -0.19574356079101562, -0.1878814697265625, -0.18001937866210938, -0.17215728759765625, -0.16429519653320312, -0.15643310546875, -0.14857101440429688, -0.14070892333984375, -0.13284683227539062, -0.1249847412109375, -0.11712265014648438, -0.10926055908203125, -0.10139846801757812, -0.093536376953125, -0.08567428588867188, -0.07781219482421875, -0.06995010375976562, -0.0620880126953125, -0.054225921630859375, -0.04636383056640625, -0.038501739501953125, -0.0306396484375, -0.022777557373046875, -0.01491546630859375, -0.007053375244140625, 0.0008087158203125, 0.008670806884765625, 0.01653289794921875, 0.024394989013671875, 0.032257080078125, 0.040119171142578125, 0.04798126220703125, 0.055843353271484375, 0.0637054443359375, 0.07156753540039062, 0.07942962646484375, 0.08729171752929688, 0.09515380859375, 0.10301589965820312, 0.11087799072265625, 0.11874008178710938, 0.1266021728515625, 0.13446426391601562, 0.14232635498046875, 0.15018844604492188, 0.158050537109375, 0.16591262817382812, 0.17377471923828125, 0.18163681030273438, 0.1894989013671875, 0.19736099243164062, 0.20522308349609375, 0.21308517456054688, 0.220947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 11.0, 4.0, 8.0, 23.0, 19.0, 43.0, 84.0, 178.0, 400.0, 945.0, 2276.0, 6309.0, 21660.0, 113975.0, 3649287.0, 345636.0, 37486.0, 10096.0, 3383.0, 1333.0, 586.0, 250.0, 146.0, 62.0, 29.0, 21.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2436676025390625, -1.203155517578125, -1.1626434326171875, -1.12213134765625, -1.0816192626953125, -1.041107177734375, -1.0005950927734375, -0.9600830078125, -0.9195709228515625, -0.879058837890625, -0.8385467529296875, -0.79803466796875, -0.7575225830078125, -0.717010498046875, -0.6764984130859375, -0.635986328125, -0.5954742431640625, -0.554962158203125, -0.5144500732421875, -0.47393798828125, -0.4334259033203125, -0.392913818359375, -0.3524017333984375, -0.3118896484375, -0.2713775634765625, -0.230865478515625, -0.1903533935546875, -0.14984130859375, -0.1093292236328125, -0.068817138671875, -0.0283050537109375, 0.01220703125, 0.0527191162109375, 0.093231201171875, 0.1337432861328125, 0.17425537109375, 0.2147674560546875, 0.255279541015625, 0.2957916259765625, 0.3363037109375, 0.3768157958984375, 0.417327880859375, 0.4578399658203125, 0.49835205078125, 0.5388641357421875, 0.579376220703125, 0.6198883056640625, 0.660400390625, 0.7009124755859375, 0.741424560546875, 0.7819366455078125, 0.82244873046875, 0.8629608154296875, 0.903472900390625, 0.9439849853515625, 0.9844970703125, 1.0250091552734375, 1.065521240234375, 1.1060333251953125, 1.14654541015625, 1.1870574951171875, 1.227569580078125, 1.2680816650390625, 1.30859375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 9.0, 10.0, 13.0, 15.0, 27.0, 28.0, 39.0, 90.0, 125.0, 264.0, 860.0, 1724.0, 452.0, 161.0, 87.0, 52.0, 30.0, 15.0, 13.0, 17.0, 14.0, 6.0, 8.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4134559631347656, -0.40137481689453125, -0.3892936706542969, -0.3772125244140625, -0.3651313781738281, -0.35305023193359375, -0.3409690856933594, -0.328887939453125, -0.3168067932128906, -0.30472564697265625, -0.2926445007324219, -0.2805633544921875, -0.2684822082519531, -0.25640106201171875, -0.24431991577148438, -0.23223876953125, -0.22015762329101562, -0.20807647705078125, -0.19599533081054688, -0.1839141845703125, -0.17183303833007812, -0.15975189208984375, -0.14767074584960938, -0.135589599609375, -0.12350845336914062, -0.11142730712890625, -0.09934616088867188, -0.0872650146484375, -0.07518386840820312, -0.06310272216796875, -0.051021575927734375, -0.0389404296875, -0.026859283447265625, -0.01477813720703125, -0.002696990966796875, 0.0093841552734375, 0.021465301513671875, 0.03354644775390625, 0.045627593994140625, 0.057708740234375, 0.06978988647460938, 0.08187103271484375, 0.09395217895507812, 0.1060333251953125, 0.11811447143554688, 0.13019561767578125, 0.14227676391601562, 0.15435791015625, 0.16643905639648438, 0.17852020263671875, 0.19060134887695312, 0.2026824951171875, 0.21476364135742188, 0.22684478759765625, 0.23892593383789062, 0.251007080078125, 0.2630882263183594, 0.27516937255859375, 0.2872505187988281, 0.2993316650390625, 0.3114128112792969, 0.32349395751953125, 0.3355751037597656, 0.34765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 29.0, 81.0, 289.0, 393.0, 147.0, 49.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312604904174805, -6.104586124420166, -5.896567344665527, -5.688548564910889, -5.48052978515625, -5.272511005401611, -5.064492225646973, -4.856472969055176, -4.648454666137695, -4.440435886383057, -4.232417106628418, -4.024398326873779, -3.8163795471191406, -3.608360767364502, -3.400341749191284, -3.1923229694366455, -2.9843039512634277, -2.776285171508789, -2.5682663917541504, -2.3602476119995117, -2.152228832244873, -1.9442099332809448, -1.7361910343170166, -1.528172254562378, -1.3201534748077393, -1.1121346950531006, -0.9041158556938171, -0.6960970163345337, -0.488078236579895, -0.28005945682525635, -0.07204055786132812, 0.13597822189331055, 0.343996524810791, 0.5520153045654297, 0.7600341439247131, 0.9680529832839966, 1.1760717630386353, 1.384090542793274, 1.5921094417572021, 1.8001282215118408, 2.0081470012664795, 2.216165781021118, 2.424184560775757, 2.6322035789489746, 2.8402223587036133, 3.048241138458252, 3.2562599182128906, 3.4642786979675293, 3.672297477722168, 3.8803162574768066, 4.088335037231445, 4.296353816986084, 4.504372596740723, 4.712391376495361, 4.92041015625, 5.128429412841797, 5.336447715759277, 5.544466495513916, 5.752485275268555, 5.960504055023193, 6.168522834777832, 6.376541614532471, 6.584560394287109, 6.792579650878906, 7.000598430633545]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 14.0, 20.0, 26.0, 16.0, 27.0, 36.0, 22.0, 55.0, 44.0, 43.0, 42.0, 43.0, 34.0, 67.0, 42.0, 55.0, 66.0, 48.0, 42.0, 35.0, 39.0, 31.0, 20.0, 16.0, 22.0, 19.0, 13.0, 10.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.987533688545227, -0.9483421444892883, -0.9091506004333496, -0.8699590563774109, -0.8307675123214722, -0.7915759682655334, -0.7523844242095947, -0.713192880153656, -0.6740013360977173, -0.6348097920417786, -0.5956182479858398, -0.5564267039299011, -0.5172351598739624, -0.4780436158180237, -0.43885207176208496, -0.39966052770614624, -0.3604689836502075, -0.3212774395942688, -0.2820858955383301, -0.24289435148239136, -0.20370280742645264, -0.16451126337051392, -0.1253197193145752, -0.08612817525863647, -0.046936631202697754, -0.007745087146759033, 0.03144645690917969, 0.07063800096511841, 0.10982954502105713, 0.14902108907699585, 0.18821263313293457, 0.2274041771888733, 0.26659584045410156, 0.3057873845100403, 0.344978928565979, 0.3841704726219177, 0.42336201667785645, 0.46255356073379517, 0.5017451047897339, 0.5409366488456726, 0.5801281929016113, 0.61931973695755, 0.6585112810134888, 0.6977028250694275, 0.7368943691253662, 0.7760859131813049, 0.8152774572372437, 0.8544690012931824, 0.8936605453491211, 0.9328520894050598, 0.9720436334609985, 1.011235237121582, 1.050426721572876, 1.08961820602417, 1.1288098096847534, 1.168001413345337, 1.2071928977966309, 1.2463843822479248, 1.2855759859085083, 1.3247675895690918, 1.3639590740203857, 1.4031505584716797, 1.4423421621322632, 1.4815337657928467, 1.5207252502441406]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 14.0, 5.0, 13.0, 21.0, 14.0, 40.0, 30.0, 53.0, 82.0, 103.0, 184.0, 302.0, 544.0, 997.0, 2267.0, 7512.0, 37125.0, 261904.0, 602135.0, 110050.0, 17461.0, 4240.0, 1615.0, 693.0, 388.0, 242.0, 156.0, 96.0, 63.0, 54.0, 50.0, 19.0, 14.0, 16.0, 6.0, 16.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.18359375, -2.126556396484375, -2.06951904296875, -2.012481689453125, -1.9554443359375, -1.898406982421875, -1.84136962890625, -1.784332275390625, -1.727294921875, -1.670257568359375, -1.61322021484375, -1.556182861328125, -1.4991455078125, -1.442108154296875, -1.38507080078125, -1.328033447265625, -1.27099609375, -1.213958740234375, -1.15692138671875, -1.099884033203125, -1.0428466796875, -0.985809326171875, -0.92877197265625, -0.871734619140625, -0.814697265625, -0.757659912109375, -0.70062255859375, -0.643585205078125, -0.5865478515625, -0.529510498046875, -0.47247314453125, -0.415435791015625, -0.3583984375, -0.301361083984375, -0.24432373046875, -0.187286376953125, -0.1302490234375, -0.073211669921875, -0.01617431640625, 0.040863037109375, 0.097900390625, 0.154937744140625, 0.21197509765625, 0.269012451171875, 0.3260498046875, 0.383087158203125, 0.44012451171875, 0.497161865234375, 0.55419921875, 0.611236572265625, 0.66827392578125, 0.725311279296875, 0.7823486328125, 0.839385986328125, 0.89642333984375, 0.953460693359375, 1.010498046875, 1.067535400390625, 1.12457275390625, 1.181610107421875, 1.2386474609375, 1.295684814453125, 1.35272216796875, 1.409759521484375, 1.466796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 11.0, 13.0, 37.0, 46.0, 76.0, 89.0, 130.0, 151.0, 104.0, 97.0, 66.0, 57.0, 55.0, 24.0, 24.0, 7.0, 11.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.29900360107421875, -0.2908782958984375, -0.28275299072265625, -0.274627685546875, -0.26650238037109375, -0.2583770751953125, -0.25025177001953125, -0.24212646484375, -0.23400115966796875, -0.2258758544921875, -0.21775054931640625, -0.209625244140625, -0.20149993896484375, -0.1933746337890625, -0.18524932861328125, -0.1771240234375, -0.16899871826171875, -0.1608734130859375, -0.15274810791015625, -0.144622802734375, -0.13649749755859375, -0.1283721923828125, -0.12024688720703125, -0.11212158203125, -0.10399627685546875, -0.0958709716796875, -0.08774566650390625, -0.079620361328125, -0.07149505615234375, -0.0633697509765625, -0.05524444580078125, -0.047119140625, -0.03899383544921875, -0.0308685302734375, -0.02274322509765625, -0.014617919921875, -0.00649261474609375, 0.0016326904296875, 0.00975799560546875, 0.01788330078125, 0.02600860595703125, 0.0341339111328125, 0.04225921630859375, 0.050384521484375, 0.05850982666015625, 0.0666351318359375, 0.07476043701171875, 0.0828857421875, 0.09101104736328125, 0.0991363525390625, 0.10726165771484375, 0.115386962890625, 0.12351226806640625, 0.1316375732421875, 0.13976287841796875, 0.14788818359375, 0.15601348876953125, 0.1641387939453125, 0.17226409912109375, 0.180389404296875, 0.18851470947265625, 0.1966400146484375, 0.20476531982421875, 0.212890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 15.0, 20.0, 18.0, 33.0, 51.0, 61.0, 133.0, 188.0, 313.0, 521.0, 1019.0, 2104.0, 4218.0, 9900.0, 23624.0, 64968.0, 186904.0, 381415.0, 236430.0, 84451.0, 29835.0, 11961.0, 5142.0, 2404.0, 1222.0, 673.0, 353.0, 191.0, 120.0, 79.0, 48.0, 29.0, 21.0, 21.0, 10.0, 9.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.806640625, -0.7833404541015625, -0.760040283203125, -0.7367401123046875, -0.71343994140625, -0.6901397705078125, -0.666839599609375, -0.6435394287109375, -0.6202392578125, -0.5969390869140625, -0.573638916015625, -0.5503387451171875, -0.52703857421875, -0.5037384033203125, -0.480438232421875, -0.4571380615234375, -0.433837890625, -0.4105377197265625, -0.387237548828125, -0.3639373779296875, -0.34063720703125, -0.3173370361328125, -0.294036865234375, -0.2707366943359375, -0.2474365234375, -0.2241363525390625, -0.200836181640625, -0.1775360107421875, -0.15423583984375, -0.1309356689453125, -0.107635498046875, -0.0843353271484375, -0.06103515625, -0.0377349853515625, -0.014434814453125, 0.0088653564453125, 0.03216552734375, 0.0554656982421875, 0.078765869140625, 0.1020660400390625, 0.1253662109375, 0.1486663818359375, 0.171966552734375, 0.1952667236328125, 0.21856689453125, 0.2418670654296875, 0.265167236328125, 0.2884674072265625, 0.311767578125, 0.3350677490234375, 0.358367919921875, 0.3816680908203125, 0.40496826171875, 0.4282684326171875, 0.451568603515625, 0.4748687744140625, 0.4981689453125, 0.5214691162109375, 0.544769287109375, 0.5680694580078125, 0.59136962890625, 0.6146697998046875, 0.637969970703125, 0.6612701416015625, 0.6845703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 6.0, 7.0, 17.0, 13.0, 11.0, 24.0, 15.0, 19.0, 22.0, 22.0, 27.0, 29.0, 35.0, 40.0, 32.0, 44.0, 48.0, 50.0, 48.0, 41.0, 50.0, 52.0, 35.0, 40.0, 32.0, 33.0, 28.0, 19.0, 26.0, 22.0, 24.0, 16.0, 15.0, 18.0, 9.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.49658203125, -0.4825859069824219, -0.46858978271484375, -0.4545936584472656, -0.4405975341796875, -0.4266014099121094, -0.41260528564453125, -0.3986091613769531, -0.384613037109375, -0.3706169128417969, -0.35662078857421875, -0.3426246643066406, -0.3286285400390625, -0.3146324157714844, -0.30063629150390625, -0.2866401672363281, -0.27264404296875, -0.2586479187011719, -0.24465179443359375, -0.23065567016601562, -0.2166595458984375, -0.20266342163085938, -0.18866729736328125, -0.17467117309570312, -0.160675048828125, -0.14667892456054688, -0.13268280029296875, -0.11868667602539062, -0.1046905517578125, -0.09069442749023438, -0.07669830322265625, -0.06270217895507812, -0.0487060546875, -0.034709930419921875, -0.02071380615234375, -0.006717681884765625, 0.0072784423828125, 0.021274566650390625, 0.03527069091796875, 0.049266815185546875, 0.063262939453125, 0.07725906372070312, 0.09125518798828125, 0.10525131225585938, 0.1192474365234375, 0.13324356079101562, 0.14723968505859375, 0.16123580932617188, 0.17523193359375, 0.18922805786132812, 0.20322418212890625, 0.21722030639648438, 0.2312164306640625, 0.24521255493164062, 0.25920867919921875, 0.2732048034667969, 0.287200927734375, 0.3011970520019531, 0.31519317626953125, 0.3291893005371094, 0.3431854248046875, 0.3571815490722656, 0.37117767333984375, 0.3851737976074219, 0.399169921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 18.0, 22.0, 43.0, 83.0, 144.0, 276.0, 658.0, 1681.0, 6500.0, 41663.0, 430350.0, 504416.0, 51962.0, 7510.0, 1914.0, 696.0, 288.0, 141.0, 76.0, 37.0, 27.0, 13.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.48894500732421875, -0.4686126708984375, -0.44828033447265625, -0.427947998046875, -0.40761566162109375, -0.3872833251953125, -0.36695098876953125, -0.34661865234375, -0.32628631591796875, -0.3059539794921875, -0.28562164306640625, -0.265289306640625, -0.24495697021484375, -0.2246246337890625, -0.20429229736328125, -0.1839599609375, -0.16362762451171875, -0.1432952880859375, -0.12296295166015625, -0.102630615234375, -0.08229827880859375, -0.0619659423828125, -0.04163360595703125, -0.02130126953125, -0.00096893310546875, 0.0193634033203125, 0.03969573974609375, 0.060028076171875, 0.08036041259765625, 0.1006927490234375, 0.12102508544921875, 0.141357421875, 0.16168975830078125, 0.1820220947265625, 0.20235443115234375, 0.222686767578125, 0.24301910400390625, 0.2633514404296875, 0.28368377685546875, 0.30401611328125, 0.32434844970703125, 0.3446807861328125, 0.36501312255859375, 0.385345458984375, 0.40567779541015625, 0.4260101318359375, 0.44634246826171875, 0.4666748046875, 0.48700714111328125, 0.5073394775390625, 0.5276718139648438, 0.548004150390625, 0.5683364868164062, 0.5886688232421875, 0.6090011596679688, 0.62933349609375, 0.6496658325195312, 0.6699981689453125, 0.6903305053710938, 0.710662841796875, 0.7309951782226562, 0.7513275146484375, 0.7716598510742188, 0.7919921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 19.0, 20.0, 20.0, 22.0, 29.0, 41.0, 80.0, 70.0, 105.0, 113.0, 100.0, 73.0, 62.0, 54.0, 38.0, 36.0, 25.0, 22.0, 19.0, 15.0, 4.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.605552673339844e-05, -7.332488894462585e-05, -7.059425115585327e-05, -6.786361336708069e-05, -6.51329755783081e-05, -6.240233778953552e-05, -5.967170000076294e-05, -5.6941062211990356e-05, -5.4210424423217773e-05, -5.147978663444519e-05, -4.874914884567261e-05, -4.6018511056900024e-05, -4.328787326812744e-05, -4.055723547935486e-05, -3.7826597690582275e-05, -3.509595990180969e-05, -3.236532211303711e-05, -2.9634684324264526e-05, -2.6904046535491943e-05, -2.417340874671936e-05, -2.1442770957946777e-05, -1.8712133169174194e-05, -1.598149538040161e-05, -1.3250857591629028e-05, -1.0520219802856445e-05, -7.789582014083862e-06, -5.058944225311279e-06, -2.3283064365386963e-06, 4.023313522338867e-07, 3.1329691410064697e-06, 5.863606929779053e-06, 8.594244718551636e-06, 1.1324882507324219e-05, 1.4055520296096802e-05, 1.6786158084869385e-05, 1.9516795873641968e-05, 2.224743366241455e-05, 2.4978071451187134e-05, 2.7708709239959717e-05, 3.04393470287323e-05, 3.316998481750488e-05, 3.5900622606277466e-05, 3.863126039505005e-05, 4.136189818382263e-05, 4.4092535972595215e-05, 4.68231737613678e-05, 4.955381155014038e-05, 5.2284449338912964e-05, 5.501508712768555e-05, 5.774572491645813e-05, 6.047636270523071e-05, 6.32070004940033e-05, 6.593763828277588e-05, 6.866827607154846e-05, 7.139891386032104e-05, 7.412955164909363e-05, 7.686018943786621e-05, 7.95908272266388e-05, 8.232146501541138e-05, 8.505210280418396e-05, 8.778274059295654e-05, 9.051337838172913e-05, 9.324401617050171e-05, 9.597465395927429e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 8.0, 16.0, 19.0, 29.0, 62.0, 93.0, 122.0, 262.0, 562.0, 1264.0, 4153.0, 17191.0, 100632.0, 510616.0, 343812.0, 54692.0, 10291.0, 2732.0, 1002.0, 418.0, 222.0, 131.0, 66.0, 48.0, 36.0, 19.0, 8.0, 14.0, 7.0, 4.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.459716796875, -0.4443092346191406, -0.42890167236328125, -0.4134941101074219, -0.3980865478515625, -0.3826789855957031, -0.36727142333984375, -0.3518638610839844, -0.336456298828125, -0.3210487365722656, -0.30564117431640625, -0.2902336120605469, -0.2748260498046875, -0.2594184875488281, -0.24401092529296875, -0.22860336303710938, -0.21319580078125, -0.19778823852539062, -0.18238067626953125, -0.16697311401367188, -0.1515655517578125, -0.13615798950195312, -0.12075042724609375, -0.10534286499023438, -0.089935302734375, -0.07452774047851562, -0.05912017822265625, -0.043712615966796875, -0.0283050537109375, -0.012897491455078125, 0.00251007080078125, 0.017917633056640625, 0.0333251953125, 0.048732757568359375, 0.06414031982421875, 0.07954788208007812, 0.0949554443359375, 0.11036300659179688, 0.12577056884765625, 0.14117813110351562, 0.156585693359375, 0.17199325561523438, 0.18740081787109375, 0.20280838012695312, 0.2182159423828125, 0.23362350463867188, 0.24903106689453125, 0.2644386291503906, 0.27984619140625, 0.2952537536621094, 0.31066131591796875, 0.3260688781738281, 0.3414764404296875, 0.3568840026855469, 0.37229156494140625, 0.3876991271972656, 0.403106689453125, 0.4185142517089844, 0.43392181396484375, 0.4493293762207031, 0.4647369384765625, 0.4801445007324219, 0.49555206298828125, 0.5109596252441406, 0.5263671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 2.0, 13.0, 12.0, 21.0, 26.0, 33.0, 28.0, 46.0, 60.0, 46.0, 51.0, 57.0, 71.0, 66.0, 72.0, 61.0, 54.0, 41.0, 37.0, 37.0, 32.0, 23.0, 21.0, 19.0, 10.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.28564453125, -0.2768096923828125, -0.267974853515625, -0.2591400146484375, -0.25030517578125, -0.2414703369140625, -0.232635498046875, -0.2238006591796875, -0.2149658203125, -0.2061309814453125, -0.197296142578125, -0.1884613037109375, -0.17962646484375, -0.1707916259765625, -0.161956787109375, -0.1531219482421875, -0.144287109375, -0.1354522705078125, -0.126617431640625, -0.1177825927734375, -0.10894775390625, -0.1001129150390625, -0.091278076171875, -0.0824432373046875, -0.0736083984375, -0.0647735595703125, -0.055938720703125, -0.0471038818359375, -0.03826904296875, -0.0294342041015625, -0.020599365234375, -0.0117645263671875, -0.0029296875, 0.0059051513671875, 0.014739990234375, 0.0235748291015625, 0.03240966796875, 0.0412445068359375, 0.050079345703125, 0.0589141845703125, 0.0677490234375, 0.0765838623046875, 0.085418701171875, 0.0942535400390625, 0.10308837890625, 0.1119232177734375, 0.120758056640625, 0.1295928955078125, 0.138427734375, 0.1472625732421875, 0.156097412109375, 0.1649322509765625, 0.17376708984375, 0.1826019287109375, 0.191436767578125, 0.2002716064453125, 0.2091064453125, 0.2179412841796875, 0.226776123046875, 0.2356109619140625, 0.24444580078125, 0.2532806396484375, 0.262115478515625, 0.2709503173828125, 0.27978515625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 17.0, 25.0, 57.0, 124.0, 189.0, 227.0, 175.0, 99.0, 40.0, 25.0, 6.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.865457534790039, -4.528101444244385, -4.190745830535889, -3.8533897399902344, -3.516033887863159, -3.178678035736084, -2.8413219451904297, -2.5039660930633545, -2.1666102409362793, -1.829254388809204, -1.4918984174728394, -1.1545424461364746, -0.8171865940093994, -0.4798307418823242, -0.14247465133666992, 0.19488120079040527, 0.5322370529174805, 0.8695929646492004, 1.2069488763809204, 1.5443048477172852, 1.8816606998443604, 2.2190165519714355, 2.55637264251709, 2.893728494644165, 3.2310843467712402, 3.5684401988983154, 3.9057960510253906, 4.243152141571045, 4.580508232116699, 4.917863845825195, 5.25521993637085, 5.592576026916504, 5.929931640625, 6.267287731170654, 6.60464334487915, 6.941999435424805, 7.279355049133301, 7.616711139678955, 7.954067230224609, 8.291422843933105, 8.628778457641602, 8.966134071350098, 9.30349063873291, 9.640846252441406, 9.978201866149902, 10.315557479858398, 10.652914047241211, 10.990269660949707, 11.32762622833252, 11.664981842041016, 12.002338409423828, 12.339694023132324, 12.67704963684082, 13.014406204223633, 13.351761817932129, 13.689117431640625, 14.026473999023438, 14.363829612731934, 14.701186180114746, 15.038541793823242, 15.375897407531738, 15.713253021240234, 16.050609588623047, 16.38796615600586, 16.72532081604004]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 9.0, 8.0, 7.0, 10.0, 11.0, 20.0, 20.0, 22.0, 28.0, 24.0, 38.0, 29.0, 32.0, 41.0, 35.0, 37.0, 50.0, 48.0, 48.0, 49.0, 52.0, 51.0, 36.0, 40.0, 35.0, 37.0, 27.0, 31.0, 21.0, 15.0, 18.0, 13.0, 7.0, 7.0, 8.0, 6.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.21193528175354, -3.127472162246704, -3.043008804321289, -2.958545684814453, -2.874082565307617, -2.7896194458007812, -2.705156087875366, -2.6206929683685303, -2.5362296104431152, -2.4517664909362793, -2.3673031330108643, -2.2828400135040283, -2.1983768939971924, -2.1139135360717773, -2.0294504165649414, -1.9449872970581055, -1.8605241775512695, -1.776060938835144, -1.691597819328308, -1.6071345806121826, -1.5226714611053467, -1.4382082223892212, -1.3537449836730957, -1.2692818641662598, -1.1848186254501343, -1.1003553867340088, -1.0158922672271729, -0.9314290285110474, -0.8469658493995667, -0.7625026702880859, -0.6780394315719604, -0.5935762524604797, -0.5091128349304199, -0.4246496558189392, -0.3401864469051361, -0.255723237991333, -0.1712600588798523, -0.08679687976837158, -0.0023336410522460938, 0.08212953805923462, 0.16659271717071533, 0.25105589628219604, 0.33551910519599915, 0.41998231410980225, 0.504445493221283, 0.5889086723327637, 0.6733719110488892, 0.7578350901603699, 0.8422982692718506, 0.9267614483833313, 1.011224627494812, 1.0956878662109375, 1.1801509857177734, 1.264614224433899, 1.3490774631500244, 1.4335405826568604, 1.5180038213729858, 1.6024670600891113, 1.6869301795959473, 1.7713934183120728, 1.8558566570281982, 1.9403197765350342, 2.024783134460449, 2.109246253967285, 2.193709373474121]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 2.0, 6.0, 12.0, 4.0, 6.0, 12.0, 19.0, 17.0, 21.0, 36.0, 37.0, 32.0, 48.0, 65.0, 81.0, 146.0, 254.0, 474.0, 936.0, 2354.0, 6151.0, 22400.0, 218628.0, 3850551.0, 71246.0, 12887.0, 4210.0, 1655.0, 834.0, 467.0, 230.0, 158.0, 87.0, 70.0, 46.0, 32.0, 22.0, 16.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9375, -1.87139892578125, -1.8052978515625, -1.73919677734375, -1.673095703125, -1.60699462890625, -1.5408935546875, -1.47479248046875, -1.40869140625, -1.34259033203125, -1.2764892578125, -1.21038818359375, -1.144287109375, -1.07818603515625, -1.0120849609375, -0.94598388671875, -0.8798828125, -0.81378173828125, -0.7476806640625, -0.68157958984375, -0.615478515625, -0.54937744140625, -0.4832763671875, -0.41717529296875, -0.35107421875, -0.28497314453125, -0.2188720703125, -0.15277099609375, -0.086669921875, -0.02056884765625, 0.0455322265625, 0.11163330078125, 0.177734375, 0.24383544921875, 0.3099365234375, 0.37603759765625, 0.442138671875, 0.50823974609375, 0.5743408203125, 0.64044189453125, 0.70654296875, 0.77264404296875, 0.8387451171875, 0.90484619140625, 0.970947265625, 1.03704833984375, 1.1031494140625, 1.16925048828125, 1.2353515625, 1.30145263671875, 1.3675537109375, 1.43365478515625, 1.499755859375, 1.56585693359375, 1.6319580078125, 1.69805908203125, 1.76416015625, 1.83026123046875, 1.8963623046875, 1.96246337890625, 2.028564453125, 2.09466552734375, 2.1607666015625, 2.22686767578125, 2.29296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 12.0, 29.0, 33.0, 48.0, 72.0, 72.0, 119.0, 117.0, 125.0, 84.0, 83.0, 81.0, 44.0, 28.0, 20.0, 13.0, 5.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2983074188232422, -0.2902183532714844, -0.28212928771972656, -0.27404022216796875, -0.26595115661621094, -0.2578620910644531, -0.2497730255126953, -0.2416839599609375, -0.2335948944091797, -0.22550582885742188, -0.21741676330566406, -0.20932769775390625, -0.20123863220214844, -0.19314956665039062, -0.1850605010986328, -0.176971435546875, -0.1688823699951172, -0.16079330444335938, -0.15270423889160156, -0.14461517333984375, -0.13652610778808594, -0.12843704223632812, -0.12034797668457031, -0.1122589111328125, -0.10416984558105469, -0.09608078002929688, -0.08799171447753906, -0.07990264892578125, -0.07181358337402344, -0.06372451782226562, -0.05563545227050781, -0.04754638671875, -0.03945732116699219, -0.031368255615234375, -0.023279190063476562, -0.01519012451171875, -0.0071010589599609375, 0.000988006591796875, 0.009077072143554688, 0.0171661376953125, 0.025255203247070312, 0.033344268798828125, 0.04143333435058594, 0.04952239990234375, 0.05761146545410156, 0.06570053100585938, 0.07378959655761719, 0.081878662109375, 0.08996772766113281, 0.09805679321289062, 0.10614585876464844, 0.11423492431640625, 0.12232398986816406, 0.13041305541992188, 0.1385021209716797, 0.1465911865234375, 0.1546802520751953, 0.16276931762695312, 0.17085838317871094, 0.17894744873046875, 0.18703651428222656, 0.19512557983398438, 0.2032146453857422, 0.2113037109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 8.0, 15.0, 22.0, 10.0, 25.0, 31.0, 51.0, 69.0, 114.0, 266.0, 555.0, 1365.0, 3801.0, 15211.0, 105357.0, 3735810.0, 295057.0, 27225.0, 5940.0, 1843.0, 722.0, 346.0, 181.0, 82.0, 56.0, 42.0, 24.0, 18.0, 7.0, 8.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8935546875, -1.835601806640625, -1.77764892578125, -1.719696044921875, -1.6617431640625, -1.603790283203125, -1.54583740234375, -1.487884521484375, -1.429931640625, -1.371978759765625, -1.31402587890625, -1.256072998046875, -1.1981201171875, -1.140167236328125, -1.08221435546875, -1.024261474609375, -0.96630859375, -0.908355712890625, -0.85040283203125, -0.792449951171875, -0.7344970703125, -0.676544189453125, -0.61859130859375, -0.560638427734375, -0.502685546875, -0.444732666015625, -0.38677978515625, -0.328826904296875, -0.2708740234375, -0.212921142578125, -0.15496826171875, -0.097015380859375, -0.0390625, 0.018890380859375, 0.07684326171875, 0.134796142578125, 0.1927490234375, 0.250701904296875, 0.30865478515625, 0.366607666015625, 0.424560546875, 0.482513427734375, 0.54046630859375, 0.598419189453125, 0.6563720703125, 0.714324951171875, 0.77227783203125, 0.830230712890625, 0.88818359375, 0.946136474609375, 1.00408935546875, 1.062042236328125, 1.1199951171875, 1.177947998046875, 1.23590087890625, 1.293853759765625, 1.351806640625, 1.409759521484375, 1.46771240234375, 1.525665283203125, 1.5836181640625, 1.641571044921875, 1.69952392578125, 1.757476806640625, 1.8154296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 11.0, 11.0, 21.0, 27.0, 38.0, 51.0, 119.0, 245.0, 670.0, 1874.0, 520.0, 196.0, 110.0, 61.0, 40.0, 26.0, 20.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5330352783203125, -0.512847900390625, -0.4926605224609375, -0.47247314453125, -0.4522857666015625, -0.432098388671875, -0.4119110107421875, -0.3917236328125, -0.3715362548828125, -0.351348876953125, -0.3311614990234375, -0.31097412109375, -0.2907867431640625, -0.270599365234375, -0.2504119873046875, -0.230224609375, -0.2100372314453125, -0.189849853515625, -0.1696624755859375, -0.14947509765625, -0.1292877197265625, -0.109100341796875, -0.0889129638671875, -0.0687255859375, -0.0485382080078125, -0.028350830078125, -0.0081634521484375, 0.01202392578125, 0.0322113037109375, 0.052398681640625, 0.0725860595703125, 0.0927734375, 0.1129608154296875, 0.133148193359375, 0.1533355712890625, 0.17352294921875, 0.1937103271484375, 0.213897705078125, 0.2340850830078125, 0.2542724609375, 0.2744598388671875, 0.294647216796875, 0.3148345947265625, 0.33502197265625, 0.3552093505859375, 0.375396728515625, 0.3955841064453125, 0.415771484375, 0.4359588623046875, 0.456146240234375, 0.4763336181640625, 0.49652099609375, 0.5167083740234375, 0.536895751953125, 0.5570831298828125, 0.5772705078125, 0.5974578857421875, 0.617645263671875, 0.6378326416015625, 0.65802001953125, 0.6782073974609375, 0.698394775390625, 0.7185821533203125, 0.73876953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 12.0, 24.0, 130.0, 322.0, 332.0, 125.0, 47.0, 7.0, 7.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.870895385742188, -15.582854270935059, -15.29481315612793, -15.0067720413208, -14.718730926513672, -14.43069076538086, -14.142648696899414, -13.854608535766602, -13.566567420959473, -13.278526306152344, -12.990485191345215, -12.702444076538086, -12.414402961730957, -12.126361846923828, -11.838321685791016, -11.550280570983887, -11.262239456176758, -10.974198341369629, -10.6861572265625, -10.398116111755371, -10.110074996948242, -9.82203483581543, -9.533992767333984, -9.245952606201172, -8.957910537719727, -8.669869422912598, -8.381828308105469, -8.09378719329834, -7.805746555328369, -7.51770544052124, -7.229664325714111, -6.941623687744141, -6.6535820960998535, -6.365540981292725, -6.077499866485596, -5.789459228515625, -5.501418113708496, -5.213376998901367, -4.925335884094238, -4.637294769287109, -4.3492536544799805, -4.061212539672852, -3.7731716632843018, -3.485130548477173, -3.197089672088623, -2.909048557281494, -2.6210074424743652, -2.3329665660858154, -2.0449256896972656, -1.7568846940994263, -1.468843698501587, -1.180802583694458, -0.8927615880966187, -0.6047205924987793, -0.3166794776916504, -0.028638601303100586, 0.2594025135040283, 0.5474435091018677, 0.8354845643043518, 1.123525619506836, 1.4115666151046753, 1.6996076107025146, 1.9876487255096436, 2.2756896018981934, 2.5637307167053223]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 8.0, 3.0, 6.0, 4.0, 11.0, 11.0, 19.0, 16.0, 30.0, 22.0, 27.0, 27.0, 28.0, 35.0, 42.0, 26.0, 46.0, 51.0, 55.0, 53.0, 40.0, 59.0, 45.0, 39.0, 34.0, 38.0, 32.0, 20.0, 36.0, 23.0, 17.0, 20.0, 14.0, 10.0, 15.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3890295028686523, -1.3394087553024292, -1.2897881269454956, -1.2401673793792725, -1.1905467510223389, -1.1409260034561157, -1.0913052558898926, -1.041684627532959, -0.9920638799667358, -0.9424431920051575, -0.8928225040435791, -0.843201756477356, -0.7935810685157776, -0.7439603805541992, -0.6943396329879761, -0.6447189450263977, -0.5950982570648193, -0.545477569103241, -0.4958568513393402, -0.44623613357543945, -0.3966154456138611, -0.3469947576522827, -0.29737403988838196, -0.2477533221244812, -0.19813263416290283, -0.14851193130016327, -0.0988912284374237, -0.04927052557468414, 0.0003501772880554199, 0.04997088015079498, 0.09959158301353455, 0.1492123007774353, 0.19883298873901367, 0.24845369160175323, 0.2980743944644928, 0.34769511222839355, 0.3973158001899719, 0.4469364881515503, 0.49655720591545105, 0.5461779236793518, 0.5957986116409302, 0.6454192996025085, 0.6950399875640869, 0.7446607351303101, 0.7942814230918884, 0.8439021110534668, 0.8935228586196899, 0.9431435465812683, 0.9927642345428467, 1.0423849821090698, 1.0920056104660034, 1.1416263580322266, 1.1912469863891602, 1.2408677339553833, 1.2904884815216064, 1.34010910987854, 1.3897298574447632, 1.4393506050109863, 1.48897123336792, 1.538591980934143, 1.5882127285003662, 1.6378333568572998, 1.687454104423523, 1.737074851989746, 1.7866954803466797]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 10.0, 12.0, 26.0, 29.0, 64.0, 91.0, 180.0, 434.0, 988.0, 3101.0, 16685.0, 199791.0, 755842.0, 60576.0, 7602.0, 1860.0, 617.0, 254.0, 144.0, 83.0, 47.0, 30.0, 24.0, 19.0, 7.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.59918212890625, -2.5186767578125, -2.43817138671875, -2.357666015625, -2.27716064453125, -2.1966552734375, -2.11614990234375, -2.03564453125, -1.95513916015625, -1.8746337890625, -1.79412841796875, -1.713623046875, -1.63311767578125, -1.5526123046875, -1.47210693359375, -1.3916015625, -1.31109619140625, -1.2305908203125, -1.15008544921875, -1.069580078125, -0.98907470703125, -0.9085693359375, -0.82806396484375, -0.74755859375, -0.66705322265625, -0.5865478515625, -0.50604248046875, -0.425537109375, -0.34503173828125, -0.2645263671875, -0.18402099609375, -0.103515625, -0.02301025390625, 0.0574951171875, 0.13800048828125, 0.218505859375, 0.29901123046875, 0.3795166015625, 0.46002197265625, 0.54052734375, 0.62103271484375, 0.7015380859375, 0.78204345703125, 0.862548828125, 0.94305419921875, 1.0235595703125, 1.10406494140625, 1.1845703125, 1.26507568359375, 1.3455810546875, 1.42608642578125, 1.506591796875, 1.58709716796875, 1.6676025390625, 1.74810791015625, 1.82861328125, 1.90911865234375, 1.9896240234375, 2.07012939453125, 2.150634765625, 2.23114013671875, 2.3116455078125, 2.39215087890625, 2.47265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 4.0, 4.0, 19.0, 23.0, 33.0, 50.0, 45.0, 64.0, 76.0, 83.0, 87.0, 100.0, 82.0, 83.0, 77.0, 48.0, 35.0, 27.0, 30.0, 13.0, 12.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299560546875, -0.2916698455810547, -0.2837791442871094, -0.27588844299316406, -0.26799774169921875, -0.26010704040527344, -0.2522163391113281, -0.2443256378173828, -0.2364349365234375, -0.2285442352294922, -0.22065353393554688, -0.21276283264160156, -0.20487213134765625, -0.19698143005371094, -0.18909072875976562, -0.1812000274658203, -0.173309326171875, -0.1654186248779297, -0.15752792358398438, -0.14963722229003906, -0.14174652099609375, -0.13385581970214844, -0.12596511840820312, -0.11807441711425781, -0.1101837158203125, -0.10229301452636719, -0.09440231323242188, -0.08651161193847656, -0.07862091064453125, -0.07073020935058594, -0.06283950805664062, -0.05494880676269531, -0.04705810546875, -0.03916740417480469, -0.031276702880859375, -0.023386001586914062, -0.01549530029296875, -0.0076045989990234375, 0.000286102294921875, 0.008176803588867188, 0.0160675048828125, 0.023958206176757812, 0.031848907470703125, 0.03973960876464844, 0.04763031005859375, 0.05552101135253906, 0.06341171264648438, 0.07130241394042969, 0.079193115234375, 0.08708381652832031, 0.09497451782226562, 0.10286521911621094, 0.11075592041015625, 0.11864662170410156, 0.12653732299804688, 0.1344280242919922, 0.1423187255859375, 0.1502094268798828, 0.15810012817382812, 0.16599082946777344, 0.17388153076171875, 0.18177223205566406, 0.18966293334960938, 0.1975536346435547, 0.2054443359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 17.0, 21.0, 34.0, 61.0, 84.0, 119.0, 182.0, 322.0, 628.0, 1235.0, 2497.0, 5326.0, 13298.0, 38029.0, 131987.0, 443875.0, 291279.0, 78405.0, 24096.0, 9118.0, 3841.0, 1871.0, 923.0, 492.0, 267.0, 167.0, 91.0, 95.0, 47.0, 25.0, 23.0, 13.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8916015625, -0.8626480102539062, -0.8336944580078125, -0.8047409057617188, -0.775787353515625, -0.7468338012695312, -0.7178802490234375, -0.6889266967773438, -0.65997314453125, -0.6310195922851562, -0.6020660400390625, -0.5731124877929688, -0.544158935546875, -0.5152053833007812, -0.4862518310546875, -0.45729827880859375, -0.4283447265625, -0.39939117431640625, -0.3704376220703125, -0.34148406982421875, -0.312530517578125, -0.28357696533203125, -0.2546234130859375, -0.22566986083984375, -0.19671630859375, -0.16776275634765625, -0.1388092041015625, -0.10985565185546875, -0.080902099609375, -0.05194854736328125, -0.0229949951171875, 0.00595855712890625, 0.034912109375, 0.06386566162109375, 0.0928192138671875, 0.12177276611328125, 0.150726318359375, 0.17967987060546875, 0.2086334228515625, 0.23758697509765625, 0.26654052734375, 0.29549407958984375, 0.3244476318359375, 0.35340118408203125, 0.382354736328125, 0.41130828857421875, 0.4402618408203125, 0.46921539306640625, 0.4981689453125, 0.5271224975585938, 0.5560760498046875, 0.5850296020507812, 0.613983154296875, 0.6429367065429688, 0.6718902587890625, 0.7008438110351562, 0.72979736328125, 0.7587509155273438, 0.7877044677734375, 0.8166580200195312, 0.845611572265625, 0.8745651245117188, 0.9035186767578125, 0.9324722290039062, 0.96142578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 7.0, 10.0, 8.0, 18.0, 23.0, 21.0, 27.0, 28.0, 35.0, 33.0, 30.0, 46.0, 46.0, 43.0, 47.0, 42.0, 38.0, 39.0, 42.0, 47.0, 45.0, 38.0, 31.0, 32.0, 42.0, 18.0, 24.0, 22.0, 17.0, 19.0, 17.0, 4.0, 6.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5787887573242188, -0.5604095458984375, -0.5420303344726562, -0.523651123046875, -0.5052719116210938, -0.4868927001953125, -0.46851348876953125, -0.45013427734375, -0.43175506591796875, -0.4133758544921875, -0.39499664306640625, -0.376617431640625, -0.35823822021484375, -0.3398590087890625, -0.32147979736328125, -0.3031005859375, -0.28472137451171875, -0.2663421630859375, -0.24796295166015625, -0.229583740234375, -0.21120452880859375, -0.1928253173828125, -0.17444610595703125, -0.15606689453125, -0.13768768310546875, -0.1193084716796875, -0.10092926025390625, -0.082550048828125, -0.06417083740234375, -0.0457916259765625, -0.02741241455078125, -0.009033203125, 0.00934600830078125, 0.0277252197265625, 0.04610443115234375, 0.064483642578125, 0.08286285400390625, 0.1012420654296875, 0.11962127685546875, 0.13800048828125, 0.15637969970703125, 0.1747589111328125, 0.19313812255859375, 0.211517333984375, 0.22989654541015625, 0.2482757568359375, 0.26665496826171875, 0.2850341796875, 0.30341339111328125, 0.3217926025390625, 0.34017181396484375, 0.358551025390625, 0.37693023681640625, 0.3953094482421875, 0.41368865966796875, 0.43206787109375, 0.45044708251953125, 0.4688262939453125, 0.48720550537109375, 0.505584716796875, 0.5239639282226562, 0.5423431396484375, 0.5607223510742188, 0.5791015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 18.0, 28.0, 61.0, 81.0, 136.0, 218.0, 432.0, 1287.0, 5239.0, 33991.0, 735043.0, 252017.0, 15387.0, 2918.0, 857.0, 319.0, 182.0, 93.0, 71.0, 51.0, 37.0, 21.0, 12.0, 8.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.966796875, -0.9332427978515625, -0.899688720703125, -0.8661346435546875, -0.83258056640625, -0.7990264892578125, -0.765472412109375, -0.7319183349609375, -0.6983642578125, -0.6648101806640625, -0.631256103515625, -0.5977020263671875, -0.56414794921875, -0.5305938720703125, -0.497039794921875, -0.4634857177734375, -0.429931640625, -0.3963775634765625, -0.362823486328125, -0.3292694091796875, -0.29571533203125, -0.2621612548828125, -0.228607177734375, -0.1950531005859375, -0.1614990234375, -0.1279449462890625, -0.094390869140625, -0.0608367919921875, -0.02728271484375, 0.0062713623046875, 0.039825439453125, 0.0733795166015625, 0.10693359375, 0.1404876708984375, 0.174041748046875, 0.2075958251953125, 0.24114990234375, 0.2747039794921875, 0.308258056640625, 0.3418121337890625, 0.3753662109375, 0.4089202880859375, 0.442474365234375, 0.4760284423828125, 0.50958251953125, 0.5431365966796875, 0.576690673828125, 0.6102447509765625, 0.643798828125, 0.6773529052734375, 0.710906982421875, 0.7444610595703125, 0.77801513671875, 0.8115692138671875, 0.845123291015625, 0.8786773681640625, 0.9122314453125, 0.9457855224609375, 0.979339599609375, 1.0128936767578125, 1.04644775390625, 1.0800018310546875, 1.113555908203125, 1.1471099853515625, 1.1806640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 8.0, 9.0, 34.0, 62.0, 78.0, 100.0, 158.0, 144.0, 127.0, 91.0, 45.0, 34.0, 29.0, 17.0, 4.0, 9.0, 10.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00013001449406147003, -0.00012579932808876038, -0.00012158416211605072, -0.00011736899614334106, -0.00011315383017063141, -0.00010893866419792175, -0.0001047234982252121, -0.00010050833225250244, -9.629316627979279e-05, -9.207800030708313e-05, -8.786283433437347e-05, -8.364766836166382e-05, -7.943250238895416e-05, -7.521733641624451e-05, -7.100217044353485e-05, -6.67870044708252e-05, -6.257183849811554e-05, -5.8356672525405884e-05, -5.414150655269623e-05, -4.992634057998657e-05, -4.5711174607276917e-05, -4.149600863456726e-05, -3.7280842661857605e-05, -3.306567668914795e-05, -2.8850510716438293e-05, -2.4635344743728638e-05, -2.0420178771018982e-05, -1.6205012798309326e-05, -1.198984682559967e-05, -7.774680852890015e-06, -3.559514880180359e-06, 6.556510925292969e-07, 4.870817065238953e-06, 9.085983037948608e-06, 1.3301149010658264e-05, 1.751631498336792e-05, 2.1731480956077576e-05, 2.594664692878723e-05, 3.0161812901496887e-05, 3.437697887420654e-05, 3.85921448469162e-05, 4.2807310819625854e-05, 4.702247679233551e-05, 5.1237642765045166e-05, 5.545280873775482e-05, 5.966797471046448e-05, 6.388314068317413e-05, 6.809830665588379e-05, 7.231347262859344e-05, 7.65286386013031e-05, 8.074380457401276e-05, 8.495897054672241e-05, 8.917413651943207e-05, 9.338930249214172e-05, 9.760446846485138e-05, 0.00010181963443756104, 0.00010603480041027069, 0.00011024996638298035, 0.00011446513235569, 0.00011868029832839966, 0.00012289546430110931, 0.00012711063027381897, 0.00013132579624652863, 0.00013554096221923828]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 13.0, 18.0, 32.0, 49.0, 79.0, 152.0, 258.0, 816.0, 9416.0, 906999.0, 126899.0, 2865.0, 487.0, 202.0, 93.0, 73.0, 39.0, 32.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.088592529296875, -2.02679443359375, -1.964996337890625, -1.9031982421875, -1.841400146484375, -1.77960205078125, -1.717803955078125, -1.656005859375, -1.594207763671875, -1.53240966796875, -1.470611572265625, -1.4088134765625, -1.347015380859375, -1.28521728515625, -1.223419189453125, -1.16162109375, -1.099822998046875, -1.03802490234375, -0.976226806640625, -0.9144287109375, -0.852630615234375, -0.79083251953125, -0.729034423828125, -0.667236328125, -0.605438232421875, -0.54364013671875, -0.481842041015625, -0.4200439453125, -0.358245849609375, -0.29644775390625, -0.234649658203125, -0.1728515625, -0.111053466796875, -0.04925537109375, 0.012542724609375, 0.0743408203125, 0.136138916015625, 0.19793701171875, 0.259735107421875, 0.321533203125, 0.383331298828125, 0.44512939453125, 0.506927490234375, 0.5687255859375, 0.630523681640625, 0.69232177734375, 0.754119873046875, 0.81591796875, 0.877716064453125, 0.93951416015625, 1.001312255859375, 1.0631103515625, 1.124908447265625, 1.18670654296875, 1.248504638671875, 1.310302734375, 1.372100830078125, 1.43389892578125, 1.495697021484375, 1.5574951171875, 1.619293212890625, 1.68109130859375, 1.742889404296875, 1.8046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 11.0, 11.0, 22.0, 35.0, 59.0, 113.0, 164.0, 190.0, 152.0, 100.0, 56.0, 24.0, 21.0, 17.0, 7.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9722747802734375, -0.945526123046875, -0.9187774658203125, -0.89202880859375, -0.8652801513671875, -0.838531494140625, -0.8117828369140625, -0.7850341796875, -0.7582855224609375, -0.731536865234375, -0.7047882080078125, -0.67803955078125, -0.6512908935546875, -0.624542236328125, -0.5977935791015625, -0.571044921875, -0.5442962646484375, -0.517547607421875, -0.4907989501953125, -0.46405029296875, -0.4373016357421875, -0.410552978515625, -0.3838043212890625, -0.3570556640625, -0.3303070068359375, -0.303558349609375, -0.2768096923828125, -0.25006103515625, -0.2233123779296875, -0.196563720703125, -0.1698150634765625, -0.14306640625, -0.1163177490234375, -0.089569091796875, -0.0628204345703125, -0.03607177734375, -0.0093231201171875, 0.017425537109375, 0.0441741943359375, 0.0709228515625, 0.0976715087890625, 0.124420166015625, 0.1511688232421875, 0.17791748046875, 0.2046661376953125, 0.231414794921875, 0.2581634521484375, 0.284912109375, 0.3116607666015625, 0.338409423828125, 0.3651580810546875, 0.39190673828125, 0.4186553955078125, 0.445404052734375, 0.4721527099609375, 0.4989013671875, 0.5256500244140625, 0.552398681640625, 0.5791473388671875, 0.60589599609375, 0.6326446533203125, 0.659393310546875, 0.6861419677734375, 0.712890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 22.0, 42.0, 120.0, 276.0, 315.0, 149.0, 45.0, 28.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.204580307006836, -25.635066986083984, -25.065555572509766, -24.496042251586914, -23.926528930664062, -23.357017517089844, -22.787504196166992, -22.217992782592773, -21.648479461669922, -21.07896614074707, -20.50945472717285, -19.93994140625, -19.37042999267578, -18.80091667175293, -18.231403350830078, -17.66189193725586, -17.092378616333008, -16.522865295410156, -15.953353881835938, -15.383840560913086, -14.81432819366455, -14.244815826416016, -13.675302505493164, -13.105790138244629, -12.536277770996094, -11.966765403747559, -11.397253036499023, -10.827739715576172, -10.258227348327637, -9.688714981079102, -9.11920166015625, -8.549689292907715, -7.980177879333496, -7.410665512084961, -6.841152667999268, -6.271639823913574, -5.702127456665039, -5.132615089416504, -4.5631022453308105, -3.9935896396636963, -3.424077033996582, -2.8545644283294678, -2.2850518226623535, -1.7155392169952393, -1.146026611328125, -0.5765140056610107, -0.007001399993896484, 0.5625112056732178, 1.132023811340332, 1.7015364170074463, 2.2710490226745605, 2.840561628341675, 3.410074234008789, 3.9795868396759033, 4.549099445343018, 5.118612289428711, 5.688124656677246, 6.257637023925781, 6.827149868011475, 7.396662712097168, 7.966175079345703, 8.535687446594238, 9.105199813842773, 9.674713134765625, 10.24422550201416]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 14.0, 9.0, 17.0, 14.0, 23.0, 19.0, 13.0, 25.0, 20.0, 26.0, 25.0, 40.0, 35.0, 37.0, 35.0, 46.0, 37.0, 52.0, 46.0, 37.0, 41.0, 40.0, 25.0, 30.0, 28.0, 35.0, 30.0, 26.0, 19.0, 22.0, 21.0, 17.0, 18.0, 12.0, 13.0, 9.0, 15.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.975113868713379, -2.883923292160034, -2.7927327156066895, -2.7015419006347656, -2.610351324081421, -2.519160747528076, -2.4279701709747314, -2.3367795944213867, -2.245588779449463, -2.154398202896118, -2.0632076263427734, -1.9720169305801392, -1.8808262348175049, -1.7896356582641602, -1.6984450817108154, -1.6072543859481812, -1.5160638093948364, -1.4248732328414917, -1.3336825370788574, -1.2424919605255127, -1.1513012647628784, -1.0601106882095337, -0.9689200520515442, -0.8777294158935547, -0.7865387797355652, -0.6953481435775757, -0.6041575074195862, -0.5129668712615967, -0.42177626490592957, -0.33058562874794006, -0.23939502239227295, -0.14820438623428345, -0.057013750076293945, 0.03417687863111496, 0.12536750733852386, 0.21655812859535217, 0.3077487647533417, 0.3989394009113312, 0.4901300072669983, 0.5813206434249878, 0.6725112795829773, 0.7637019157409668, 0.8548925518989563, 0.9460831880569458, 1.0372737646102905, 1.1284644603729248, 1.2196550369262695, 1.3108456134796143, 1.4020363092422485, 1.4932268857955933, 1.5844175815582275, 1.6756081581115723, 1.7667988538742065, 1.8579894304275513, 1.9491801261901855, 2.0403707027435303, 2.131561279296875, 2.2227518558502197, 2.3139424324035645, 2.4051332473754883, 2.496323823928833, 2.5875144004821777, 2.6787049770355225, 2.769895553588867, 2.861086368560791]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 14.0, 8.0, 21.0, 11.0, 15.0, 31.0, 38.0, 55.0, 89.0, 140.0, 305.0, 710.0, 2496.0, 12883.0, 180267.0, 3948841.0, 40174.0, 5546.0, 1480.0, 595.0, 283.0, 142.0, 64.0, 30.0, 20.0, 9.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.930877685546875, -1.84417724609375, -1.757476806640625, -1.6707763671875, -1.584075927734375, -1.49737548828125, -1.410675048828125, -1.323974609375, -1.237274169921875, -1.15057373046875, -1.063873291015625, -0.9771728515625, -0.890472412109375, -0.80377197265625, -0.717071533203125, -0.63037109375, -0.543670654296875, -0.45697021484375, -0.370269775390625, -0.2835693359375, -0.196868896484375, -0.11016845703125, -0.023468017578125, 0.063232421875, 0.149932861328125, 0.23663330078125, 0.323333740234375, 0.4100341796875, 0.496734619140625, 0.58343505859375, 0.670135498046875, 0.7568359375, 0.843536376953125, 0.93023681640625, 1.016937255859375, 1.1036376953125, 1.190338134765625, 1.27703857421875, 1.363739013671875, 1.450439453125, 1.537139892578125, 1.62384033203125, 1.710540771484375, 1.7972412109375, 1.883941650390625, 1.97064208984375, 2.057342529296875, 2.14404296875, 2.230743408203125, 2.31744384765625, 2.404144287109375, 2.4908447265625, 2.577545166015625, 2.66424560546875, 2.750946044921875, 2.837646484375, 2.924346923828125, 3.01104736328125, 3.097747802734375, 3.1844482421875, 3.271148681640625, 3.35784912109375, 3.444549560546875, 3.53125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 11.0, 8.0, 23.0, 25.0, 37.0, 54.0, 44.0, 78.0, 77.0, 77.0, 95.0, 69.0, 85.0, 71.0, 61.0, 45.0, 41.0, 30.0, 21.0, 22.0, 10.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.2960948944091797, -0.2882347106933594, -0.28037452697753906, -0.27251434326171875, -0.26465415954589844, -0.2567939758300781, -0.2489337921142578, -0.2410736083984375, -0.2332134246826172, -0.22535324096679688, -0.21749305725097656, -0.20963287353515625, -0.20177268981933594, -0.19391250610351562, -0.1860523223876953, -0.178192138671875, -0.1703319549560547, -0.16247177124023438, -0.15461158752441406, -0.14675140380859375, -0.13889122009277344, -0.13103103637695312, -0.12317085266113281, -0.1153106689453125, -0.10745048522949219, -0.09959030151367188, -0.09173011779785156, -0.08386993408203125, -0.07600975036621094, -0.06814956665039062, -0.06028938293457031, -0.05242919921875, -0.04456901550292969, -0.036708831787109375, -0.028848648071289062, -0.02098846435546875, -0.013128280639648438, -0.005268096923828125, 0.0025920867919921875, 0.0104522705078125, 0.018312454223632812, 0.026172637939453125, 0.03403282165527344, 0.04189300537109375, 0.04975318908691406, 0.057613372802734375, 0.06547355651855469, 0.073333740234375, 0.08119392395019531, 0.08905410766601562, 0.09691429138183594, 0.10477447509765625, 0.11263465881347656, 0.12049484252929688, 0.1283550262451172, 0.1362152099609375, 0.1440753936767578, 0.15193557739257812, 0.15979576110839844, 0.16765594482421875, 0.17551612854003906, 0.18337631225585938, 0.1912364959716797, 0.1990966796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 8.0, 19.0, 22.0, 24.0, 37.0, 67.0, 136.0, 185.0, 354.0, 586.0, 1530.0, 6057.0, 66047.0, 4064033.0, 47192.0, 5155.0, 1394.0, 601.0, 301.0, 206.0, 101.0, 77.0, 37.0, 27.0, 22.0, 23.0, 15.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921875, -2.86981201171875, -2.7474365234375, -2.62506103515625, -2.502685546875, -2.38031005859375, -2.2579345703125, -2.13555908203125, -2.01318359375, -1.89080810546875, -1.7684326171875, -1.64605712890625, -1.523681640625, -1.40130615234375, -1.2789306640625, -1.15655517578125, -1.0341796875, -0.91180419921875, -0.7894287109375, -0.66705322265625, -0.544677734375, -0.42230224609375, -0.2999267578125, -0.17755126953125, -0.05517578125, 0.06719970703125, 0.1895751953125, 0.31195068359375, 0.434326171875, 0.55670166015625, 0.6790771484375, 0.80145263671875, 0.923828125, 1.04620361328125, 1.1685791015625, 1.29095458984375, 1.413330078125, 1.53570556640625, 1.6580810546875, 1.78045654296875, 1.90283203125, 2.02520751953125, 2.1475830078125, 2.26995849609375, 2.392333984375, 2.51470947265625, 2.6370849609375, 2.75946044921875, 2.8818359375, 3.00421142578125, 3.1265869140625, 3.24896240234375, 3.371337890625, 3.49371337890625, 3.6160888671875, 3.73846435546875, 3.86083984375, 3.98321533203125, 4.1055908203125, 4.22796630859375, 4.350341796875, 4.47271728515625, 4.5950927734375, 4.71746826171875, 4.83984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 17.0, 19.0, 45.0, 135.0, 515.0, 2798.0, 349.0, 101.0, 36.0, 19.0, 16.0, 10.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6344451904296875, -0.597991943359375, -0.5615386962890625, -0.52508544921875, -0.4886322021484375, -0.452178955078125, -0.4157257080078125, -0.3792724609375, -0.3428192138671875, -0.306365966796875, -0.2699127197265625, -0.23345947265625, -0.1970062255859375, -0.160552978515625, -0.1240997314453125, -0.087646484375, -0.0511932373046875, -0.014739990234375, 0.0217132568359375, 0.05816650390625, 0.0946197509765625, 0.131072998046875, 0.1675262451171875, 0.2039794921875, 0.2404327392578125, 0.276885986328125, 0.3133392333984375, 0.34979248046875, 0.3862457275390625, 0.422698974609375, 0.4591522216796875, 0.49560546875, 0.5320587158203125, 0.568511962890625, 0.6049652099609375, 0.64141845703125, 0.6778717041015625, 0.714324951171875, 0.7507781982421875, 0.7872314453125, 0.8236846923828125, 0.860137939453125, 0.8965911865234375, 0.93304443359375, 0.9694976806640625, 1.005950927734375, 1.0424041748046875, 1.078857421875, 1.1153106689453125, 1.151763916015625, 1.1882171630859375, 1.22467041015625, 1.2611236572265625, 1.297576904296875, 1.3340301513671875, 1.3704833984375, 1.4069366455078125, 1.443389892578125, 1.4798431396484375, 1.51629638671875, 1.5527496337890625, 1.589202880859375, 1.6256561279296875, 1.662109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 7.0, 9.0, 26.0, 64.0, 158.0, 261.0, 246.0, 141.0, 48.0, 22.0, 8.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.11191463470459, -8.899765968322754, -8.687617301940918, -8.475468635559082, -8.263320922851562, -8.051172256469727, -7.839023590087891, -7.626874923706055, -7.414726257324219, -7.202577590942383, -6.990428924560547, -6.778280735015869, -6.566132068634033, -6.353983402252197, -6.1418352127075195, -5.929686546325684, -5.717537879943848, -5.505389213562012, -5.293240547180176, -5.081092357635498, -4.868943691253662, -4.656795024871826, -4.444646835327148, -4.2324981689453125, -4.020349502563477, -3.8082008361816406, -3.596052408218384, -3.383903980255127, -3.171755313873291, -2.959606647491455, -2.7474582195281982, -2.5353097915649414, -2.3231611251831055, -2.1110124588012695, -1.8988640308380127, -1.6867154836654663, -1.47456693649292, -1.2624183893203735, -1.0502698421478271, -0.8381212949752808, -0.6259727478027344, -0.413824200630188, -0.2016756534576416, 0.010472893714904785, 0.22262144088745117, 0.43476998805999756, 0.646918535232544, 0.8590670824050903, 1.0712156295776367, 1.283364176750183, 1.4955127239227295, 1.7076612710952759, 1.9198098182678223, 2.131958484649658, 2.344106912612915, 2.556255340576172, 2.768404006958008, 2.9805526733398438, 3.1927011013031006, 3.4048495292663574, 3.6169981956481934, 3.8291468620300293, 4.041295051574707, 4.253443717956543, 4.465592384338379]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 14.0, 14.0, 23.0, 35.0, 53.0, 67.0, 84.0, 100.0, 111.0, 103.0, 107.0, 94.0, 73.0, 40.0, 26.0, 18.0, 11.0, 15.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.850165367126465, -4.724785327911377, -4.599405288696289, -4.474025249481201, -4.348645210266113, -4.223265647888184, -4.0978851318359375, -3.9725053310394287, -3.84712553024292, -3.721745491027832, -3.596365451812744, -3.4709854125976562, -3.3456056118011475, -3.2202255725860596, -3.0948455333709717, -2.969465494155884, -2.844085454940796, -2.718705415725708, -2.59332537651062, -2.4679455757141113, -2.3425655364990234, -2.2171854972839355, -2.0918054580688477, -1.9664254188537598, -1.8410454988479614, -1.7156654596328735, -1.5902855396270752, -1.4649055004119873, -1.3395254611968994, -1.214145541191101, -1.0887655019760132, -0.9633855223655701, -0.8380053043365479, -0.7126253247261047, -0.5872453451156616, -0.46186530590057373, -0.3364853262901306, -0.2111053466796875, -0.08572530746459961, 0.039654672145843506, 0.16503465175628662, 0.29041463136672974, 0.41579464077949524, 0.5411746501922607, 0.6665546298027039, 0.791934609413147, 0.9173146486282349, 1.0426945686340332, 1.168074607849121, 1.293454647064209, 1.4188345670700073, 1.5442146062850952, 1.6695945262908936, 1.7949745655059814, 1.9203546047210693, 2.0457346439361572, 2.171114444732666, 2.296494483947754, 2.421874523162842, 2.5472545623779297, 2.6726343631744385, 2.7980144023895264, 2.9233944416046143, 3.048774480819702, 3.17415452003479]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 13.0, 15.0, 19.0, 25.0, 46.0, 62.0, 124.0, 208.0, 420.0, 984.0, 3071.0, 14694.0, 166355.0, 762207.0, 86849.0, 9548.0, 2348.0, 778.0, 346.0, 157.0, 87.0, 63.0, 40.0, 25.0, 18.0, 16.0, 11.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.947479248046875, -2.86175537109375, -2.776031494140625, -2.6903076171875, -2.604583740234375, -2.51885986328125, -2.433135986328125, -2.347412109375, -2.261688232421875, -2.17596435546875, -2.090240478515625, -2.0045166015625, -1.918792724609375, -1.83306884765625, -1.747344970703125, -1.66162109375, -1.575897216796875, -1.49017333984375, -1.404449462890625, -1.3187255859375, -1.233001708984375, -1.14727783203125, -1.061553955078125, -0.975830078125, -0.890106201171875, -0.80438232421875, -0.718658447265625, -0.6329345703125, -0.547210693359375, -0.46148681640625, -0.375762939453125, -0.2900390625, -0.204315185546875, -0.11859130859375, -0.032867431640625, 0.0528564453125, 0.138580322265625, 0.22430419921875, 0.310028076171875, 0.395751953125, 0.481475830078125, 0.56719970703125, 0.652923583984375, 0.7386474609375, 0.824371337890625, 0.91009521484375, 0.995819091796875, 1.08154296875, 1.167266845703125, 1.25299072265625, 1.338714599609375, 1.4244384765625, 1.510162353515625, 1.59588623046875, 1.681610107421875, 1.767333984375, 1.853057861328125, 1.93878173828125, 2.024505615234375, 2.1102294921875, 2.195953369140625, 2.28167724609375, 2.367401123046875, 2.453125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 15.0, 12.0, 19.0, 23.0, 30.0, 60.0, 53.0, 83.0, 67.0, 88.0, 86.0, 73.0, 87.0, 68.0, 61.0, 40.0, 46.0, 30.0, 23.0, 15.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.3726539611816406, -0.36273956298828125, -0.3528251647949219, -0.3429107666015625, -0.3329963684082031, -0.32308197021484375, -0.3131675720214844, -0.303253173828125, -0.2933387756347656, -0.28342437744140625, -0.2735099792480469, -0.2635955810546875, -0.2536811828613281, -0.24376678466796875, -0.23385238647460938, -0.22393798828125, -0.21402359008789062, -0.20410919189453125, -0.19419479370117188, -0.1842803955078125, -0.17436599731445312, -0.16445159912109375, -0.15453720092773438, -0.144622802734375, -0.13470840454101562, -0.12479400634765625, -0.11487960815429688, -0.1049652099609375, -0.09505081176757812, -0.08513641357421875, -0.07522201538085938, -0.0653076171875, -0.055393218994140625, -0.04547882080078125, -0.035564422607421875, -0.0256500244140625, -0.015735626220703125, -0.00582122802734375, 0.004093170166015625, 0.014007568359375, 0.023921966552734375, 0.03383636474609375, 0.043750762939453125, 0.0536651611328125, 0.06357955932617188, 0.07349395751953125, 0.08340835571289062, 0.09332275390625, 0.10323715209960938, 0.11315155029296875, 0.12306594848632812, 0.1329803466796875, 0.14289474487304688, 0.15280914306640625, 0.16272354125976562, 0.172637939453125, 0.18255233764648438, 0.19246673583984375, 0.20238113403320312, 0.2122955322265625, 0.22220993041992188, 0.23212432861328125, 0.24203872680664062, 0.251953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 12.0, 13.0, 30.0, 35.0, 67.0, 92.0, 189.0, 383.0, 1014.0, 2782.0, 9084.0, 34981.0, 173434.0, 571225.0, 200864.0, 39348.0, 9979.0, 3099.0, 1033.0, 410.0, 221.0, 114.0, 49.0, 25.0, 20.0, 18.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4116973876953125, -1.368316650390625, -1.3249359130859375, -1.28155517578125, -1.2381744384765625, -1.194793701171875, -1.1514129638671875, -1.1080322265625, -1.0646514892578125, -1.021270751953125, -0.9778900146484375, -0.93450927734375, -0.8911285400390625, -0.847747802734375, -0.8043670654296875, -0.760986328125, -0.7176055908203125, -0.674224853515625, -0.6308441162109375, -0.58746337890625, -0.5440826416015625, -0.500701904296875, -0.4573211669921875, -0.4139404296875, -0.3705596923828125, -0.327178955078125, -0.2837982177734375, -0.24041748046875, -0.1970367431640625, -0.153656005859375, -0.1102752685546875, -0.06689453125, -0.0235137939453125, 0.019866943359375, 0.0632476806640625, 0.10662841796875, 0.1500091552734375, 0.193389892578125, 0.2367706298828125, 0.2801513671875, 0.3235321044921875, 0.366912841796875, 0.4102935791015625, 0.45367431640625, 0.4970550537109375, 0.540435791015625, 0.5838165283203125, 0.627197265625, 0.6705780029296875, 0.713958740234375, 0.7573394775390625, 0.80072021484375, 0.8441009521484375, 0.887481689453125, 0.9308624267578125, 0.9742431640625, 1.0176239013671875, 1.061004638671875, 1.1043853759765625, 1.14776611328125, 1.1911468505859375, 1.234527587890625, 1.2779083251953125, 1.3212890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 10.0, 12.0, 18.0, 14.0, 12.0, 21.0, 17.0, 30.0, 26.0, 39.0, 44.0, 36.0, 44.0, 45.0, 40.0, 45.0, 51.0, 36.0, 46.0, 36.0, 28.0, 30.0, 35.0, 28.0, 27.0, 30.0, 24.0, 15.0, 18.0, 23.0, 14.0, 6.0, 11.0, 12.0, 6.0, 6.0, 5.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.76171875, -0.7396316528320312, -0.7175445556640625, -0.6954574584960938, -0.673370361328125, -0.6512832641601562, -0.6291961669921875, -0.6071090698242188, -0.58502197265625, -0.5629348754882812, -0.5408477783203125, -0.5187606811523438, -0.496673583984375, -0.47458648681640625, -0.4524993896484375, -0.43041229248046875, -0.4083251953125, -0.38623809814453125, -0.3641510009765625, -0.34206390380859375, -0.319976806640625, -0.29788970947265625, -0.2758026123046875, -0.25371551513671875, -0.23162841796875, -0.20954132080078125, -0.1874542236328125, -0.16536712646484375, -0.143280029296875, -0.12119293212890625, -0.0991058349609375, -0.07701873779296875, -0.054931640625, -0.03284454345703125, -0.0107574462890625, 0.01132965087890625, 0.033416748046875, 0.05550384521484375, 0.0775909423828125, 0.09967803955078125, 0.12176513671875, 0.14385223388671875, 0.1659393310546875, 0.18802642822265625, 0.210113525390625, 0.23220062255859375, 0.2542877197265625, 0.27637481689453125, 0.2984619140625, 0.32054901123046875, 0.3426361083984375, 0.36472320556640625, 0.386810302734375, 0.40889739990234375, 0.4309844970703125, 0.45307159423828125, 0.47515869140625, 0.49724578857421875, 0.5193328857421875, 0.5414199829101562, 0.563507080078125, 0.5855941772460938, 0.6076812744140625, 0.6297683715820312, 0.65185546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 8.0, 3.0, 10.0, 18.0, 18.0, 21.0, 56.0, 82.0, 112.0, 216.0, 413.0, 852.0, 2164.0, 6427.0, 28299.0, 204575.0, 632986.0, 142223.0, 21325.0, 5288.0, 1758.0, 779.0, 388.0, 206.0, 116.0, 68.0, 51.0, 21.0, 19.0, 19.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5703125, -0.5487213134765625, -0.527130126953125, -0.5055389404296875, -0.48394775390625, -0.4623565673828125, -0.440765380859375, -0.4191741943359375, -0.3975830078125, -0.3759918212890625, -0.354400634765625, -0.3328094482421875, -0.31121826171875, -0.2896270751953125, -0.268035888671875, -0.2464447021484375, -0.224853515625, -0.2032623291015625, -0.181671142578125, -0.1600799560546875, -0.13848876953125, -0.1168975830078125, -0.095306396484375, -0.0737152099609375, -0.0521240234375, -0.0305328369140625, -0.008941650390625, 0.0126495361328125, 0.03424072265625, 0.0558319091796875, 0.077423095703125, 0.0990142822265625, 0.12060546875, 0.1421966552734375, 0.163787841796875, 0.1853790283203125, 0.20697021484375, 0.2285614013671875, 0.250152587890625, 0.2717437744140625, 0.2933349609375, 0.3149261474609375, 0.336517333984375, 0.3581085205078125, 0.37969970703125, 0.4012908935546875, 0.422882080078125, 0.4444732666015625, 0.466064453125, 0.4876556396484375, 0.509246826171875, 0.5308380126953125, 0.55242919921875, 0.5740203857421875, 0.595611572265625, 0.6172027587890625, 0.6387939453125, 0.6603851318359375, 0.681976318359375, 0.7035675048828125, 0.72515869140625, 0.7467498779296875, 0.768341064453125, 0.7899322509765625, 0.8115234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 15.0, 32.0, 48.0, 106.0, 161.0, 201.0, 161.0, 110.0, 46.0, 33.0, 22.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00025290995836257935, -0.00024618208408355713, -0.0002394542098045349, -0.0002327263355255127, -0.00022599846124649048, -0.00021927058696746826, -0.00021254271268844604, -0.00020581483840942383, -0.0001990869641304016, -0.0001923590898513794, -0.00018563121557235718, -0.00017890334129333496, -0.00017217546701431274, -0.00016544759273529053, -0.0001587197184562683, -0.0001519918441772461, -0.00014526396989822388, -0.00013853609561920166, -0.00013180822134017944, -0.00012508034706115723, -0.00011835247278213501, -0.00011162459850311279, -0.00010489672422409058, -9.816884994506836e-05, -9.144097566604614e-05, -8.471310138702393e-05, -7.798522710800171e-05, -7.125735282897949e-05, -6.452947854995728e-05, -5.780160427093506e-05, -5.107372999191284e-05, -4.4345855712890625e-05, -3.761798143386841e-05, -3.089010715484619e-05, -2.4162232875823975e-05, -1.7434358596801758e-05, -1.0706484317779541e-05, -3.978610038757324e-06, 2.7492642402648926e-06, 9.47713851928711e-06, 1.6205012798309326e-05, 2.2932887077331543e-05, 2.966076135635376e-05, 3.6388635635375977e-05, 4.311650991439819e-05, 4.984438419342041e-05, 5.657225847244263e-05, 6.330013275146484e-05, 7.002800703048706e-05, 7.675588130950928e-05, 8.34837555885315e-05, 9.021162986755371e-05, 9.693950414657593e-05, 0.00010366737842559814, 0.00011039525270462036, 0.00011712312698364258, 0.0001238510012626648, 0.000130578875541687, 0.00013730674982070923, 0.00014403462409973145, 0.00015076249837875366, 0.00015749037265777588, 0.0001642182469367981, 0.0001709461212158203]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 8.0, 25.0, 36.0, 75.0, 180.0, 395.0, 1146.0, 3876.0, 26347.0, 548749.0, 441185.0, 21310.0, 3443.0, 1033.0, 406.0, 160.0, 67.0, 42.0, 28.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1704788208007812, -1.1388092041015625, -1.1071395874023438, -1.075469970703125, -1.0438003540039062, -1.0121307373046875, -0.9804611206054688, -0.94879150390625, -0.9171218872070312, -0.8854522705078125, -0.8537826538085938, -0.822113037109375, -0.7904434204101562, -0.7587738037109375, -0.7271041870117188, -0.6954345703125, -0.6637649536132812, -0.6320953369140625, -0.6004257202148438, -0.568756103515625, -0.5370864868164062, -0.5054168701171875, -0.47374725341796875, -0.44207763671875, -0.41040802001953125, -0.3787384033203125, -0.34706878662109375, -0.315399169921875, -0.28372955322265625, -0.2520599365234375, -0.22039031982421875, -0.188720703125, -0.15705108642578125, -0.1253814697265625, -0.09371185302734375, -0.062042236328125, -0.03037261962890625, 0.0012969970703125, 0.03296661376953125, 0.06463623046875, 0.09630584716796875, 0.1279754638671875, 0.15964508056640625, 0.191314697265625, 0.22298431396484375, 0.2546539306640625, 0.28632354736328125, 0.3179931640625, 0.34966278076171875, 0.3813323974609375, 0.41300201416015625, 0.444671630859375, 0.47634124755859375, 0.5080108642578125, 0.5396804809570312, 0.57135009765625, 0.6030197143554688, 0.6346893310546875, 0.6663589477539062, 0.698028564453125, 0.7296981811523438, 0.7613677978515625, 0.7930374145507812, 0.82470703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 10.0, 9.0, 30.0, 24.0, 31.0, 40.0, 49.0, 69.0, 75.0, 85.0, 110.0, 96.0, 92.0, 71.0, 54.0, 42.0, 26.0, 22.0, 21.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.5025253295898438, -0.4879608154296875, -0.47339630126953125, -0.458831787109375, -0.44426727294921875, -0.4297027587890625, -0.41513824462890625, -0.40057373046875, -0.38600921630859375, -0.3714447021484375, -0.35688018798828125, -0.342315673828125, -0.32775115966796875, -0.3131866455078125, -0.29862213134765625, -0.2840576171875, -0.26949310302734375, -0.2549285888671875, -0.24036407470703125, -0.225799560546875, -0.21123504638671875, -0.1966705322265625, -0.18210601806640625, -0.16754150390625, -0.15297698974609375, -0.1384124755859375, -0.12384796142578125, -0.109283447265625, -0.09471893310546875, -0.0801544189453125, -0.06558990478515625, -0.051025390625, -0.03646087646484375, -0.0218963623046875, -0.00733184814453125, 0.007232666015625, 0.02179718017578125, 0.0363616943359375, 0.05092620849609375, 0.06549072265625, 0.08005523681640625, 0.0946197509765625, 0.10918426513671875, 0.123748779296875, 0.13831329345703125, 0.1528778076171875, 0.16744232177734375, 0.1820068359375, 0.19657135009765625, 0.2111358642578125, 0.22570037841796875, 0.240264892578125, 0.25482940673828125, 0.2693939208984375, 0.28395843505859375, 0.29852294921875, 0.31308746337890625, 0.3276519775390625, 0.34221649169921875, 0.356781005859375, 0.37134552001953125, 0.3859100341796875, 0.40047454833984375, 0.4150390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 26.0, 188.0, 628.0, 156.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.05990600585938, -70.73634338378906, -69.41277313232422, -68.0892105102539, -66.76564025878906, -65.44207763671875, -64.1185073852539, -62.794944763183594, -61.471378326416016, -60.14781188964844, -58.82424545288086, -57.50067901611328, -56.17711639404297, -54.85354995727539, -53.52998352050781, -52.206417083740234, -50.882850646972656, -49.55928421020508, -48.2357177734375, -46.91215133666992, -45.588584899902344, -44.26502227783203, -42.94145584106445, -41.617889404296875, -40.2943229675293, -38.97075653076172, -37.64719009399414, -36.32362365722656, -35.00006103515625, -33.67649459838867, -32.352928161621094, -31.029361724853516, -29.705791473388672, -28.382225036621094, -27.058658599853516, -25.73509407043457, -24.411527633666992, -23.087961196899414, -21.76439666748047, -20.44083023071289, -19.117263793945312, -17.793697357177734, -16.470130920410156, -15.146566390991211, -13.822999954223633, -12.499433517456055, -11.175868034362793, -9.852302551269531, -8.528736114501953, -7.205170154571533, -5.881604194641113, -4.558038234710693, -3.2344722747802734, -1.9109063148498535, -0.5873403549194336, 0.7362251281738281, 2.0597915649414062, 3.383357524871826, 4.706923484802246, 6.030489444732666, 7.354055404663086, 8.677621841430664, 10.001187324523926, 11.324752807617188, 12.648319244384766]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 6.0, 12.0, 14.0, 11.0, 22.0, 17.0, 22.0, 17.0, 24.0, 39.0, 26.0, 37.0, 39.0, 47.0, 39.0, 38.0, 53.0, 47.0, 45.0, 50.0, 33.0, 37.0, 25.0, 37.0, 28.0, 21.0, 28.0, 35.0, 23.0, 15.0, 18.0, 14.0, 16.0, 13.0, 8.0, 7.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11401104927063, -2.999189853668213, -2.884368419647217, -2.7695472240448, -2.6547257900238037, -2.5399045944213867, -2.4250831604003906, -2.3102619647979736, -2.1954407691955566, -2.0806195735931396, -1.9657981395721436, -1.8509769439697266, -1.7361555099487305, -1.6213343143463135, -1.506512999534607, -1.3916916847229004, -1.2768702507019043, -1.1620489358901978, -1.0472276210784912, -0.9324063658714294, -0.8175850510597229, -0.7027637362480164, -0.5879424810409546, -0.47312116622924805, -0.3582998514175415, -0.24347855150699615, -0.1286572515964508, -0.01383596658706665, 0.10098534822463989, 0.21580666303634644, 0.3306279182434082, 0.44544923305511475, 0.5602707862854004, 0.6750921010971069, 0.7899134159088135, 0.9047346711158752, 1.0195560455322266, 1.1343772411346436, 1.24919855594635, 1.3640198707580566, 1.4788411855697632, 1.5936625003814697, 1.7084838151931763, 1.8233051300048828, 1.9381263256072998, 2.052947759628296, 2.167768955230713, 2.282590389251709, 2.397411584854126, 2.512232780456543, 2.627054214477539, 2.741875410079956, 2.856696844100952, 2.971518039703369, 3.0863394737243652, 3.2011606693267822, 3.315981864929199, 3.430803060531616, 3.5456244945526123, 3.6604456901550293, 3.7752671241760254, 3.8900883197784424, 4.004909515380859, 4.1197309494018555, 4.234552383422852]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 2.0, 11.0, 8.0, 14.0, 18.0, 15.0, 25.0, 46.0, 39.0, 56.0, 114.0, 157.0, 264.0, 480.0, 926.0, 2157.0, 6016.0, 25216.0, 436443.0, 3673174.0, 36403.0, 7587.0, 2590.0, 1075.0, 589.0, 283.0, 201.0, 105.0, 82.0, 40.0, 33.0, 28.0, 13.0, 18.0, 7.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.634765625, -3.53936767578125, -3.4439697265625, -3.34857177734375, -3.253173828125, -3.15777587890625, -3.0623779296875, -2.96697998046875, -2.87158203125, -2.77618408203125, -2.6807861328125, -2.58538818359375, -2.489990234375, -2.39459228515625, -2.2991943359375, -2.20379638671875, -2.1083984375, -2.01300048828125, -1.9176025390625, -1.82220458984375, -1.726806640625, -1.63140869140625, -1.5360107421875, -1.44061279296875, -1.34521484375, -1.24981689453125, -1.1544189453125, -1.05902099609375, -0.963623046875, -0.86822509765625, -0.7728271484375, -0.67742919921875, -0.58203125, -0.48663330078125, -0.3912353515625, -0.29583740234375, -0.200439453125, -0.10504150390625, -0.0096435546875, 0.08575439453125, 0.18115234375, 0.27655029296875, 0.3719482421875, 0.46734619140625, 0.562744140625, 0.65814208984375, 0.7535400390625, 0.84893798828125, 0.9443359375, 1.03973388671875, 1.1351318359375, 1.23052978515625, 1.325927734375, 1.42132568359375, 1.5167236328125, 1.61212158203125, 1.70751953125, 1.80291748046875, 1.8983154296875, 1.99371337890625, 2.089111328125, 2.18450927734375, 2.2799072265625, 2.37530517578125, 2.470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 17.0, 24.0, 27.0, 29.0, 46.0, 60.0, 68.0, 61.0, 69.0, 79.0, 69.0, 75.0, 62.0, 76.0, 55.0, 44.0, 32.0, 32.0, 24.0, 14.0, 12.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.37567138671875, -0.3658447265625, -0.35601806640625, -0.34619140625, -0.33636474609375, -0.3265380859375, -0.31671142578125, -0.306884765625, -0.29705810546875, -0.2872314453125, -0.27740478515625, -0.267578125, -0.25775146484375, -0.2479248046875, -0.23809814453125, -0.228271484375, -0.21844482421875, -0.2086181640625, -0.19879150390625, -0.18896484375, -0.17913818359375, -0.1693115234375, -0.15948486328125, -0.149658203125, -0.13983154296875, -0.1300048828125, -0.12017822265625, -0.1103515625, -0.10052490234375, -0.0906982421875, -0.08087158203125, -0.071044921875, -0.06121826171875, -0.0513916015625, -0.04156494140625, -0.03173828125, -0.02191162109375, -0.0120849609375, -0.00225830078125, 0.007568359375, 0.01739501953125, 0.0272216796875, 0.03704833984375, 0.046875, 0.05670166015625, 0.0665283203125, 0.07635498046875, 0.086181640625, 0.09600830078125, 0.1058349609375, 0.11566162109375, 0.12548828125, 0.13531494140625, 0.1451416015625, 0.15496826171875, 0.164794921875, 0.17462158203125, 0.1844482421875, 0.19427490234375, 0.2041015625, 0.21392822265625, 0.2237548828125, 0.23358154296875, 0.243408203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 8.0, 9.0, 12.0, 20.0, 27.0, 45.0, 46.0, 59.0, 85.0, 116.0, 160.0, 202.0, 348.0, 662.0, 1313.0, 3200.0, 11866.0, 81589.0, 3901253.0, 167107.0, 18093.0, 4446.0, 1614.0, 749.0, 387.0, 239.0, 182.0, 103.0, 92.0, 71.0, 50.0, 34.0, 22.0, 23.0, 14.0, 16.0, 3.0, 5.0, 1.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.27734375, -3.1878662109375, -3.098388671875, -3.0089111328125, -2.91943359375, -2.8299560546875, -2.740478515625, -2.6510009765625, -2.5615234375, -2.4720458984375, -2.382568359375, -2.2930908203125, -2.20361328125, -2.1141357421875, -2.024658203125, -1.9351806640625, -1.845703125, -1.7562255859375, -1.666748046875, -1.5772705078125, -1.48779296875, -1.3983154296875, -1.308837890625, -1.2193603515625, -1.1298828125, -1.0404052734375, -0.950927734375, -0.8614501953125, -0.77197265625, -0.6824951171875, -0.593017578125, -0.5035400390625, -0.4140625, -0.3245849609375, -0.235107421875, -0.1456298828125, -0.05615234375, 0.0333251953125, 0.122802734375, 0.2122802734375, 0.3017578125, 0.3912353515625, 0.480712890625, 0.5701904296875, 0.65966796875, 0.7491455078125, 0.838623046875, 0.9281005859375, 1.017578125, 1.1070556640625, 1.196533203125, 1.2860107421875, 1.37548828125, 1.4649658203125, 1.554443359375, 1.6439208984375, 1.7333984375, 1.8228759765625, 1.912353515625, 2.0018310546875, 2.09130859375, 2.1807861328125, 2.270263671875, 2.3597412109375, 2.44921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 17.0, 31.0, 49.0, 140.0, 831.0, 2596.0, 209.0, 90.0, 36.0, 24.0, 15.0, 8.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.105743408203125, -1.06500244140625, -1.024261474609375, -0.9835205078125, -0.942779541015625, -0.90203857421875, -0.861297607421875, -0.820556640625, -0.779815673828125, -0.73907470703125, -0.698333740234375, -0.6575927734375, -0.616851806640625, -0.57611083984375, -0.535369873046875, -0.49462890625, -0.453887939453125, -0.41314697265625, -0.372406005859375, -0.3316650390625, -0.290924072265625, -0.25018310546875, -0.209442138671875, -0.168701171875, -0.127960205078125, -0.08721923828125, -0.046478271484375, -0.0057373046875, 0.035003662109375, 0.07574462890625, 0.116485595703125, 0.1572265625, 0.197967529296875, 0.23870849609375, 0.279449462890625, 0.3201904296875, 0.360931396484375, 0.40167236328125, 0.442413330078125, 0.483154296875, 0.523895263671875, 0.56463623046875, 0.605377197265625, 0.6461181640625, 0.686859130859375, 0.72760009765625, 0.768341064453125, 0.80908203125, 0.849822998046875, 0.89056396484375, 0.931304931640625, 0.9720458984375, 1.012786865234375, 1.05352783203125, 1.094268798828125, 1.135009765625, 1.175750732421875, 1.21649169921875, 1.257232666015625, 1.2979736328125, 1.338714599609375, 1.37945556640625, 1.420196533203125, 1.4609375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 35.0, 84.0, 164.0, 297.0, 231.0, 106.0, 38.0, 21.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.816176414489746, -9.580138206481934, -9.344099998474121, -9.108060836791992, -8.87202262878418, -8.635984420776367, -8.399946212768555, -8.163908004760742, -7.92786979675293, -7.691831588745117, -7.4557929039001465, -7.219754695892334, -6.9837164878845215, -6.747677803039551, -6.511639595031738, -6.275601387023926, -6.039562702178955, -5.803524494171143, -5.567485809326172, -5.331447601318359, -5.095409393310547, -4.859371185302734, -4.623332500457764, -4.387294292449951, -4.1512556076049805, -3.915217161178589, -3.6791789531707764, -3.4431405067443848, -3.2071022987365723, -2.9710638523101807, -2.735025405883789, -2.4989871978759766, -2.262948513031006, -2.0269100666046143, -1.7908718585968018, -1.5548334121704102, -1.318795084953308, -1.082756757736206, -0.8467183113098145, -0.6106799840927124, -0.37464165687561035, -0.1386032998561859, 0.09743505716323853, 0.33347344398498535, 0.5695117712020874, 0.8055500984191895, 1.041588544845581, 1.277626872062683, 1.5136651992797852, 1.7497035264968872, 1.9857418537139893, 2.221780300140381, 2.4578185081481934, 2.693856954574585, 2.9298954010009766, 3.165933609008789, 3.4019720554351807, 3.6380105018615723, 3.8740487098693848, 4.1100873947143555, 4.346125602722168, 4.5821638107299805, 4.818202018737793, 5.054240703582764, 5.290278911590576]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 12.0, 10.0, 19.0, 46.0, 60.0, 56.0, 77.0, 97.0, 84.0, 86.0, 87.0, 86.0, 69.0, 58.0, 48.0, 26.0, 22.0, 18.0, 13.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4029347896575928, -3.2981135845184326, -3.1932923793792725, -3.0884711742401123, -2.983649969100952, -2.878828763961792, -2.774007558822632, -2.6691863536834717, -2.5643651485443115, -2.4595439434051514, -2.354722738265991, -2.249901533126831, -2.145080327987671, -2.0402591228485107, -1.9354379177093506, -1.8306167125701904, -1.7257956266403198, -1.6209744215011597, -1.5161532163619995, -1.4113320112228394, -1.3065108060836792, -1.2016897201538086, -1.0968685150146484, -0.9920472502708435, -0.8872260451316833, -0.7824048399925232, -0.677583634853363, -0.5727624893188477, -0.4679412543773651, -0.36312007904052734, -0.2582988739013672, -0.15347766876220703, -0.048656463623046875, 0.056164734065532684, 0.16098593175411224, 0.2658071219921112, 0.37062832713127136, 0.47544950246810913, 0.5802707076072693, 0.6850919127464294, 0.7899131178855896, 0.8947343230247498, 0.9995555281639099, 1.1043766736984253, 1.2091978788375854, 1.3140190839767456, 1.4188402891159058, 1.523661494255066, 1.628482699394226, 1.7333039045333862, 1.8381251096725464, 1.9429463148117065, 2.047767400741577, 2.1525886058807373, 2.2574098110198975, 2.3622310161590576, 2.4670522212982178, 2.571873426437378, 2.676694631576538, 2.7815158367156982, 2.8863370418548584, 2.9911582469940186, 3.0959794521331787, 3.200800657272339, 3.305621862411499]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 8.0, 13.0, 10.0, 25.0, 31.0, 63.0, 51.0, 90.0, 135.0, 203.0, 310.0, 493.0, 968.0, 1877.0, 4108.0, 9721.0, 27333.0, 92556.0, 334862.0, 400888.0, 119885.0, 33660.0, 11614.0, 4798.0, 2086.0, 1137.0, 569.0, 349.0, 228.0, 142.0, 91.0, 69.0, 58.0, 21.0, 25.0, 13.0, 15.0, 13.0, 7.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.6024169921875, -1.552490234375, -1.5025634765625, -1.45263671875, -1.4027099609375, -1.352783203125, -1.3028564453125, -1.2529296875, -1.2030029296875, -1.153076171875, -1.1031494140625, -1.05322265625, -1.0032958984375, -0.953369140625, -0.9034423828125, -0.853515625, -0.8035888671875, -0.753662109375, -0.7037353515625, -0.65380859375, -0.6038818359375, -0.553955078125, -0.5040283203125, -0.4541015625, -0.4041748046875, -0.354248046875, -0.3043212890625, -0.25439453125, -0.2044677734375, -0.154541015625, -0.1046142578125, -0.0546875, -0.0047607421875, 0.045166015625, 0.0950927734375, 0.14501953125, 0.1949462890625, 0.244873046875, 0.2947998046875, 0.3447265625, 0.3946533203125, 0.444580078125, 0.4945068359375, 0.54443359375, 0.5943603515625, 0.644287109375, 0.6942138671875, 0.744140625, 0.7940673828125, 0.843994140625, 0.8939208984375, 0.94384765625, 0.9937744140625, 1.043701171875, 1.0936279296875, 1.1435546875, 1.1934814453125, 1.243408203125, 1.2933349609375, 1.34326171875, 1.3931884765625, 1.443115234375, 1.4930419921875, 1.54296875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 9.0, 20.0, 26.0, 18.0, 38.0, 46.0, 49.0, 54.0, 61.0, 75.0, 82.0, 94.0, 81.0, 70.0, 62.0, 52.0, 38.0, 28.0, 30.0, 27.0, 17.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.43189239501953125, -0.4199371337890625, -0.40798187255859375, -0.396026611328125, -0.38407135009765625, -0.3721160888671875, -0.36016082763671875, -0.34820556640625, -0.33625030517578125, -0.3242950439453125, -0.31233978271484375, -0.300384521484375, -0.28842926025390625, -0.2764739990234375, -0.26451873779296875, -0.2525634765625, -0.24060821533203125, -0.2286529541015625, -0.21669769287109375, -0.204742431640625, -0.19278717041015625, -0.1808319091796875, -0.16887664794921875, -0.15692138671875, -0.14496612548828125, -0.1330108642578125, -0.12105560302734375, -0.109100341796875, -0.09714508056640625, -0.0851898193359375, -0.07323455810546875, -0.061279296875, -0.04932403564453125, -0.0373687744140625, -0.02541351318359375, -0.013458251953125, -0.00150299072265625, 0.0104522705078125, 0.02240753173828125, 0.03436279296875, 0.04631805419921875, 0.0582733154296875, 0.07022857666015625, 0.082183837890625, 0.09413909912109375, 0.1060943603515625, 0.11804962158203125, 0.1300048828125, 0.14196014404296875, 0.1539154052734375, 0.16587066650390625, 0.177825927734375, 0.18978118896484375, 0.2017364501953125, 0.21369171142578125, 0.22564697265625, 0.23760223388671875, 0.2495574951171875, 0.26151275634765625, 0.273468017578125, 0.28542327880859375, 0.2973785400390625, 0.30933380126953125, 0.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 25.0, 26.0, 30.0, 46.0, 58.0, 79.0, 118.0, 187.0, 278.0, 373.0, 608.0, 1089.0, 1731.0, 3423.0, 7123.0, 16398.0, 41049.0, 113093.0, 290814.0, 336069.0, 145252.0, 52198.0, 20162.0, 8644.0, 4121.0, 2164.0, 1199.0, 796.0, 425.0, 300.0, 196.0, 146.0, 88.0, 67.0, 45.0, 24.0, 18.0, 18.0, 13.0, 14.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.9765625, -0.9461593627929688, -0.9157562255859375, -0.8853530883789062, -0.854949951171875, -0.8245468139648438, -0.7941436767578125, -0.7637405395507812, -0.73333740234375, -0.7029342651367188, -0.6725311279296875, -0.6421279907226562, -0.611724853515625, -0.5813217163085938, -0.5509185791015625, -0.5205154418945312, -0.4901123046875, -0.45970916748046875, -0.4293060302734375, -0.39890289306640625, -0.368499755859375, -0.33809661865234375, -0.3076934814453125, -0.27729034423828125, -0.24688720703125, -0.21648406982421875, -0.1860809326171875, -0.15567779541015625, -0.125274658203125, -0.09487152099609375, -0.0644683837890625, -0.03406524658203125, -0.003662109375, 0.02674102783203125, 0.0571441650390625, 0.08754730224609375, 0.117950439453125, 0.14835357666015625, 0.1787567138671875, 0.20915985107421875, 0.23956298828125, 0.26996612548828125, 0.3003692626953125, 0.33077239990234375, 0.361175537109375, 0.39157867431640625, 0.4219818115234375, 0.45238494873046875, 0.4827880859375, 0.5131912231445312, 0.5435943603515625, 0.5739974975585938, 0.604400634765625, 0.6348037719726562, 0.6652069091796875, 0.6956100463867188, 0.72601318359375, 0.7564163208007812, 0.7868194580078125, 0.8172225952148438, 0.847625732421875, 0.8780288696289062, 0.9084320068359375, 0.9388351440429688, 0.96923828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 5.0, 9.0, 10.0, 12.0, 18.0, 17.0, 32.0, 20.0, 34.0, 37.0, 24.0, 37.0, 49.0, 38.0, 51.0, 44.0, 50.0, 46.0, 55.0, 62.0, 50.0, 35.0, 43.0, 40.0, 34.0, 28.0, 23.0, 15.0, 20.0, 14.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.208984375, -1.1733856201171875, -1.137786865234375, -1.1021881103515625, -1.06658935546875, -1.0309906005859375, -0.995391845703125, -0.9597930908203125, -0.9241943359375, -0.8885955810546875, -0.852996826171875, -0.8173980712890625, -0.78179931640625, -0.7462005615234375, -0.710601806640625, -0.6750030517578125, -0.639404296875, -0.6038055419921875, -0.568206787109375, -0.5326080322265625, -0.49700927734375, -0.4614105224609375, -0.425811767578125, -0.3902130126953125, -0.3546142578125, -0.3190155029296875, -0.283416748046875, -0.2478179931640625, -0.21221923828125, -0.1766204833984375, -0.141021728515625, -0.1054229736328125, -0.06982421875, -0.0342254638671875, 0.001373291015625, 0.0369720458984375, 0.07257080078125, 0.1081695556640625, 0.143768310546875, 0.1793670654296875, 0.2149658203125, 0.2505645751953125, 0.286163330078125, 0.3217620849609375, 0.35736083984375, 0.3929595947265625, 0.428558349609375, 0.4641571044921875, 0.499755859375, 0.5353546142578125, 0.570953369140625, 0.6065521240234375, 0.64215087890625, 0.6777496337890625, 0.713348388671875, 0.7489471435546875, 0.7845458984375, 0.8201446533203125, 0.855743408203125, 0.8913421630859375, 0.92694091796875, 0.9625396728515625, 0.998138427734375, 1.0337371826171875, 1.0693359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 5.0, 19.0, 29.0, 31.0, 61.0, 95.0, 171.0, 354.0, 809.0, 2305.0, 10504.0, 112622.0, 795024.0, 112131.0, 10501.0, 2337.0, 785.0, 345.0, 167.0, 104.0, 52.0, 34.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8585052490234375, -0.818572998046875, -0.7786407470703125, -0.73870849609375, -0.6987762451171875, -0.658843994140625, -0.6189117431640625, -0.5789794921875, -0.5390472412109375, -0.499114990234375, -0.4591827392578125, -0.41925048828125, -0.3793182373046875, -0.339385986328125, -0.2994537353515625, -0.259521484375, -0.2195892333984375, -0.179656982421875, -0.1397247314453125, -0.09979248046875, -0.0598602294921875, -0.019927978515625, 0.0200042724609375, 0.0599365234375, 0.0998687744140625, 0.139801025390625, 0.1797332763671875, 0.21966552734375, 0.2595977783203125, 0.299530029296875, 0.3394622802734375, 0.37939453125, 0.4193267822265625, 0.459259033203125, 0.4991912841796875, 0.53912353515625, 0.5790557861328125, 0.618988037109375, 0.6589202880859375, 0.6988525390625, 0.7387847900390625, 0.778717041015625, 0.8186492919921875, 0.85858154296875, 0.8985137939453125, 0.938446044921875, 0.9783782958984375, 1.018310546875, 1.0582427978515625, 1.098175048828125, 1.1381072998046875, 1.17803955078125, 1.2179718017578125, 1.257904052734375, 1.2978363037109375, 1.3377685546875, 1.3777008056640625, 1.417633056640625, 1.4575653076171875, 1.49749755859375, 1.5374298095703125, 1.577362060546875, 1.6172943115234375, 1.6572265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 4.0, 11.0, 13.0, 26.0, 35.0, 35.0, 48.0, 74.0, 77.0, 81.0, 100.0, 103.0, 80.0, 71.0, 54.0, 40.0, 32.0, 34.0, 19.0, 11.0, 13.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011652708053588867, -0.00011247489601373672, -0.00010842271149158478, -0.00010437052696943283, -0.00010031834244728088, -9.626615792512894e-05, -9.221397340297699e-05, -8.816178888082504e-05, -8.41096043586731e-05, -8.005741983652115e-05, -7.60052353143692e-05, -7.195305079221725e-05, -6.790086627006531e-05, -6.384868174791336e-05, -5.9796497225761414e-05, -5.5744312703609467e-05, -5.169212818145752e-05, -4.763994365930557e-05, -4.3587759137153625e-05, -3.953557461500168e-05, -3.548339009284973e-05, -3.1431205570697784e-05, -2.7379021048545837e-05, -2.332683652639389e-05, -1.9274652004241943e-05, -1.5222467482089996e-05, -1.117028295993805e-05, -7.118098437786102e-06, -3.0659139156341553e-06, 9.862706065177917e-07, 5.038455128669739e-06, 9.090639650821686e-06, 1.3142824172973633e-05, 1.719500869512558e-05, 2.1247193217277527e-05, 2.5299377739429474e-05, 2.935156226158142e-05, 3.340374678373337e-05, 3.7455931305885315e-05, 4.150811582803726e-05, 4.556030035018921e-05, 4.9612484872341156e-05, 5.36646693944931e-05, 5.771685391664505e-05, 6.1769038438797e-05, 6.582122296094894e-05, 6.987340748310089e-05, 7.392559200525284e-05, 7.797777652740479e-05, 8.202996104955673e-05, 8.608214557170868e-05, 9.013433009386063e-05, 9.418651461601257e-05, 9.823869913816452e-05, 0.00010229088366031647, 0.00010634306818246841, 0.00011039525270462036, 0.00011444743722677231, 0.00011849962174892426, 0.0001225518062710762, 0.00012660399079322815, 0.0001306561753153801, 0.00013470835983753204, 0.000138760544359684, 0.00014281272888183594]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 23.0, 25.0, 33.0, 58.0, 117.0, 192.0, 412.0, 836.0, 2035.0, 5752.0, 18874.0, 82765.0, 395586.0, 420713.0, 90853.0, 20282.0, 6018.0, 2170.0, 884.0, 418.0, 210.0, 117.0, 64.0, 38.0, 14.0, 14.0, 11.0, 11.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5709381103515625, -0.548126220703125, -0.5253143310546875, -0.50250244140625, -0.4796905517578125, -0.456878662109375, -0.4340667724609375, -0.4112548828125, -0.3884429931640625, -0.365631103515625, -0.3428192138671875, -0.32000732421875, -0.2971954345703125, -0.274383544921875, -0.2515716552734375, -0.228759765625, -0.2059478759765625, -0.183135986328125, -0.1603240966796875, -0.13751220703125, -0.1147003173828125, -0.091888427734375, -0.0690765380859375, -0.0462646484375, -0.0234527587890625, -0.000640869140625, 0.0221710205078125, 0.04498291015625, 0.0677947998046875, 0.090606689453125, 0.1134185791015625, 0.13623046875, 0.1590423583984375, 0.181854248046875, 0.2046661376953125, 0.22747802734375, 0.2502899169921875, 0.273101806640625, 0.2959136962890625, 0.3187255859375, 0.3415374755859375, 0.364349365234375, 0.3871612548828125, 0.40997314453125, 0.4327850341796875, 0.455596923828125, 0.4784088134765625, 0.501220703125, 0.5240325927734375, 0.546844482421875, 0.5696563720703125, 0.59246826171875, 0.6152801513671875, 0.638092041015625, 0.6609039306640625, 0.6837158203125, 0.7065277099609375, 0.729339599609375, 0.7521514892578125, 0.77496337890625, 0.7977752685546875, 0.820587158203125, 0.8433990478515625, 0.8662109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 15.0, 16.0, 11.0, 17.0, 23.0, 24.0, 36.0, 52.0, 63.0, 55.0, 71.0, 80.0, 70.0, 83.0, 66.0, 60.0, 52.0, 30.0, 40.0, 23.0, 21.0, 11.0, 18.0, 16.0, 7.0, 5.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.5532302856445312, -0.5312652587890625, -0.5093002319335938, -0.487335205078125, -0.46537017822265625, -0.4434051513671875, -0.42144012451171875, -0.39947509765625, -0.37751007080078125, -0.3555450439453125, -0.33358001708984375, -0.311614990234375, -0.28964996337890625, -0.2676849365234375, -0.24571990966796875, -0.2237548828125, -0.20178985595703125, -0.1798248291015625, -0.15785980224609375, -0.135894775390625, -0.11392974853515625, -0.0919647216796875, -0.06999969482421875, -0.04803466796875, -0.02606964111328125, -0.0041046142578125, 0.01786041259765625, 0.039825439453125, 0.06179046630859375, 0.0837554931640625, 0.10572052001953125, 0.127685546875, 0.14965057373046875, 0.1716156005859375, 0.19358062744140625, 0.215545654296875, 0.23751068115234375, 0.2594757080078125, 0.28144073486328125, 0.30340576171875, 0.32537078857421875, 0.3473358154296875, 0.36930084228515625, 0.391265869140625, 0.41323089599609375, 0.4351959228515625, 0.45716094970703125, 0.4791259765625, 0.5010910034179688, 0.5230560302734375, 0.5450210571289062, 0.566986083984375, 0.5889511108398438, 0.6109161376953125, 0.6328811645507812, 0.65484619140625, 0.6768112182617188, 0.6987762451171875, 0.7207412719726562, 0.742706298828125, 0.7646713256835938, 0.7866363525390625, 0.8086013793945312, 0.83056640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 9.0, 27.0, 44.0, 103.0, 142.0, 183.0, 198.0, 120.0, 80.0, 41.0, 22.0, 16.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37784194946289, -17.83738136291504, -17.296920776367188, -16.756460189819336, -16.215999603271484, -15.675539016723633, -15.135077476501465, -14.594616889953613, -14.054156303405762, -13.51369571685791, -12.973235130310059, -12.432774543762207, -11.892313003540039, -11.351852416992188, -10.811391830444336, -10.270931243896484, -9.730470657348633, -9.190010070800781, -8.64954948425293, -8.109088897705078, -7.568627834320068, -7.028167247772217, -6.487706184387207, -5.9472455978393555, -5.406785011291504, -4.866324424743652, -4.325863838195801, -3.785402774810791, -3.2449421882629395, -2.704481601715088, -2.1640207767486572, -1.6235599517822266, -1.083099365234375, -0.5426386594772339, -0.0021779537200927734, 0.5382827520370483, 1.0787434577941895, 1.619204044342041, 2.1596648693084717, 2.7001256942749023, 3.240586280822754, 3.7810468673706055, 4.321507453918457, 4.861968517303467, 5.402429103851318, 5.94288969039917, 6.48335075378418, 7.023811340332031, 7.564271926879883, 8.104732513427734, 8.645193099975586, 9.185653686523438, 9.726114273071289, 10.26657485961914, 10.807036399841309, 11.34749698638916, 11.887957572937012, 12.428418159484863, 12.968878746032715, 13.509339332580566, 14.049800872802734, 14.590261459350586, 15.130722045898438, 15.671182632446289, 16.21164321899414]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 8.0, 2.0, 3.0, 12.0, 14.0, 18.0, 13.0, 15.0, 19.0, 28.0, 30.0, 30.0, 39.0, 33.0, 49.0, 32.0, 35.0, 44.0, 37.0, 51.0, 42.0, 42.0, 39.0, 40.0, 33.0, 32.0, 26.0, 34.0, 22.0, 26.0, 24.0, 17.0, 25.0, 12.0, 12.0, 10.0, 12.0, 6.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.618541717529297, -4.451461315155029, -4.2843804359436035, -4.117300033569336, -3.9502196311950684, -3.7831389904022217, -3.616058349609375, -3.4489779472351074, -3.2818973064422607, -3.114816665649414, -2.9477362632751465, -2.7806556224823, -2.613574981689453, -2.4464945793151855, -2.279413938522339, -2.112333297729492, -1.9452528953552246, -1.7781723737716675, -1.6110918521881104, -1.4440112113952637, -1.2769306898117065, -1.1098501682281494, -0.9427695274353027, -0.7756890058517456, -0.6086084842681885, -0.44152793288230896, -0.27444738149642944, -0.10736680030822754, 0.05971372127532959, 0.22679424285888672, 0.3938748836517334, 0.5609554052352905, 0.7280359268188477, 0.8951164484024048, 1.062196969985962, 1.2292776107788086, 1.3963581323623657, 1.5634386539459229, 1.7305192947387695, 1.8975998163223267, 2.064680337905884, 2.2317609786987305, 2.398841381072998, 2.5659220218658447, 2.7330026626586914, 2.900083065032959, 3.0671637058258057, 3.2342443466186523, 3.40132474899292, 3.5684053897857666, 3.735485792160034, 3.902566432952881, 4.069646835327148, 4.236727714538574, 4.403808116912842, 4.570888519287109, 4.737969398498535, 4.905049800872803, 5.0721306800842285, 5.239211082458496, 5.406291484832764, 5.573371887207031, 5.740452766418457, 5.907533168792725, 6.074613571166992]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 11.0, 14.0, 22.0, 27.0, 33.0, 37.0, 80.0, 120.0, 186.0, 397.0, 903.0, 2534.0, 9410.0, 54807.0, 3906856.0, 193248.0, 18314.0, 4375.0, 1566.0, 664.0, 298.0, 158.0, 78.0, 52.0, 31.0, 17.0, 10.0, 10.0, 7.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.4149169921875, -4.294677734375, -4.1744384765625, -4.05419921875, -3.9339599609375, -3.813720703125, -3.6934814453125, -3.5732421875, -3.4530029296875, -3.332763671875, -3.2125244140625, -3.09228515625, -2.9720458984375, -2.851806640625, -2.7315673828125, -2.611328125, -2.4910888671875, -2.370849609375, -2.2506103515625, -2.13037109375, -2.0101318359375, -1.889892578125, -1.7696533203125, -1.6494140625, -1.5291748046875, -1.408935546875, -1.2886962890625, -1.16845703125, -1.0482177734375, -0.927978515625, -0.8077392578125, -0.6875, -0.5672607421875, -0.447021484375, -0.3267822265625, -0.20654296875, -0.0863037109375, 0.033935546875, 0.1541748046875, 0.2744140625, 0.3946533203125, 0.514892578125, 0.6351318359375, 0.75537109375, 0.8756103515625, 0.995849609375, 1.1160888671875, 1.236328125, 1.3565673828125, 1.476806640625, 1.5970458984375, 1.71728515625, 1.8375244140625, 1.957763671875, 2.0780029296875, 2.1982421875, 2.3184814453125, 2.438720703125, 2.5589599609375, 2.67919921875, 2.7994384765625, 2.919677734375, 3.0399169921875, 3.16015625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 11.0, 18.0, 35.0, 33.0, 37.0, 51.0, 71.0, 67.0, 72.0, 69.0, 86.0, 81.0, 70.0, 54.0, 42.0, 42.0, 39.0, 26.0, 26.0, 18.0, 17.0, 12.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.473388671875, -0.46105194091796875, -0.4487152099609375, -0.43637847900390625, -0.424041748046875, -0.41170501708984375, -0.3993682861328125, -0.38703155517578125, -0.37469482421875, -0.36235809326171875, -0.3500213623046875, -0.33768463134765625, -0.325347900390625, -0.31301116943359375, -0.3006744384765625, -0.28833770751953125, -0.2760009765625, -0.26366424560546875, -0.2513275146484375, -0.23899078369140625, -0.226654052734375, -0.21431732177734375, -0.2019805908203125, -0.18964385986328125, -0.17730712890625, -0.16497039794921875, -0.1526336669921875, -0.14029693603515625, -0.127960205078125, -0.11562347412109375, -0.1032867431640625, -0.09095001220703125, -0.07861328125, -0.06627655029296875, -0.0539398193359375, -0.04160308837890625, -0.029266357421875, -0.01692962646484375, -0.0045928955078125, 0.00774383544921875, 0.02008056640625, 0.03241729736328125, 0.0447540283203125, 0.05709075927734375, 0.069427490234375, 0.08176422119140625, 0.0941009521484375, 0.10643768310546875, 0.1187744140625, 0.13111114501953125, 0.1434478759765625, 0.15578460693359375, 0.168121337890625, 0.18045806884765625, 0.1927947998046875, 0.20513153076171875, 0.21746826171875, 0.22980499267578125, 0.2421417236328125, 0.25447845458984375, 0.266815185546875, 0.27915191650390625, 0.2914886474609375, 0.30382537841796875, 0.316162109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 24.0, 35.0, 40.0, 68.0, 144.0, 204.0, 298.0, 547.0, 957.0, 1722.0, 3493.0, 7797.0, 22851.0, 107109.0, 3618390.0, 363212.0, 44113.0, 12625.0, 5066.0, 2426.0, 1287.0, 700.0, 442.0, 282.0, 177.0, 88.0, 63.0, 42.0, 32.0, 20.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.30908203125, -2.2314453125, -2.15380859375, -2.076171875, -1.99853515625, -1.9208984375, -1.84326171875, -1.765625, -1.68798828125, -1.6103515625, -1.53271484375, -1.455078125, -1.37744140625, -1.2998046875, -1.22216796875, -1.14453125, -1.06689453125, -0.9892578125, -0.91162109375, -0.833984375, -0.75634765625, -0.6787109375, -0.60107421875, -0.5234375, -0.44580078125, -0.3681640625, -0.29052734375, -0.212890625, -0.13525390625, -0.0576171875, 0.02001953125, 0.09765625, 0.17529296875, 0.2529296875, 0.33056640625, 0.408203125, 0.48583984375, 0.5634765625, 0.64111328125, 0.71875, 0.79638671875, 0.8740234375, 0.95166015625, 1.029296875, 1.10693359375, 1.1845703125, 1.26220703125, 1.33984375, 1.41748046875, 1.4951171875, 1.57275390625, 1.650390625, 1.72802734375, 1.8056640625, 1.88330078125, 1.9609375, 2.03857421875, 2.1162109375, 2.19384765625, 2.271484375, 2.34912109375, 2.4267578125, 2.50439453125, 2.58203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 16.0, 15.0, 36.0, 45.0, 92.0, 193.0, 1185.0, 1987.0, 239.0, 98.0, 59.0, 36.0, 17.0, 12.0, 11.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4560546875, -1.4076080322265625, -1.359161376953125, -1.3107147216796875, -1.26226806640625, -1.2138214111328125, -1.165374755859375, -1.1169281005859375, -1.0684814453125, -1.0200347900390625, -0.971588134765625, -0.9231414794921875, -0.87469482421875, -0.8262481689453125, -0.777801513671875, -0.7293548583984375, -0.680908203125, -0.6324615478515625, -0.584014892578125, -0.5355682373046875, -0.48712158203125, -0.4386749267578125, -0.390228271484375, -0.3417816162109375, -0.2933349609375, -0.2448883056640625, -0.196441650390625, -0.1479949951171875, -0.09954833984375, -0.0511016845703125, -0.002655029296875, 0.0457916259765625, 0.09423828125, 0.1426849365234375, 0.191131591796875, 0.2395782470703125, 0.28802490234375, 0.3364715576171875, 0.384918212890625, 0.4333648681640625, 0.4818115234375, 0.5302581787109375, 0.578704833984375, 0.6271514892578125, 0.67559814453125, 0.7240447998046875, 0.772491455078125, 0.8209381103515625, 0.869384765625, 0.9178314208984375, 0.966278076171875, 1.0147247314453125, 1.06317138671875, 1.1116180419921875, 1.160064697265625, 1.2085113525390625, 1.2569580078125, 1.3054046630859375, 1.353851318359375, 1.4022979736328125, 1.45074462890625, 1.4991912841796875, 1.547637939453125, 1.5960845947265625, 1.64453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 7.0, 8.0, 15.0, 18.0, 33.0, 67.0, 96.0, 130.0, 157.0, 164.0, 126.0, 76.0, 40.0, 25.0, 13.0, 4.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.89401626586914, -11.650848388671875, -11.40768051147461, -11.164512634277344, -10.921344757080078, -10.678177833557129, -10.435009956359863, -10.191842079162598, -9.948674201965332, -9.705506324768066, -9.4623384475708, -9.219170570373535, -8.976003646850586, -8.73283576965332, -8.489667892456055, -8.246500015258789, -8.003332138061523, -7.760164260864258, -7.516996383666992, -7.273828983306885, -7.030661106109619, -6.7874932289123535, -6.544325828552246, -6.3011579513549805, -6.057990074157715, -5.814822196960449, -5.571654319763184, -5.328486919403076, -5.0853190422058105, -4.842151165008545, -4.5989837646484375, -4.355815887451172, -4.112648010253906, -3.8694801330566406, -3.626312494277954, -3.3831448554992676, -3.139976978302002, -2.8968091011047363, -2.65364146232605, -2.4104738235473633, -2.1673057079315186, -1.9241379499435425, -1.6809701919555664, -1.4378024339675903, -1.1946346759796143, -0.9514669179916382, -0.7082991600036621, -0.46513140201568604, -0.22196364402770996, 0.021204113960266113, 0.2643718719482422, 0.5075396299362183, 0.7507073879241943, 0.9938751459121704, 1.2370429039001465, 1.4802106618881226, 1.7233784198760986, 1.9665461778640747, 2.209713935852051, 2.4528818130493164, 2.696049451828003, 2.9392170906066895, 3.182384967803955, 3.4255528450012207, 3.6687204837799072]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 6.0, 4.0, 12.0, 3.0, 11.0, 7.0, 13.0, 6.0, 25.0, 20.0, 26.0, 33.0, 17.0, 35.0, 19.0, 28.0, 33.0, 41.0, 37.0, 29.0, 40.0, 40.0, 36.0, 39.0, 36.0, 39.0, 29.0, 33.0, 36.0, 24.0, 31.0, 20.0, 19.0, 21.0, 15.0, 18.0, 25.0, 17.0, 15.0, 6.0, 6.0, 7.0, 3.0, 6.0, 9.0, 3.0, 4.0, 5.0, 5.0], "bins": [-3.4690258502960205, -3.374457836151123, -3.2798898220062256, -3.185321807861328, -3.0907537937164307, -2.996185779571533, -2.9016177654266357, -2.8070497512817383, -2.712481737136841, -2.6179137229919434, -2.523345708847046, -2.4287776947021484, -2.334209680557251, -2.2396416664123535, -2.145073652267456, -2.0505056381225586, -1.9559376239776611, -1.8613696098327637, -1.7668015956878662, -1.6722335815429688, -1.5776655673980713, -1.4830975532531738, -1.3885295391082764, -1.293961524963379, -1.1993935108184814, -1.104825496673584, -1.0102574825286865, -0.9156894683837891, -0.8211214542388916, -0.7265534400939941, -0.6319854259490967, -0.5374174118041992, -0.44284939765930176, -0.3482813835144043, -0.25371336936950684, -0.15914535522460938, -0.06457734107971191, 0.029990673065185547, 0.12455868721008301, 0.21912670135498047, 0.31369471549987793, 0.4082627296447754, 0.5028307437896729, 0.5973987579345703, 0.6919667720794678, 0.7865347862243652, 0.8811028003692627, 0.9756708145141602, 1.0702388286590576, 1.164806842803955, 1.2593748569488525, 1.35394287109375, 1.4485108852386475, 1.543078899383545, 1.6376469135284424, 1.7322149276733398, 1.8267829418182373, 1.9213509559631348, 2.0159189701080322, 2.1104869842529297, 2.205054998397827, 2.2996230125427246, 2.394191026687622, 2.4887590408325195, 2.583327054977417]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 8.0, 10.0, 22.0, 20.0, 31.0, 81.0, 120.0, 191.0, 345.0, 653.0, 1430.0, 3375.0, 8606.0, 25118.0, 81781.0, 292408.0, 427797.0, 142939.0, 41009.0, 13507.0, 5009.0, 2058.0, 985.0, 427.0, 222.0, 148.0, 97.0, 47.0, 33.0, 26.0, 12.0, 7.0, 2.0, 8.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.48828125, -2.4231719970703125, -2.358062744140625, -2.2929534912109375, -2.22784423828125, -2.1627349853515625, -2.097625732421875, -2.0325164794921875, -1.9674072265625, -1.9022979736328125, -1.837188720703125, -1.7720794677734375, -1.70697021484375, -1.6418609619140625, -1.576751708984375, -1.5116424560546875, -1.446533203125, -1.3814239501953125, -1.316314697265625, -1.2512054443359375, -1.18609619140625, -1.1209869384765625, -1.055877685546875, -0.9907684326171875, -0.9256591796875, -0.8605499267578125, -0.795440673828125, -0.7303314208984375, -0.66522216796875, -0.6001129150390625, -0.535003662109375, -0.4698944091796875, -0.40478515625, -0.3396759033203125, -0.274566650390625, -0.2094573974609375, -0.14434814453125, -0.0792388916015625, -0.014129638671875, 0.0509796142578125, 0.1160888671875, 0.1811981201171875, 0.246307373046875, 0.3114166259765625, 0.37652587890625, 0.4416351318359375, 0.506744384765625, 0.5718536376953125, 0.636962890625, 0.7020721435546875, 0.767181396484375, 0.8322906494140625, 0.89739990234375, 0.9625091552734375, 1.027618408203125, 1.0927276611328125, 1.1578369140625, 1.2229461669921875, 1.288055419921875, 1.3531646728515625, 1.41827392578125, 1.4833831787109375, 1.548492431640625, 1.6136016845703125, 1.6787109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 15.0, 9.0, 22.0, 25.0, 25.0, 37.0, 38.0, 33.0, 39.0, 53.0, 54.0, 61.0, 54.0, 52.0, 53.0, 57.0, 51.0, 52.0, 27.0, 55.0, 28.0, 31.0, 27.0, 23.0, 14.0, 6.0, 11.0, 4.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5048828125, -0.4917030334472656, -0.47852325439453125, -0.4653434753417969, -0.4521636962890625, -0.4389839172363281, -0.42580413818359375, -0.4126243591308594, -0.399444580078125, -0.3862648010253906, -0.37308502197265625, -0.3599052429199219, -0.3467254638671875, -0.3335456848144531, -0.32036590576171875, -0.3071861267089844, -0.29400634765625, -0.2808265686035156, -0.26764678955078125, -0.2544670104980469, -0.2412872314453125, -0.22810745239257812, -0.21492767333984375, -0.20174789428710938, -0.188568115234375, -0.17538833618164062, -0.16220855712890625, -0.14902877807617188, -0.1358489990234375, -0.12266921997070312, -0.10948944091796875, -0.09630966186523438, -0.0831298828125, -0.06995010375976562, -0.05677032470703125, -0.043590545654296875, -0.0304107666015625, -0.017230987548828125, -0.00405120849609375, 0.009128570556640625, 0.022308349609375, 0.035488128662109375, 0.04866790771484375, 0.061847686767578125, 0.0750274658203125, 0.08820724487304688, 0.10138702392578125, 0.11456680297851562, 0.12774658203125, 0.14092636108398438, 0.15410614013671875, 0.16728591918945312, 0.1804656982421875, 0.19364547729492188, 0.20682525634765625, 0.22000503540039062, 0.233184814453125, 0.24636459350585938, 0.25954437255859375, 0.2727241516113281, 0.2859039306640625, 0.2990837097167969, 0.31226348876953125, 0.3254432678222656, 0.338623046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 15.0, 21.0, 43.0, 60.0, 65.0, 91.0, 149.0, 230.0, 394.0, 598.0, 942.0, 1640.0, 2760.0, 5438.0, 11095.0, 24942.0, 63037.0, 186896.0, 410550.0, 215347.0, 71212.0, 27619.0, 11920.0, 5917.0, 3012.0, 1721.0, 1047.0, 580.0, 387.0, 268.0, 181.0, 121.0, 65.0, 41.0, 34.0, 29.0, 15.0, 8.0, 16.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6233673095703125, -1.571929931640625, -1.5204925537109375, -1.46905517578125, -1.4176177978515625, -1.366180419921875, -1.3147430419921875, -1.2633056640625, -1.2118682861328125, -1.160430908203125, -1.1089935302734375, -1.05755615234375, -1.0061187744140625, -0.954681396484375, -0.9032440185546875, -0.851806640625, -0.8003692626953125, -0.748931884765625, -0.6974945068359375, -0.64605712890625, -0.5946197509765625, -0.543182373046875, -0.4917449951171875, -0.4403076171875, -0.3888702392578125, -0.337432861328125, -0.2859954833984375, -0.23455810546875, -0.1831207275390625, -0.131683349609375, -0.0802459716796875, -0.02880859375, 0.0226287841796875, 0.074066162109375, 0.1255035400390625, 0.17694091796875, 0.2283782958984375, 0.279815673828125, 0.3312530517578125, 0.3826904296875, 0.4341278076171875, 0.485565185546875, 0.5370025634765625, 0.58843994140625, 0.6398773193359375, 0.691314697265625, 0.7427520751953125, 0.794189453125, 0.8456268310546875, 0.897064208984375, 0.9485015869140625, 0.99993896484375, 1.0513763427734375, 1.102813720703125, 1.1542510986328125, 1.2056884765625, 1.2571258544921875, 1.308563232421875, 1.3600006103515625, 1.41143798828125, 1.4628753662109375, 1.514312744140625, 1.5657501220703125, 1.6171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 11.0, 7.0, 13.0, 8.0, 24.0, 17.0, 22.0, 26.0, 46.0, 33.0, 38.0, 37.0, 46.0, 34.0, 42.0, 41.0, 39.0, 27.0, 43.0, 28.0, 40.0, 29.0, 43.0, 41.0, 35.0, 30.0, 24.0, 19.0, 24.0, 16.0, 11.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.904296875, -1.84930419921875, -1.7943115234375, -1.73931884765625, -1.684326171875, -1.62933349609375, -1.5743408203125, -1.51934814453125, -1.46435546875, -1.40936279296875, -1.3543701171875, -1.29937744140625, -1.244384765625, -1.18939208984375, -1.1343994140625, -1.07940673828125, -1.0244140625, -0.96942138671875, -0.9144287109375, -0.85943603515625, -0.804443359375, -0.74945068359375, -0.6944580078125, -0.63946533203125, -0.58447265625, -0.52947998046875, -0.4744873046875, -0.41949462890625, -0.364501953125, -0.30950927734375, -0.2545166015625, -0.19952392578125, -0.14453125, -0.08953857421875, -0.0345458984375, 0.02044677734375, 0.075439453125, 0.13043212890625, 0.1854248046875, 0.24041748046875, 0.29541015625, 0.35040283203125, 0.4053955078125, 0.46038818359375, 0.515380859375, 0.57037353515625, 0.6253662109375, 0.68035888671875, 0.7353515625, 0.79034423828125, 0.8453369140625, 0.90032958984375, 0.955322265625, 1.01031494140625, 1.0653076171875, 1.12030029296875, 1.17529296875, 1.23028564453125, 1.2852783203125, 1.34027099609375, 1.395263671875, 1.45025634765625, 1.5052490234375, 1.56024169921875, 1.615234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 14.0, 19.0, 28.0, 39.0, 53.0, 90.0, 168.0, 314.0, 658.0, 1375.0, 3725.0, 12960.0, 82493.0, 735658.0, 181335.0, 20690.0, 5307.0, 1926.0, 785.0, 380.0, 200.0, 109.0, 56.0, 35.0, 36.0, 24.0, 12.0, 12.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83984375, -1.7817230224609375, -1.723602294921875, -1.6654815673828125, -1.60736083984375, -1.5492401123046875, -1.491119384765625, -1.4329986572265625, -1.3748779296875, -1.3167572021484375, -1.258636474609375, -1.2005157470703125, -1.14239501953125, -1.0842742919921875, -1.026153564453125, -0.9680328369140625, -0.909912109375, -0.8517913818359375, -0.793670654296875, -0.7355499267578125, -0.67742919921875, -0.6193084716796875, -0.561187744140625, -0.5030670166015625, -0.4449462890625, -0.3868255615234375, -0.328704833984375, -0.2705841064453125, -0.21246337890625, -0.1543426513671875, -0.096221923828125, -0.0381011962890625, 0.02001953125, 0.0781402587890625, 0.136260986328125, 0.1943817138671875, 0.25250244140625, 0.3106231689453125, 0.368743896484375, 0.4268646240234375, 0.4849853515625, 0.5431060791015625, 0.601226806640625, 0.6593475341796875, 0.71746826171875, 0.7755889892578125, 0.833709716796875, 0.8918304443359375, 0.949951171875, 1.0080718994140625, 1.066192626953125, 1.1243133544921875, 1.18243408203125, 1.2405548095703125, 1.298675537109375, 1.3567962646484375, 1.4149169921875, 1.4730377197265625, 1.531158447265625, 1.5892791748046875, 1.64739990234375, 1.7055206298828125, 1.763641357421875, 1.8217620849609375, 1.8798828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 17.0, 17.0, 28.0, 24.0, 44.0, 68.0, 82.0, 106.0, 111.0, 119.0, 87.0, 65.0, 49.0, 32.0, 32.0, 27.0, 11.0, 10.0, 12.0, 7.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00015747547149658203, -0.00015026144683361053, -0.00014304742217063904, -0.00013583339750766754, -0.00012861937284469604, -0.00012140534818172455, -0.00011419132351875305, -0.00010697729885578156, -9.976327419281006e-05, -9.254924952983856e-05, -8.533522486686707e-05, -7.812120020389557e-05, -7.090717554092407e-05, -6.369315087795258e-05, -5.647912621498108e-05, -4.926510155200958e-05, -4.2051076889038086e-05, -3.483705222606659e-05, -2.7623027563095093e-05, -2.0409002900123596e-05, -1.31949782371521e-05, -5.980953574180603e-06, 1.2330710887908936e-06, 8.44709575176239e-06, 1.5661120414733887e-05, 2.2875145077705383e-05, 3.008916974067688e-05, 3.7303194403648376e-05, 4.451721906661987e-05, 5.173124372959137e-05, 5.8945268392562866e-05, 6.615929305553436e-05, 7.337331771850586e-05, 8.058734238147736e-05, 8.780136704444885e-05, 9.501539170742035e-05, 0.00010222941637039185, 0.00010944344103336334, 0.00011665746569633484, 0.00012387149035930634, 0.00013108551502227783, 0.00013829953968524933, 0.00014551356434822083, 0.00015272758901119232, 0.00015994161367416382, 0.00016715563833713531, 0.0001743696630001068, 0.0001815836876630783, 0.0001887977123260498, 0.0001960117369890213, 0.0002032257616519928, 0.0002104397863149643, 0.0002176538109779358, 0.0002248678356409073, 0.00023208186030387878, 0.00023929588496685028, 0.0002465099096298218, 0.0002537239342927933, 0.00026093795895576477, 0.00026815198361873627, 0.00027536600828170776, 0.00028258003294467926, 0.00028979405760765076, 0.00029700808227062225, 0.00030422210693359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 7.0, 15.0, 18.0, 22.0, 35.0, 63.0, 80.0, 92.0, 211.0, 288.0, 517.0, 1040.0, 2297.0, 5996.0, 22471.0, 131826.0, 653678.0, 187760.0, 29424.0, 7361.0, 2637.0, 1159.0, 609.0, 333.0, 195.0, 136.0, 73.0, 58.0, 36.0, 33.0, 25.0, 11.0, 8.0, 11.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4150390625, -1.371612548828125, -1.32818603515625, -1.284759521484375, -1.2413330078125, -1.197906494140625, -1.15447998046875, -1.111053466796875, -1.067626953125, -1.024200439453125, -0.98077392578125, -0.937347412109375, -0.8939208984375, -0.850494384765625, -0.80706787109375, -0.763641357421875, -0.72021484375, -0.676788330078125, -0.63336181640625, -0.589935302734375, -0.5465087890625, -0.503082275390625, -0.45965576171875, -0.416229248046875, -0.372802734375, -0.329376220703125, -0.28594970703125, -0.242523193359375, -0.1990966796875, -0.155670166015625, -0.11224365234375, -0.068817138671875, -0.025390625, 0.018035888671875, 0.06146240234375, 0.104888916015625, 0.1483154296875, 0.191741943359375, 0.23516845703125, 0.278594970703125, 0.322021484375, 0.365447998046875, 0.40887451171875, 0.452301025390625, 0.4957275390625, 0.539154052734375, 0.58258056640625, 0.626007080078125, 0.66943359375, 0.712860107421875, 0.75628662109375, 0.799713134765625, 0.8431396484375, 0.886566162109375, 0.92999267578125, 0.973419189453125, 1.016845703125, 1.060272216796875, 1.10369873046875, 1.147125244140625, 1.1905517578125, 1.233978271484375, 1.27740478515625, 1.320831298828125, 1.3642578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 10.0, 10.0, 17.0, 19.0, 36.0, 42.0, 43.0, 70.0, 90.0, 124.0, 124.0, 112.0, 72.0, 51.0, 37.0, 40.0, 23.0, 18.0, 18.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6697998046875, -1.620849609375, -1.5718994140625, -1.52294921875, -1.4739990234375, -1.425048828125, -1.3760986328125, -1.3271484375, -1.2781982421875, -1.229248046875, -1.1802978515625, -1.13134765625, -1.0823974609375, -1.033447265625, -0.9844970703125, -0.935546875, -0.8865966796875, -0.837646484375, -0.7886962890625, -0.73974609375, -0.6907958984375, -0.641845703125, -0.5928955078125, -0.5439453125, -0.4949951171875, -0.446044921875, -0.3970947265625, -0.34814453125, -0.2991943359375, -0.250244140625, -0.2012939453125, -0.15234375, -0.1033935546875, -0.054443359375, -0.0054931640625, 0.04345703125, 0.0924072265625, 0.141357421875, 0.1903076171875, 0.2392578125, 0.2882080078125, 0.337158203125, 0.3861083984375, 0.43505859375, 0.4840087890625, 0.532958984375, 0.5819091796875, 0.630859375, 0.6798095703125, 0.728759765625, 0.7777099609375, 0.82666015625, 0.8756103515625, 0.924560546875, 0.9735107421875, 1.0224609375, 1.0714111328125, 1.120361328125, 1.1693115234375, 1.21826171875, 1.2672119140625, 1.316162109375, 1.3651123046875, 1.4140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 28.0, 112.0, 291.0, 367.0, 159.0, 30.0, 18.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-107.14361572265625, -105.20366668701172, -103.26371002197266, -101.32376098632812, -99.3838119506836, -97.44386291503906, -95.50390625, -93.56395721435547, -91.62400817871094, -89.6840591430664, -87.74410247802734, -85.80415344238281, -83.86420440673828, -81.92425537109375, -79.98429870605469, -78.04434967041016, -76.10440063476562, -74.1644515991211, -72.22449493408203, -70.2845458984375, -68.34459686279297, -66.40464782714844, -64.46469116210938, -62.524742126464844, -60.58478546142578, -58.644832611083984, -56.70488357543945, -54.764930725097656, -52.824981689453125, -50.88502883911133, -48.94507598876953, -47.005126953125, -45.06517791748047, -43.12522506713867, -41.18527603149414, -39.245323181152344, -37.30537414550781, -35.365421295166016, -33.42546844482422, -31.485519409179688, -29.545570373535156, -27.605619430541992, -25.665668487548828, -23.72571563720703, -21.7857666015625, -19.845813751220703, -17.90586280822754, -15.965911865234375, -14.025960922241211, -12.086009979248047, -10.146059036254883, -8.206107139587402, -6.266156196594238, -4.326205253601074, -2.3862533569335938, -0.4463024139404297, 1.4936485290527344, 3.4335997104644775, 5.373550891876221, 7.313502311706543, 9.253453254699707, 11.193404197692871, 13.133356094360352, 15.073307037353516, 17.01325798034668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 12.0, 5.0, 5.0, 15.0, 11.0, 12.0, 17.0, 15.0, 23.0, 25.0, 30.0, 28.0, 36.0, 39.0, 46.0, 48.0, 47.0, 40.0, 45.0, 43.0, 47.0, 61.0, 35.0, 49.0, 40.0, 26.0, 31.0, 18.0, 21.0, 12.0, 17.0, 16.0, 14.0, 12.0, 8.0, 7.0, 6.0, 10.0, 9.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.62202262878418, -10.280797004699707, -9.939571380615234, -9.598345756530762, -9.257120132446289, -8.915895462036133, -8.57466983795166, -8.233444213867188, -7.892218589782715, -7.550992965698242, -7.2097673416137695, -6.868542194366455, -6.527316570281982, -6.18609094619751, -5.844865798950195, -5.503640174865723, -5.16241455078125, -4.821188926696777, -4.479963302612305, -4.13873815536499, -3.7975125312805176, -3.456286907196045, -3.1150615215301514, -2.773836135864258, -2.432610511779785, -2.0913848876953125, -1.750159502029419, -1.4089339971542358, -1.0677084922790527, -0.7264829874038696, -0.3852574825286865, -0.04403209686279297, 0.2971944808959961, 0.6384199857711792, 0.9796454906463623, 1.3208709955215454, 1.6620965003967285, 2.003322124481201, 2.3445475101470947, 2.6857728958129883, 3.026998519897461, 3.3682241439819336, 3.709449529647827, 4.050674915313721, 4.391900539398193, 4.733126163482666, 5.0743513107299805, 5.415576934814453, 5.756802558898926, 6.098028182983398, 6.439253807067871, 6.7804789543151855, 7.121704578399658, 7.462930202484131, 7.804155349731445, 8.145380973815918, 8.48660659790039, 8.827832221984863, 9.169057846069336, 9.510283470153809, 9.851509094238281, 10.192733764648438, 10.53395938873291, 10.875185012817383, 11.216410636901855]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 13.0, 11.0, 11.0, 27.0, 32.0, 57.0, 81.0, 181.0, 359.0, 938.0, 2895.0, 13084.0, 4040402.0, 123701.0, 8869.0, 2168.0, 721.0, 331.0, 126.0, 87.0, 43.0, 48.0, 24.0, 14.0, 12.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.81903076171875, -6.6341552734375, -6.44927978515625, -6.264404296875, -6.07952880859375, -5.8946533203125, -5.70977783203125, -5.52490234375, -5.34002685546875, -5.1551513671875, -4.97027587890625, -4.785400390625, -4.60052490234375, -4.4156494140625, -4.23077392578125, -4.0458984375, -3.86102294921875, -3.6761474609375, -3.49127197265625, -3.306396484375, -3.12152099609375, -2.9366455078125, -2.75177001953125, -2.56689453125, -2.38201904296875, -2.1971435546875, -2.01226806640625, -1.827392578125, -1.64251708984375, -1.4576416015625, -1.27276611328125, -1.087890625, -0.90301513671875, -0.7181396484375, -0.53326416015625, -0.348388671875, -0.16351318359375, 0.0213623046875, 0.20623779296875, 0.39111328125, 0.57598876953125, 0.7608642578125, 0.94573974609375, 1.130615234375, 1.31549072265625, 1.5003662109375, 1.68524169921875, 1.8701171875, 2.05499267578125, 2.2398681640625, 2.42474365234375, 2.609619140625, 2.79449462890625, 2.9793701171875, 3.16424560546875, 3.34912109375, 3.53399658203125, 3.7188720703125, 3.90374755859375, 4.088623046875, 4.27349853515625, 4.4583740234375, 4.64324951171875, 4.828125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 17.0, 17.0, 29.0, 36.0, 42.0, 46.0, 48.0, 53.0, 65.0, 72.0, 66.0, 62.0, 61.0, 57.0, 52.0, 43.0, 42.0, 26.0, 29.0, 27.0, 14.0, 18.0, 13.0, 4.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6806640625, -0.66046142578125, -0.6402587890625, -0.62005615234375, -0.599853515625, -0.57965087890625, -0.5594482421875, -0.53924560546875, -0.51904296875, -0.49884033203125, -0.4786376953125, -0.45843505859375, -0.438232421875, -0.41802978515625, -0.3978271484375, -0.37762451171875, -0.357421875, -0.33721923828125, -0.3170166015625, -0.29681396484375, -0.276611328125, -0.25640869140625, -0.2362060546875, -0.21600341796875, -0.19580078125, -0.17559814453125, -0.1553955078125, -0.13519287109375, -0.114990234375, -0.09478759765625, -0.0745849609375, -0.05438232421875, -0.0341796875, -0.01397705078125, 0.0062255859375, 0.02642822265625, 0.046630859375, 0.06683349609375, 0.0870361328125, 0.10723876953125, 0.12744140625, 0.14764404296875, 0.1678466796875, 0.18804931640625, 0.208251953125, 0.22845458984375, 0.2486572265625, 0.26885986328125, 0.2890625, 0.30926513671875, 0.3294677734375, 0.34967041015625, 0.369873046875, 0.39007568359375, 0.4102783203125, 0.43048095703125, 0.45068359375, 0.47088623046875, 0.4910888671875, 0.51129150390625, 0.531494140625, 0.55169677734375, 0.5718994140625, 0.59210205078125, 0.6123046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 11.0, 28.0, 27.0, 33.0, 37.0, 50.0, 62.0, 114.0, 103.0, 146.0, 239.0, 282.0, 447.0, 654.0, 964.0, 1563.0, 2750.0, 5309.0, 12146.0, 38124.0, 3930307.0, 157470.0, 23990.0, 8896.0, 4085.0, 2203.0, 1297.0, 847.0, 585.0, 379.0, 287.0, 200.0, 151.0, 109.0, 104.0, 53.0, 43.0, 37.0, 39.0, 23.0, 16.0, 14.0, 12.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.865234375, -3.739837646484375, -3.61444091796875, -3.489044189453125, -3.3636474609375, -3.238250732421875, -3.11285400390625, -2.987457275390625, -2.862060546875, -2.736663818359375, -2.61126708984375, -2.485870361328125, -2.3604736328125, -2.235076904296875, -2.10968017578125, -1.984283447265625, -1.85888671875, -1.733489990234375, -1.60809326171875, -1.482696533203125, -1.3572998046875, -1.231903076171875, -1.10650634765625, -0.981109619140625, -0.855712890625, -0.730316162109375, -0.60491943359375, -0.479522705078125, -0.3541259765625, -0.228729248046875, -0.10333251953125, 0.022064208984375, 0.1474609375, 0.272857666015625, 0.39825439453125, 0.523651123046875, 0.6490478515625, 0.774444580078125, 0.89984130859375, 1.025238037109375, 1.150634765625, 1.276031494140625, 1.40142822265625, 1.526824951171875, 1.6522216796875, 1.777618408203125, 1.90301513671875, 2.028411865234375, 2.15380859375, 2.279205322265625, 2.40460205078125, 2.529998779296875, 2.6553955078125, 2.780792236328125, 2.90618896484375, 3.031585693359375, 3.156982421875, 3.282379150390625, 3.40777587890625, 3.533172607421875, 3.6585693359375, 3.783966064453125, 3.90936279296875, 4.034759521484375, 4.16015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 19.0, 12.0, 21.0, 56.0, 261.0, 3519.0, 72.0, 39.0, 19.0, 5.0, 7.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.142059326171875, -1.10150146484375, -1.060943603515625, -1.0203857421875, -0.979827880859375, -0.93927001953125, -0.898712158203125, -0.858154296875, -0.817596435546875, -0.77703857421875, -0.736480712890625, -0.6959228515625, -0.655364990234375, -0.61480712890625, -0.574249267578125, -0.53369140625, -0.493133544921875, -0.45257568359375, -0.412017822265625, -0.3714599609375, -0.330902099609375, -0.29034423828125, -0.249786376953125, -0.209228515625, -0.168670654296875, -0.12811279296875, -0.087554931640625, -0.0469970703125, -0.006439208984375, 0.03411865234375, 0.074676513671875, 0.115234375, 0.155792236328125, 0.19635009765625, 0.236907958984375, 0.2774658203125, 0.318023681640625, 0.35858154296875, 0.399139404296875, 0.439697265625, 0.480255126953125, 0.52081298828125, 0.561370849609375, 0.6019287109375, 0.642486572265625, 0.68304443359375, 0.723602294921875, 0.76416015625, 0.804718017578125, 0.84527587890625, 0.885833740234375, 0.9263916015625, 0.966949462890625, 1.00750732421875, 1.048065185546875, 1.088623046875, 1.129180908203125, 1.16973876953125, 1.210296630859375, 1.2508544921875, 1.291412353515625, 1.33197021484375, 1.372528076171875, 1.4130859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 11.0, 7.0, 16.0, 27.0, 51.0, 87.0, 114.0, 125.0, 139.0, 106.0, 101.0, 73.0, 47.0, 28.0, 25.0, 16.0, 5.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7021236419677734, -2.581059217453003, -2.4599947929382324, -2.338930606842041, -2.2178661823272705, -2.0968017578125, -1.9757373332977295, -1.854672908782959, -1.733608603477478, -1.6125441789627075, -1.4914798736572266, -1.370415449142456, -1.2493510246276855, -1.1282867193222046, -1.007222294807434, -0.8861579298973083, -0.7650935649871826, -0.6440292000770569, -0.5229648351669312, -0.40190041065216064, -0.2808360457420349, -0.15977168083190918, -0.03870725631713867, 0.08235710859298706, 0.2034214735031128, 0.3244858384132385, 0.44555023312568665, 0.5666146278381348, 0.6876789927482605, 0.8087433576583862, 0.9298077821731567, 1.0508720874786377, 1.1719365119934082, 1.2930009365081787, 1.4140652418136597, 1.5351296663284302, 1.6561939716339111, 1.7772583961486816, 1.8983228206634521, 2.0193872451782227, 2.140451431274414, 2.2615158557891846, 2.382580280303955, 2.5036444664001465, 2.624708890914917, 2.7457733154296875, 2.866837739944458, 2.9879021644592285, 3.108966588973999, 3.2300310134887695, 3.35109543800354, 3.4721598625183105, 3.593224048614502, 3.7142884731292725, 3.835352897644043, 3.9564173221588135, 4.077481746673584, 4.198545932769775, 4.319610595703125, 4.440674781799316, 4.561739444732666, 4.682803630828857, 4.803868293762207, 4.924932479858398, 5.04599666595459]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 4.0, 7.0, 8.0, 10.0, 11.0, 16.0, 8.0, 16.0, 13.0, 20.0, 29.0, 34.0, 27.0, 29.0, 42.0, 50.0, 40.0, 44.0, 44.0, 55.0, 41.0, 58.0, 48.0, 42.0, 34.0, 32.0, 27.0, 22.0, 23.0, 19.0, 19.0, 12.0, 23.0, 17.0, 15.0, 14.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7838761806488037, -1.725106120109558, -1.6663360595703125, -1.607565999031067, -1.5487959384918213, -1.4900259971618652, -1.4312559366226196, -1.372485876083374, -1.3137158155441284, -1.2549457550048828, -1.1961756944656372, -1.1374056339263916, -1.0786356925964355, -1.0198655128479004, -0.9610955715179443, -0.9023255109786987, -0.8435554504394531, -0.7847853899002075, -0.7260153293609619, -0.6672453284263611, -0.6084752678871155, -0.5497052073478699, -0.49093517661094666, -0.43216514587402344, -0.37339508533477783, -0.3146250247955322, -0.255854994058609, -0.1970849484205246, -0.13831490278244019, -0.07954484224319458, -0.020774811506271362, 0.037995219230651855, 0.09676527976989746, 0.15553532540798187, 0.21430537104606628, 0.2730754017829895, 0.3318454623222351, 0.3906155228614807, 0.44938555359840393, 0.5081555843353271, 0.5669256448745728, 0.6256957054138184, 0.684465765953064, 0.7432357668876648, 0.8020058274269104, 0.860775887966156, 0.9195458889007568, 0.9783159494400024, 1.037086009979248, 1.0958560705184937, 1.1546261310577393, 1.2133961915969849, 1.2721662521362305, 1.3309361934661865, 1.3897062540054321, 1.4484763145446777, 1.5072463750839233, 1.566016435623169, 1.6247864961624146, 1.6835565567016602, 1.7423264980316162, 1.8010966777801514, 1.8598666191101074, 1.918636679649353, 1.9774067401885986]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 14.0, 22.0, 26.0, 38.0, 59.0, 61.0, 109.0, 170.0, 253.0, 382.0, 538.0, 920.0, 1470.0, 2398.0, 4103.0, 7171.0, 13239.0, 24883.0, 47818.0, 92906.0, 168912.0, 236647.0, 199047.0, 117233.0, 60481.0, 31414.0, 16407.0, 9076.0, 4981.0, 2900.0, 1737.0, 1133.0, 674.0, 462.0, 291.0, 165.0, 119.0, 92.0, 53.0, 41.0, 27.0, 30.0, 14.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4526519775390625, -1.405303955078125, -1.3579559326171875, -1.31060791015625, -1.2632598876953125, -1.215911865234375, -1.1685638427734375, -1.1212158203125, -1.0738677978515625, -1.026519775390625, -0.9791717529296875, -0.93182373046875, -0.8844757080078125, -0.837127685546875, -0.7897796630859375, -0.742431640625, -0.6950836181640625, -0.647735595703125, -0.6003875732421875, -0.55303955078125, -0.5056915283203125, -0.458343505859375, -0.4109954833984375, -0.3636474609375, -0.3162994384765625, -0.268951416015625, -0.2216033935546875, -0.17425537109375, -0.1269073486328125, -0.079559326171875, -0.0322113037109375, 0.01513671875, 0.0624847412109375, 0.109832763671875, 0.1571807861328125, 0.20452880859375, 0.2518768310546875, 0.299224853515625, 0.3465728759765625, 0.3939208984375, 0.4412689208984375, 0.488616943359375, 0.5359649658203125, 0.58331298828125, 0.6306610107421875, 0.678009033203125, 0.7253570556640625, 0.772705078125, 0.8200531005859375, 0.867401123046875, 0.9147491455078125, 0.96209716796875, 1.0094451904296875, 1.056793212890625, 1.1041412353515625, 1.1514892578125, 1.1988372802734375, 1.246185302734375, 1.2935333251953125, 1.34088134765625, 1.3882293701171875, 1.435577392578125, 1.4829254150390625, 1.5302734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 16.0, 18.0, 17.0, 25.0, 25.0, 23.0, 41.0, 43.0, 44.0, 58.0, 56.0, 58.0, 68.0, 56.0, 57.0, 52.0, 38.0, 41.0, 44.0, 34.0, 33.0, 19.0, 19.0, 25.0, 14.0, 13.0, 10.0, 8.0, 7.0, 9.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8125, -0.7878799438476562, -0.7632598876953125, -0.7386398315429688, -0.714019775390625, -0.6893997192382812, -0.6647796630859375, -0.6401596069335938, -0.61553955078125, -0.5909194946289062, -0.5662994384765625, -0.5416793823242188, -0.517059326171875, -0.49243927001953125, -0.4678192138671875, -0.44319915771484375, -0.4185791015625, -0.39395904541015625, -0.3693389892578125, -0.34471893310546875, -0.320098876953125, -0.29547882080078125, -0.2708587646484375, -0.24623870849609375, -0.22161865234375, -0.19699859619140625, -0.1723785400390625, -0.14775848388671875, -0.123138427734375, -0.09851837158203125, -0.0738983154296875, -0.04927825927734375, -0.024658203125, -3.814697265625e-05, 0.0245819091796875, 0.04920196533203125, 0.073822021484375, 0.09844207763671875, 0.1230621337890625, 0.14768218994140625, 0.17230224609375, 0.19692230224609375, 0.2215423583984375, 0.24616241455078125, 0.270782470703125, 0.29540252685546875, 0.3200225830078125, 0.34464263916015625, 0.3692626953125, 0.39388275146484375, 0.4185028076171875, 0.44312286376953125, 0.467742919921875, 0.49236297607421875, 0.5169830322265625, 0.5416030883789062, 0.56622314453125, 0.5908432006835938, 0.6154632568359375, 0.6400833129882812, 0.664703369140625, 0.6893234252929688, 0.7139434814453125, 0.7385635375976562, 0.76318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 17.0, 41.0, 62.0, 107.0, 186.0, 490.0, 967.0, 2560.0, 7888.0, 31926.0, 183849.0, 597598.0, 179305.0, 31508.0, 7645.0, 2523.0, 991.0, 395.0, 220.0, 104.0, 63.0, 34.0, 22.0, 11.0, 13.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.305206298828125, -3.15142822265625, -2.997650146484375, -2.8438720703125, -2.690093994140625, -2.53631591796875, -2.382537841796875, -2.228759765625, -2.074981689453125, -1.92120361328125, -1.767425537109375, -1.6136474609375, -1.459869384765625, -1.30609130859375, -1.152313232421875, -0.99853515625, -0.844757080078125, -0.69097900390625, -0.537200927734375, -0.3834228515625, -0.229644775390625, -0.07586669921875, 0.077911376953125, 0.231689453125, 0.385467529296875, 0.53924560546875, 0.693023681640625, 0.8468017578125, 1.000579833984375, 1.15435791015625, 1.308135986328125, 1.4619140625, 1.615692138671875, 1.76947021484375, 1.923248291015625, 2.0770263671875, 2.230804443359375, 2.38458251953125, 2.538360595703125, 2.692138671875, 2.845916748046875, 2.99969482421875, 3.153472900390625, 3.3072509765625, 3.461029052734375, 3.61480712890625, 3.768585205078125, 3.92236328125, 4.076141357421875, 4.22991943359375, 4.383697509765625, 4.5374755859375, 4.691253662109375, 4.84503173828125, 4.998809814453125, 5.152587890625, 5.306365966796875, 5.46014404296875, 5.613922119140625, 5.7677001953125, 5.921478271484375, 6.07525634765625, 6.229034423828125, 6.3828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 7.0, 11.0, 13.0, 17.0, 16.0, 14.0, 16.0, 19.0, 18.0, 20.0, 33.0, 30.0, 26.0, 41.0, 40.0, 52.0, 34.0, 33.0, 41.0, 44.0, 52.0, 31.0, 40.0, 34.0, 39.0, 36.0, 31.0, 30.0, 26.0, 24.0, 16.0, 23.0, 16.0, 9.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.470703125, -3.349639892578125, -3.22857666015625, -3.107513427734375, -2.9864501953125, -2.865386962890625, -2.74432373046875, -2.623260498046875, -2.502197265625, -2.381134033203125, -2.26007080078125, -2.139007568359375, -2.0179443359375, -1.896881103515625, -1.77581787109375, -1.654754638671875, -1.53369140625, -1.412628173828125, -1.29156494140625, -1.170501708984375, -1.0494384765625, -0.928375244140625, -0.80731201171875, -0.686248779296875, -0.565185546875, -0.444122314453125, -0.32305908203125, -0.201995849609375, -0.0809326171875, 0.040130615234375, 0.16119384765625, 0.282257080078125, 0.4033203125, 0.524383544921875, 0.64544677734375, 0.766510009765625, 0.8875732421875, 1.008636474609375, 1.12969970703125, 1.250762939453125, 1.371826171875, 1.492889404296875, 1.61395263671875, 1.735015869140625, 1.8560791015625, 1.977142333984375, 2.09820556640625, 2.219268798828125, 2.34033203125, 2.461395263671875, 2.58245849609375, 2.703521728515625, 2.8245849609375, 2.945648193359375, 3.06671142578125, 3.187774658203125, 3.308837890625, 3.429901123046875, 3.55096435546875, 3.672027587890625, 3.7930908203125, 3.914154052734375, 4.03521728515625, 4.156280517578125, 4.27734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 8.0, 26.0, 33.0, 53.0, 77.0, 126.0, 216.0, 352.0, 757.0, 2025.0, 7289.0, 73556.0, 892236.0, 61478.0, 6675.0, 1990.0, 719.0, 353.0, 206.0, 115.0, 74.0, 43.0, 37.0, 20.0, 14.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.27734375, -4.149566650390625, -4.02178955078125, -3.894012451171875, -3.7662353515625, -3.638458251953125, -3.51068115234375, -3.382904052734375, -3.255126953125, -3.127349853515625, -2.99957275390625, -2.871795654296875, -2.7440185546875, -2.616241455078125, -2.48846435546875, -2.360687255859375, -2.23291015625, -2.105133056640625, -1.97735595703125, -1.849578857421875, -1.7218017578125, -1.594024658203125, -1.46624755859375, -1.338470458984375, -1.210693359375, -1.082916259765625, -0.95513916015625, -0.827362060546875, -0.6995849609375, -0.571807861328125, -0.44403076171875, -0.316253662109375, -0.1884765625, -0.060699462890625, 0.06707763671875, 0.194854736328125, 0.3226318359375, 0.450408935546875, 0.57818603515625, 0.705963134765625, 0.833740234375, 0.961517333984375, 1.08929443359375, 1.217071533203125, 1.3448486328125, 1.472625732421875, 1.60040283203125, 1.728179931640625, 1.85595703125, 1.983734130859375, 2.11151123046875, 2.239288330078125, 2.3670654296875, 2.494842529296875, 2.62261962890625, 2.750396728515625, 2.878173828125, 3.005950927734375, 3.13372802734375, 3.261505126953125, 3.3892822265625, 3.517059326171875, 3.64483642578125, 3.772613525390625, 3.900390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 32.0, 59.0, 79.0, 158.0, 198.0, 174.0, 124.0, 68.0, 39.0, 18.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004527568817138672, -0.0004329271614551544, -0.00041309744119644165, -0.0003932677209377289, -0.0003734380006790161, -0.00035360828042030334, -0.0003337785601615906, -0.0003139488399028778, -0.00029411911964416504, -0.00027428939938545227, -0.0002544596791267395, -0.00023462995886802673, -0.00021480023860931396, -0.0001949705183506012, -0.00017514079809188843, -0.00015531107783317566, -0.0001354813575744629, -0.00011565163731575012, -9.582191705703735e-05, -7.599219679832458e-05, -5.6162476539611816e-05, -3.633275628089905e-05, -1.650303602218628e-05, 3.3266842365264893e-06, 2.3156404495239258e-05, 4.2986124753952026e-05, 6.28158450126648e-05, 8.264556527137756e-05, 0.00010247528553009033, 0.0001223050057888031, 0.00014213472604751587, 0.00016196444630622864, 0.0001817941665649414, 0.00020162388682365417, 0.00022145360708236694, 0.0002412833273410797, 0.0002611130475997925, 0.00028094276785850525, 0.000300772488117218, 0.0003206022083759308, 0.00034043192863464355, 0.0003602616488933563, 0.0003800913691520691, 0.00039992108941078186, 0.00041975080966949463, 0.0004395805299282074, 0.00045941025018692017, 0.00047923997044563293, 0.0004990696907043457, 0.0005188994109630585, 0.0005387291312217712, 0.000558558851480484, 0.0005783885717391968, 0.0005982182919979095, 0.0006180480122566223, 0.0006378777325153351, 0.0006577074527740479, 0.0006775371730327606, 0.0006973668932914734, 0.0007171966135501862, 0.0007370263338088989, 0.0007568560540676117, 0.0007766857743263245, 0.0007965154945850372, 0.00081634521484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 20.0, 26.0, 44.0, 66.0, 109.0, 218.0, 394.0, 781.0, 2173.0, 7758.0, 57445.0, 765624.0, 193054.0, 14919.0, 3613.0, 1188.0, 472.0, 251.0, 138.0, 87.0, 48.0, 24.0, 20.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.251953125, -3.15545654296875, -3.0589599609375, -2.96246337890625, -2.865966796875, -2.76947021484375, -2.6729736328125, -2.57647705078125, -2.47998046875, -2.38348388671875, -2.2869873046875, -2.19049072265625, -2.093994140625, -1.99749755859375, -1.9010009765625, -1.80450439453125, -1.7080078125, -1.61151123046875, -1.5150146484375, -1.41851806640625, -1.322021484375, -1.22552490234375, -1.1290283203125, -1.03253173828125, -0.93603515625, -0.83953857421875, -0.7430419921875, -0.64654541015625, -0.550048828125, -0.45355224609375, -0.3570556640625, -0.26055908203125, -0.1640625, -0.06756591796875, 0.0289306640625, 0.12542724609375, 0.221923828125, 0.31842041015625, 0.4149169921875, 0.51141357421875, 0.60791015625, 0.70440673828125, 0.8009033203125, 0.89739990234375, 0.993896484375, 1.09039306640625, 1.1868896484375, 1.28338623046875, 1.3798828125, 1.47637939453125, 1.5728759765625, 1.66937255859375, 1.765869140625, 1.86236572265625, 1.9588623046875, 2.05535888671875, 2.15185546875, 2.24835205078125, 2.3448486328125, 2.44134521484375, 2.537841796875, 2.63433837890625, 2.7308349609375, 2.82733154296875, 2.923828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 9.0, 5.0, 5.0, 13.0, 19.0, 34.0, 60.0, 126.0, 169.0, 201.0, 141.0, 106.0, 43.0, 31.0, 13.0, 9.0, 3.0, 6.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.97705078125, -4.8173828125, -4.65771484375, -4.498046875, -4.33837890625, -4.1787109375, -4.01904296875, -3.859375, -3.69970703125, -3.5400390625, -3.38037109375, -3.220703125, -3.06103515625, -2.9013671875, -2.74169921875, -2.58203125, -2.42236328125, -2.2626953125, -2.10302734375, -1.943359375, -1.78369140625, -1.6240234375, -1.46435546875, -1.3046875, -1.14501953125, -0.9853515625, -0.82568359375, -0.666015625, -0.50634765625, -0.3466796875, -0.18701171875, -0.02734375, 0.13232421875, 0.2919921875, 0.45166015625, 0.611328125, 0.77099609375, 0.9306640625, 1.09033203125, 1.25, 1.40966796875, 1.5693359375, 1.72900390625, 1.888671875, 2.04833984375, 2.2080078125, 2.36767578125, 2.52734375, 2.68701171875, 2.8466796875, 3.00634765625, 3.166015625, 3.32568359375, 3.4853515625, 3.64501953125, 3.8046875, 3.96435546875, 4.1240234375, 4.28369140625, 4.443359375, 4.60302734375, 4.7626953125, 4.92236328125, 5.08203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 9.0, 17.0, 34.0, 64.0, 113.0, 161.0, 206.0, 181.0, 102.0, 52.0, 29.0, 16.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.5879135131836, -72.87418365478516, -71.16046142578125, -69.44673156738281, -67.73300170898438, -66.01927947998047, -64.30554962158203, -62.591819763183594, -60.87809371948242, -59.16436767578125, -57.45063781738281, -55.73691177368164, -54.02318572998047, -52.30945587158203, -50.59572982788086, -48.88200378417969, -47.16827392578125, -45.45454788208008, -43.74081802368164, -42.02709197998047, -40.3133659362793, -38.59963607788086, -36.88591003417969, -35.17218017578125, -33.458457946777344, -31.74472999572754, -30.031003952026367, -28.317276000976562, -26.603548049926758, -24.889820098876953, -23.17609405517578, -21.462366104125977, -19.748638153076172, -18.034910202026367, -16.321184158325195, -14.60745620727539, -12.893728256225586, -11.180001258850098, -9.46627426147461, -7.752546310424805, -6.038819313049316, -4.32509183883667, -2.6113646030426025, -0.8976373672485352, 0.8160901069641113, 2.529817581176758, 4.243544578552246, 5.957272529602051, 7.670999526977539, 9.384726524353027, 11.098454475402832, 12.81218147277832, 14.525909423828125, 16.239635467529297, 17.9533634185791, 19.667091369628906, 21.380817413330078, 23.094545364379883, 24.808271408081055, 26.52199935913086, 28.235727310180664, 29.94945526123047, 31.66318130493164, 33.37690734863281, 35.09063720703125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 14.0, 16.0, 13.0, 13.0, 20.0, 30.0, 26.0, 20.0, 27.0, 36.0, 36.0, 26.0, 31.0, 27.0, 59.0, 47.0, 44.0, 49.0, 52.0, 32.0, 45.0, 27.0, 29.0, 29.0, 30.0, 28.0, 31.0, 22.0, 22.0, 20.0, 14.0, 7.0, 7.0, 13.0, 4.0, 9.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.776704788208008, -20.143341064453125, -19.50997543334961, -18.876611709594727, -18.243247985839844, -17.609882354736328, -16.976518630981445, -16.343154907226562, -15.709790229797363, -15.076425552368164, -14.443061828613281, -13.809697151184082, -13.176332473754883, -12.54296875, -11.9096040725708, -11.276239395141602, -10.642875671386719, -10.00951099395752, -9.376147270202637, -8.742782592773438, -8.109418869018555, -7.4760541915893555, -6.842689514160156, -6.209325313568115, -5.575961112976074, -4.942596912384033, -4.309232711791992, -3.675868034362793, -3.042503833770752, -2.409139633178711, -1.7757751941680908, -1.1424107551574707, -0.5090446472167969, 0.12431967258453369, 0.7576839923858643, 1.3910483121871948, 2.0244126319885254, 2.6577768325805664, 3.2911412715911865, 3.9245057106018066, 4.557869911193848, 5.191234111785889, 5.82459831237793, 6.457962989807129, 7.09132719039917, 7.724691390991211, 8.35805606842041, 8.99142074584961, 9.624784469604492, 10.258149147033691, 10.891512870788574, 11.524877548217773, 12.158241271972656, 12.791605949401855, 13.424970626831055, 14.058334350585938, 14.691699028015137, 15.325063705444336, 15.958427429199219, 16.5917911529541, 17.225156784057617, 17.8585205078125, 18.491884231567383, 19.1252498626709, 19.75861358642578]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 15.0, 8.0, 12.0, 19.0, 24.0, 39.0, 59.0, 98.0, 122.0, 229.0, 344.0, 544.0, 1039.0, 1991.0, 4528.0, 14418.0, 99154.0, 4028617.0, 29190.0, 7601.0, 2923.0, 1367.0, 734.0, 433.0, 258.0, 164.0, 110.0, 79.0, 51.0, 30.0, 23.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 7.0, 12.0, 7.0, 11.0, 27.0, 28.0, 39.0, 34.0, 60.0, 71.0, 72.0, 92.0, 90.0, 79.0, 73.0, 62.0, 52.0, 41.0, 36.0, 29.0, 15.0, 19.0, 13.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-1.88671875, -1.843170166015625, -1.79962158203125, -1.756072998046875, -1.7125244140625, -1.668975830078125, -1.62542724609375, -1.581878662109375, -1.538330078125, -1.494781494140625, -1.45123291015625, -1.407684326171875, -1.3641357421875, -1.320587158203125, -1.27703857421875, -1.233489990234375, -1.18994140625, -1.146392822265625, -1.10284423828125, -1.059295654296875, -1.0157470703125, -0.972198486328125, -0.92864990234375, -0.885101318359375, -0.841552734375, -0.798004150390625, -0.75445556640625, -0.710906982421875, -0.6673583984375, -0.623809814453125, -0.58026123046875, -0.536712646484375, -0.4931640625, -0.449615478515625, -0.40606689453125, -0.362518310546875, -0.3189697265625, -0.275421142578125, -0.23187255859375, -0.188323974609375, -0.144775390625, -0.101226806640625, -0.05767822265625, -0.014129638671875, 0.0294189453125, 0.072967529296875, 0.11651611328125, 0.160064697265625, 0.20361328125, 0.247161865234375, 0.29071044921875, 0.334259033203125, 0.3778076171875, 0.421356201171875, 0.46490478515625, 0.508453369140625, 0.552001953125, 0.595550537109375, 0.63909912109375, 0.682647705078125, 0.7261962890625, 0.769744873046875, 0.81329345703125, 0.856842041015625, 0.900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 10.0, 10.0, 16.0, 21.0, 31.0, 52.0, 53.0, 82.0, 124.0, 144.0, 207.0, 326.0, 394.0, 587.0, 886.0, 1449.0, 2705.0, 5562.0, 15010.0, 81207.0, 4017004.0, 46117.0, 11456.0, 4447.0, 2284.0, 1347.0, 856.0, 537.0, 390.0, 266.0, 184.0, 122.0, 100.0, 77.0, 51.0, 41.0, 22.0, 17.0, 9.0, 13.0, 13.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.3828125, -7.15478515625, -6.9267578125, -6.69873046875, -6.470703125, -6.24267578125, -6.0146484375, -5.78662109375, -5.55859375, -5.33056640625, -5.1025390625, -4.87451171875, -4.646484375, -4.41845703125, -4.1904296875, -3.96240234375, -3.734375, -3.50634765625, -3.2783203125, -3.05029296875, -2.822265625, -2.59423828125, -2.3662109375, -2.13818359375, -1.91015625, -1.68212890625, -1.4541015625, -1.22607421875, -0.998046875, -0.77001953125, -0.5419921875, -0.31396484375, -0.0859375, 0.14208984375, 0.3701171875, 0.59814453125, 0.826171875, 1.05419921875, 1.2822265625, 1.51025390625, 1.73828125, 1.96630859375, 2.1943359375, 2.42236328125, 2.650390625, 2.87841796875, 3.1064453125, 3.33447265625, 3.5625, 3.79052734375, 4.0185546875, 4.24658203125, 4.474609375, 4.70263671875, 4.9306640625, 5.15869140625, 5.38671875, 5.61474609375, 5.8427734375, 6.07080078125, 6.298828125, 6.52685546875, 6.7548828125, 6.98291015625, 7.2109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 12.0, 9.0, 14.0, 22.0, 62.0, 366.0, 3382.0, 98.0, 37.0, 17.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.587890625, -2.5199127197265625, -2.451934814453125, -2.3839569091796875, -2.31597900390625, -2.2480010986328125, -2.180023193359375, -2.1120452880859375, -2.0440673828125, -1.9760894775390625, -1.908111572265625, -1.8401336669921875, -1.77215576171875, -1.7041778564453125, -1.636199951171875, -1.5682220458984375, -1.500244140625, -1.4322662353515625, -1.364288330078125, -1.2963104248046875, -1.22833251953125, -1.1603546142578125, -1.092376708984375, -1.0243988037109375, -0.9564208984375, -0.8884429931640625, -0.820465087890625, -0.7524871826171875, -0.68450927734375, -0.6165313720703125, -0.548553466796875, -0.4805755615234375, -0.41259765625, -0.3446197509765625, -0.276641845703125, -0.2086639404296875, -0.14068603515625, -0.0727081298828125, -0.004730224609375, 0.0632476806640625, 0.1312255859375, 0.1992034912109375, 0.267181396484375, 0.3351593017578125, 0.40313720703125, 0.4711151123046875, 0.539093017578125, 0.6070709228515625, 0.675048828125, 0.7430267333984375, 0.811004638671875, 0.8789825439453125, 0.94696044921875, 1.0149383544921875, 1.082916259765625, 1.1508941650390625, 1.2188720703125, 1.2868499755859375, 1.354827880859375, 1.4228057861328125, 1.49078369140625, 1.5587615966796875, 1.626739501953125, 1.6947174072265625, 1.7626953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 7.0, 1.0, 7.0, 9.0, 20.0, 42.0, 61.0, 90.0, 146.0, 194.0, 174.0, 124.0, 66.0, 32.0, 17.0, 8.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.433637619018555, -14.051681518554688, -13.669726371765137, -13.28777027130127, -12.905814170837402, -12.523858070373535, -12.141902923583984, -11.759946823120117, -11.37799072265625, -10.996034622192383, -10.614079475402832, -10.232123374938965, -9.850167274475098, -9.46821117401123, -9.08625602722168, -8.704299926757812, -8.322343826293945, -7.940388202667236, -7.558432102203369, -7.17647647857666, -6.794520378112793, -6.412564754486084, -6.030609130859375, -5.648653030395508, -5.266697883605957, -4.884742259979248, -4.502786159515381, -4.120830535888672, -3.7388744354248047, -3.3569188117980957, -2.9749629497528076, -2.5930070877075195, -2.2110509872436523, -1.8290951251983643, -1.4471392631530762, -1.0651835203170776, -0.6832276582717896, -0.30127179622650146, 0.08068394660949707, 0.46263980865478516, 0.8445956707000732, 1.2265515327453613, 1.6085073947906494, 1.990463137626648, 2.3724188804626465, 2.7543749809265137, 3.1363306045532227, 3.5182864665985107, 3.900242328643799, 4.282197952270508, 4.664154052734375, 5.046109676361084, 5.428065776824951, 5.81002140045166, 6.191977500915527, 6.573933124542236, 6.955888748168945, 7.337844371795654, 7.7198004722595215, 8.10175609588623, 8.483712196350098, 8.865668296813965, 9.247623443603516, 9.629579544067383, 10.01153564453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 6.0, 8.0, 16.0, 14.0, 17.0, 18.0, 15.0, 17.0, 26.0, 28.0, 29.0, 35.0, 41.0, 35.0, 39.0, 48.0, 51.0, 49.0, 37.0, 45.0, 46.0, 42.0, 42.0, 32.0, 27.0, 25.0, 30.0, 22.0, 29.0, 16.0, 18.0, 13.0, 13.0, 14.0, 10.0, 8.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.744624614715576, -3.6153879165649414, -3.4861512184143066, -3.356914758682251, -3.227678060531616, -3.0984413623809814, -2.969204902648926, -2.839968204498291, -2.7107315063476562, -2.5814948081970215, -2.4522581100463867, -2.323021650314331, -2.1937849521636963, -2.0645482540130615, -1.9353116750717163, -1.806075096130371, -1.6768383979797363, -1.5476016998291016, -1.4183651208877563, -1.2891285419464111, -1.1598918437957764, -1.0306551456451416, -0.9014185667037964, -0.7721819281578064, -0.6429452896118164, -0.5137086510658264, -0.3844720125198364, -0.25523537397384644, -0.12599873542785645, 0.003237903118133545, 0.13247454166412354, 0.2617111802101135, 0.3909473419189453, 0.5201839804649353, 0.6494206190109253, 0.7786572575569153, 0.9078938961029053, 1.03713059425354, 1.1663671731948853, 1.2956037521362305, 1.4248404502868652, 1.5540771484375, 1.6833137273788452, 1.8125503063201904, 1.9417870044708252, 2.07102370262146, 2.2002601623535156, 2.3294968605041504, 2.458733558654785, 2.58797025680542, 2.7172069549560547, 2.8464434146881104, 2.975680112838745, 3.10491681098938, 3.2341532707214355, 3.3633899688720703, 3.492626667022705, 3.62186336517334, 3.7511000633239746, 3.8803365230560303, 4.009572982788086, 4.138809680938721, 4.2680463790893555, 4.39728307723999, 4.526519775390625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 14.0, 27.0, 21.0, 15.0, 38.0, 67.0, 78.0, 103.0, 186.0, 213.0, 348.0, 582.0, 886.0, 1460.0, 2340.0, 4163.0, 7424.0, 14245.0, 27821.0, 56742.0, 120447.0, 230341.0, 267519.0, 159495.0, 76801.0, 36517.0, 18137.0, 9493.0, 5150.0, 2992.0, 1751.0, 1057.0, 699.0, 418.0, 311.0, 189.0, 117.0, 91.0, 76.0, 53.0, 30.0, 27.0, 20.0, 10.0, 12.0, 6.0, 1.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.240234375, -2.166046142578125, -2.09185791015625, -2.017669677734375, -1.9434814453125, -1.869293212890625, -1.79510498046875, -1.720916748046875, -1.646728515625, -1.572540283203125, -1.49835205078125, -1.424163818359375, -1.3499755859375, -1.275787353515625, -1.20159912109375, -1.127410888671875, -1.05322265625, -0.979034423828125, -0.90484619140625, -0.830657958984375, -0.7564697265625, -0.682281494140625, -0.60809326171875, -0.533905029296875, -0.459716796875, -0.385528564453125, -0.31134033203125, -0.237152099609375, -0.1629638671875, -0.088775634765625, -0.01458740234375, 0.059600830078125, 0.1337890625, 0.207977294921875, 0.28216552734375, 0.356353759765625, 0.4305419921875, 0.504730224609375, 0.57891845703125, 0.653106689453125, 0.727294921875, 0.801483154296875, 0.87567138671875, 0.949859619140625, 1.0240478515625, 1.098236083984375, 1.17242431640625, 1.246612548828125, 1.32080078125, 1.394989013671875, 1.46917724609375, 1.543365478515625, 1.6175537109375, 1.691741943359375, 1.76593017578125, 1.840118408203125, 1.914306640625, 1.988494873046875, 2.06268310546875, 2.136871337890625, 2.2110595703125, 2.285247802734375, 2.35943603515625, 2.433624267578125, 2.5078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 9.0, 5.0, 8.0, 7.0, 7.0, 10.0, 15.0, 11.0, 27.0, 18.0, 41.0, 50.0, 42.0, 57.0, 63.0, 64.0, 86.0, 64.0, 71.0, 55.0, 49.0, 37.0, 45.0, 30.0, 28.0, 26.0, 22.0, 16.0, 17.0, 9.0, 7.0, 10.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7757720947265625, -1.726348876953125, -1.6769256591796875, -1.62750244140625, -1.5780792236328125, -1.528656005859375, -1.4792327880859375, -1.4298095703125, -1.3803863525390625, -1.330963134765625, -1.2815399169921875, -1.23211669921875, -1.1826934814453125, -1.133270263671875, -1.0838470458984375, -1.034423828125, -0.9850006103515625, -0.935577392578125, -0.8861541748046875, -0.83673095703125, -0.7873077392578125, -0.737884521484375, -0.6884613037109375, -0.6390380859375, -0.5896148681640625, -0.540191650390625, -0.4907684326171875, -0.44134521484375, -0.3919219970703125, -0.342498779296875, -0.2930755615234375, -0.24365234375, -0.1942291259765625, -0.144805908203125, -0.0953826904296875, -0.04595947265625, 0.0034637451171875, 0.052886962890625, 0.1023101806640625, 0.1517333984375, 0.2011566162109375, 0.250579833984375, 0.3000030517578125, 0.34942626953125, 0.3988494873046875, 0.448272705078125, 0.4976959228515625, 0.547119140625, 0.5965423583984375, 0.645965576171875, 0.6953887939453125, 0.74481201171875, 0.7942352294921875, 0.843658447265625, 0.8930816650390625, 0.9425048828125, 0.9919281005859375, 1.041351318359375, 1.0907745361328125, 1.14019775390625, 1.1896209716796875, 1.239044189453125, 1.2884674072265625, 1.337890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 17.0, 17.0, 24.0, 34.0, 63.0, 90.0, 176.0, 352.0, 811.0, 2568.0, 9258.0, 52966.0, 533361.0, 398287.0, 39330.0, 7546.0, 2146.0, 740.0, 319.0, 163.0, 102.0, 66.0, 36.0, 25.0, 10.0, 16.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5546875, -6.28076171875, -6.0068359375, -5.73291015625, -5.458984375, -5.18505859375, -4.9111328125, -4.63720703125, -4.36328125, -4.08935546875, -3.8154296875, -3.54150390625, -3.267578125, -2.99365234375, -2.7197265625, -2.44580078125, -2.171875, -1.89794921875, -1.6240234375, -1.35009765625, -1.076171875, -0.80224609375, -0.5283203125, -0.25439453125, 0.01953125, 0.29345703125, 0.5673828125, 0.84130859375, 1.115234375, 1.38916015625, 1.6630859375, 1.93701171875, 2.2109375, 2.48486328125, 2.7587890625, 3.03271484375, 3.306640625, 3.58056640625, 3.8544921875, 4.12841796875, 4.40234375, 4.67626953125, 4.9501953125, 5.22412109375, 5.498046875, 5.77197265625, 6.0458984375, 6.31982421875, 6.59375, 6.86767578125, 7.1416015625, 7.41552734375, 7.689453125, 7.96337890625, 8.2373046875, 8.51123046875, 8.78515625, 9.05908203125, 9.3330078125, 9.60693359375, 9.880859375, 10.15478515625, 10.4287109375, 10.70263671875, 10.9765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 7.0, 6.0, 6.0, 6.0, 10.0, 19.0, 26.0, 27.0, 37.0, 37.0, 34.0, 40.0, 54.0, 53.0, 48.0, 64.0, 67.0, 44.0, 51.0, 60.0, 43.0, 37.0, 36.0, 34.0, 30.0, 16.0, 19.0, 13.0, 12.0, 13.0, 7.0, 12.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.6953125, -8.45477294921875, -8.2142333984375, -7.97369384765625, -7.733154296875, -7.49261474609375, -7.2520751953125, -7.01153564453125, -6.77099609375, -6.53045654296875, -6.2899169921875, -6.04937744140625, -5.808837890625, -5.56829833984375, -5.3277587890625, -5.08721923828125, -4.8466796875, -4.60614013671875, -4.3656005859375, -4.12506103515625, -3.884521484375, -3.64398193359375, -3.4034423828125, -3.16290283203125, -2.92236328125, -2.68182373046875, -2.4412841796875, -2.20074462890625, -1.960205078125, -1.71966552734375, -1.4791259765625, -1.23858642578125, -0.998046875, -0.75750732421875, -0.5169677734375, -0.27642822265625, -0.035888671875, 0.20465087890625, 0.4451904296875, 0.68572998046875, 0.92626953125, 1.16680908203125, 1.4073486328125, 1.64788818359375, 1.888427734375, 2.12896728515625, 2.3695068359375, 2.61004638671875, 2.8505859375, 3.09112548828125, 3.3316650390625, 3.57220458984375, 3.812744140625, 4.05328369140625, 4.2938232421875, 4.53436279296875, 4.77490234375, 5.01544189453125, 5.2559814453125, 5.49652099609375, 5.737060546875, 5.97760009765625, 6.2181396484375, 6.45867919921875, 6.69921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 1.0, 10.0, 9.0, 8.0, 12.0, 24.0, 33.0, 46.0, 59.0, 92.0, 115.0, 201.0, 318.0, 500.0, 976.0, 2180.0, 5601.0, 19951.0, 124984.0, 686867.0, 170479.0, 24405.0, 6589.0, 2358.0, 1132.0, 564.0, 333.0, 219.0, 133.0, 108.0, 64.0, 44.0, 28.0, 24.0, 13.0, 13.0, 11.0, 11.0, 3.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.0546875, -2.957916259765625, -2.86114501953125, -2.764373779296875, -2.6676025390625, -2.570831298828125, -2.47406005859375, -2.377288818359375, -2.280517578125, -2.183746337890625, -2.08697509765625, -1.990203857421875, -1.8934326171875, -1.796661376953125, -1.69989013671875, -1.603118896484375, -1.50634765625, -1.409576416015625, -1.31280517578125, -1.216033935546875, -1.1192626953125, -1.022491455078125, -0.92572021484375, -0.828948974609375, -0.732177734375, -0.635406494140625, -0.53863525390625, -0.441864013671875, -0.3450927734375, -0.248321533203125, -0.15155029296875, -0.054779052734375, 0.0419921875, 0.138763427734375, 0.23553466796875, 0.332305908203125, 0.4290771484375, 0.525848388671875, 0.62261962890625, 0.719390869140625, 0.816162109375, 0.912933349609375, 1.00970458984375, 1.106475830078125, 1.2032470703125, 1.300018310546875, 1.39678955078125, 1.493560791015625, 1.59033203125, 1.687103271484375, 1.78387451171875, 1.880645751953125, 1.9774169921875, 2.074188232421875, 2.17095947265625, 2.267730712890625, 2.364501953125, 2.461273193359375, 2.55804443359375, 2.654815673828125, 2.7515869140625, 2.848358154296875, 2.94512939453125, 3.041900634765625, 3.138671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 16.0, 35.0, 46.0, 93.0, 114.0, 161.0, 163.0, 139.0, 72.0, 44.0, 37.0, 15.0, 4.0, 8.0, 5.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004634857177734375, -0.00044229626655578613, -0.00042110681533813477, -0.0003999173641204834, -0.00037872791290283203, -0.00035753846168518066, -0.0003363490104675293, -0.00031515955924987793, -0.00029397010803222656, -0.0002727806568145752, -0.00025159120559692383, -0.00023040175437927246, -0.0002092123031616211, -0.00018802285194396973, -0.00016683340072631836, -0.000145643949508667, -0.00012445449829101562, -0.00010326504707336426, -8.207559585571289e-05, -6.0886144638061523e-05, -3.9696693420410156e-05, -1.850724220275879e-05, 2.682209014892578e-06, 2.3871660232543945e-05, 4.506111145019531e-05, 6.625056266784668e-05, 8.744001388549805e-05, 0.00010862946510314941, 0.00012981891632080078, 0.00015100836753845215, 0.00017219781875610352, 0.00019338726997375488, 0.00021457672119140625, 0.00023576617240905762, 0.000256955623626709, 0.00027814507484436035, 0.0002993345260620117, 0.0003205239772796631, 0.00034171342849731445, 0.0003629028797149658, 0.0003840923309326172, 0.00040528178215026855, 0.0004264712333679199, 0.0004476606845855713, 0.00046885013580322266, 0.000490039587020874, 0.0005112290382385254, 0.0005324184894561768, 0.0005536079406738281, 0.0005747973918914795, 0.0005959868431091309, 0.0006171762943267822, 0.0006383657455444336, 0.000659555196762085, 0.0006807446479797363, 0.0007019340991973877, 0.0007231235504150391, 0.0007443130016326904, 0.0007655024528503418, 0.0007866919040679932, 0.0008078813552856445, 0.0008290708065032959, 0.0008502602577209473, 0.0008714497089385986, 0.00089263916015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 6.0, 13.0, 8.0, 20.0, 23.0, 38.0, 48.0, 90.0, 144.0, 237.0, 540.0, 1256.0, 3819.0, 17071.0, 228786.0, 734936.0, 50384.0, 7463.0, 2037.0, 778.0, 373.0, 178.0, 109.0, 57.0, 57.0, 25.0, 19.0, 14.0, 11.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.0223388671875, -2.892333984375, -2.7623291015625, -2.63232421875, -2.5023193359375, -2.372314453125, -2.2423095703125, -2.1123046875, -1.9822998046875, -1.852294921875, -1.7222900390625, -1.59228515625, -1.4622802734375, -1.332275390625, -1.2022705078125, -1.072265625, -0.9422607421875, -0.812255859375, -0.6822509765625, -0.55224609375, -0.4222412109375, -0.292236328125, -0.1622314453125, -0.0322265625, 0.0977783203125, 0.227783203125, 0.3577880859375, 0.48779296875, 0.6177978515625, 0.747802734375, 0.8778076171875, 1.0078125, 1.1378173828125, 1.267822265625, 1.3978271484375, 1.52783203125, 1.6578369140625, 1.787841796875, 1.9178466796875, 2.0478515625, 2.1778564453125, 2.307861328125, 2.4378662109375, 2.56787109375, 2.6978759765625, 2.827880859375, 2.9578857421875, 3.087890625, 3.2178955078125, 3.347900390625, 3.4779052734375, 3.60791015625, 3.7379150390625, 3.867919921875, 3.9979248046875, 4.1279296875, 4.2579345703125, 4.387939453125, 4.5179443359375, 4.64794921875, 4.7779541015625, 4.907958984375, 5.0379638671875, 5.16796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 10.0, 9.0, 24.0, 17.0, 33.0, 41.0, 71.0, 86.0, 96.0, 80.0, 94.0, 85.0, 88.0, 68.0, 51.0, 41.0, 23.0, 20.0, 16.0, 11.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.461822509765625, -3.36309814453125, -3.264373779296875, -3.1656494140625, -3.066925048828125, -2.96820068359375, -2.869476318359375, -2.770751953125, -2.672027587890625, -2.57330322265625, -2.474578857421875, -2.3758544921875, -2.277130126953125, -2.17840576171875, -2.079681396484375, -1.98095703125, -1.882232666015625, -1.78350830078125, -1.684783935546875, -1.5860595703125, -1.487335205078125, -1.38861083984375, -1.289886474609375, -1.191162109375, -1.092437744140625, -0.99371337890625, -0.894989013671875, -0.7962646484375, -0.697540283203125, -0.59881591796875, -0.500091552734375, -0.4013671875, -0.302642822265625, -0.20391845703125, -0.105194091796875, -0.0064697265625, 0.092254638671875, 0.19097900390625, 0.289703369140625, 0.388427734375, 0.487152099609375, 0.58587646484375, 0.684600830078125, 0.7833251953125, 0.882049560546875, 0.98077392578125, 1.079498291015625, 1.17822265625, 1.276947021484375, 1.37567138671875, 1.474395751953125, 1.5731201171875, 1.671844482421875, 1.77056884765625, 1.869293212890625, 1.968017578125, 2.066741943359375, 2.16546630859375, 2.264190673828125, 2.3629150390625, 2.461639404296875, 2.56036376953125, 2.659088134765625, 2.7578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 15.0, 25.0, 106.0, 250.0, 320.0, 179.0, 80.0, 18.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.21542358398438, -168.31869506835938, -164.42196655273438, -160.5252227783203, -156.6284942626953, -152.7317657470703, -148.8350372314453, -144.93829345703125, -141.04156494140625, -137.14483642578125, -133.24810791015625, -129.3513641357422, -125.45463562011719, -121.55790710449219, -117.66117858886719, -113.76444244384766, -109.86771392822266, -105.97098541259766, -102.07424926757812, -98.17752075195312, -94.2807846069336, -90.3840560913086, -86.48731994628906, -82.59059143066406, -78.69386291503906, -74.79713439941406, -70.90039825439453, -67.00366973876953, -63.10693359375, -59.210205078125, -55.313472747802734, -51.41674041748047, -47.52001190185547, -43.6232795715332, -39.72654724121094, -35.82981872558594, -31.93308448791504, -28.036352157592773, -24.13962173461914, -20.242889404296875, -16.34615707397461, -12.449424743652344, -8.552693367004395, -4.655961990356445, -0.7592296600341797, 3.137502670288086, 7.034233093261719, 10.930965423583984, 14.82769775390625, 18.724430084228516, 22.62116241455078, 26.517892837524414, 30.41462516784668, 34.31135559082031, 38.20808792114258, 42.104820251464844, 46.00155258178711, 49.898284912109375, 53.79501724243164, 57.691749572753906, 61.588478088378906, 65.48521423339844, 69.38194274902344, 73.27867126464844, 77.17540740966797]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 10.0, 5.0, 12.0, 13.0, 21.0, 22.0, 19.0, 24.0, 27.0, 35.0, 36.0, 41.0, 46.0, 52.0, 55.0, 59.0, 58.0, 64.0, 62.0, 35.0, 47.0, 32.0, 32.0, 32.0, 26.0, 29.0, 19.0, 17.0, 12.0, 14.0, 9.0, 10.0, 3.0, 1.0, 8.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.93239974975586, -28.862197875976562, -27.7919979095459, -26.7217960357666, -25.651594161987305, -24.58139419555664, -23.511192321777344, -22.440990447998047, -21.37078857421875, -20.300586700439453, -19.23038673400879, -18.160184860229492, -17.089982986450195, -16.01978302001953, -14.949581146240234, -13.879379272460938, -12.809179306030273, -11.738978385925293, -10.668776512145996, -9.598575592041016, -8.528373718261719, -7.458172798156738, -6.387971878051758, -5.317770481109619, -4.2475690841674805, -3.177367687225342, -2.1071665287017822, -1.0369653701782227, 0.033236026763916016, 1.1034374237060547, 2.173638343811035, 3.243839740753174, 4.3140411376953125, 5.384242534637451, 6.45444393157959, 7.52464485168457, 8.594846725463867, 9.665047645568848, 10.735248565673828, 11.805450439453125, 12.875651359558105, 13.945852279663086, 15.016054153442383, 16.086254119873047, 17.156455993652344, 18.22665786743164, 19.296859741210938, 20.3670597076416, 21.4372615814209, 22.507463455200195, 23.57766342163086, 24.647865295410156, 25.718067169189453, 26.78826904296875, 27.858469009399414, 28.92867088317871, 29.998870849609375, 31.069072723388672, 32.13927459716797, 33.20947265625, 34.2796745300293, 35.349876403808594, 36.42007827758789, 37.49028015136719, 38.560482025146484]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 1.0, 6.0, 5.0, 6.0, 14.0, 19.0, 23.0, 49.0, 62.0, 127.0, 199.0, 386.0, 747.0, 1773.0, 4900.0, 30886.0, 4134614.0, 14250.0, 3450.0, 1316.0, 640.0, 336.0, 185.0, 99.0, 71.0, 38.0, 18.0, 21.0, 11.0, 6.0, 6.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.6378173828125, -9.330322265625, -9.0228271484375, -8.71533203125, -8.4078369140625, -8.100341796875, -7.7928466796875, -7.4853515625, -7.1778564453125, -6.870361328125, -6.5628662109375, -6.25537109375, -5.9478759765625, -5.640380859375, -5.3328857421875, -5.025390625, -4.7178955078125, -4.410400390625, -4.1029052734375, -3.79541015625, -3.4879150390625, -3.180419921875, -2.8729248046875, -2.5654296875, -2.2579345703125, -1.950439453125, -1.6429443359375, -1.33544921875, -1.0279541015625, -0.720458984375, -0.4129638671875, -0.10546875, 0.2020263671875, 0.509521484375, 0.8170166015625, 1.12451171875, 1.4320068359375, 1.739501953125, 2.0469970703125, 2.3544921875, 2.6619873046875, 2.969482421875, 3.2769775390625, 3.58447265625, 3.8919677734375, 4.199462890625, 4.5069580078125, 4.814453125, 5.1219482421875, 5.429443359375, 5.7369384765625, 6.04443359375, 6.3519287109375, 6.659423828125, 6.9669189453125, 7.2744140625, 7.5819091796875, 7.889404296875, 8.1968994140625, 8.50439453125, 8.8118896484375, 9.119384765625, 9.4268798828125, 9.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 15.0, 10.0, 19.0, 19.0, 24.0, 36.0, 42.0, 79.0, 73.0, 109.0, 88.0, 91.0, 89.0, 80.0, 62.0, 43.0, 32.0, 25.0, 20.0, 10.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.306549072265625, -2.22637939453125, -2.146209716796875, -2.0660400390625, -1.985870361328125, -1.90570068359375, -1.825531005859375, -1.745361328125, -1.665191650390625, -1.58502197265625, -1.504852294921875, -1.4246826171875, -1.344512939453125, -1.26434326171875, -1.184173583984375, -1.10400390625, -1.023834228515625, -0.94366455078125, -0.863494873046875, -0.7833251953125, -0.703155517578125, -0.62298583984375, -0.542816162109375, -0.462646484375, -0.382476806640625, -0.30230712890625, -0.222137451171875, -0.1419677734375, -0.061798095703125, 0.01837158203125, 0.098541259765625, 0.1787109375, 0.258880615234375, 0.33905029296875, 0.419219970703125, 0.4993896484375, 0.579559326171875, 0.65972900390625, 0.739898681640625, 0.820068359375, 0.900238037109375, 0.98040771484375, 1.060577392578125, 1.1407470703125, 1.220916748046875, 1.30108642578125, 1.381256103515625, 1.46142578125, 1.541595458984375, 1.62176513671875, 1.701934814453125, 1.7821044921875, 1.862274169921875, 1.94244384765625, 2.022613525390625, 2.102783203125, 2.182952880859375, 2.26312255859375, 2.343292236328125, 2.4234619140625, 2.503631591796875, 2.58380126953125, 2.663970947265625, 2.744140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 13.0, 14.0, 19.0, 19.0, 23.0, 35.0, 50.0, 67.0, 116.0, 156.0, 231.0, 355.0, 522.0, 742.0, 1131.0, 1688.0, 2876.0, 5554.0, 14746.0, 177759.0, 3955611.0, 17787.0, 6049.0, 3100.0, 1873.0, 1185.0, 801.0, 526.0, 368.0, 251.0, 167.0, 126.0, 101.0, 63.0, 48.0, 30.0, 27.0, 17.0, 7.0, 9.0, 4.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6875, -7.41357421875, -7.1396484375, -6.86572265625, -6.591796875, -6.31787109375, -6.0439453125, -5.77001953125, -5.49609375, -5.22216796875, -4.9482421875, -4.67431640625, -4.400390625, -4.12646484375, -3.8525390625, -3.57861328125, -3.3046875, -3.03076171875, -2.7568359375, -2.48291015625, -2.208984375, -1.93505859375, -1.6611328125, -1.38720703125, -1.11328125, -0.83935546875, -0.5654296875, -0.29150390625, -0.017578125, 0.25634765625, 0.5302734375, 0.80419921875, 1.078125, 1.35205078125, 1.6259765625, 1.89990234375, 2.173828125, 2.44775390625, 2.7216796875, 2.99560546875, 3.26953125, 3.54345703125, 3.8173828125, 4.09130859375, 4.365234375, 4.63916015625, 4.9130859375, 5.18701171875, 5.4609375, 5.73486328125, 6.0087890625, 6.28271484375, 6.556640625, 6.83056640625, 7.1044921875, 7.37841796875, 7.65234375, 7.92626953125, 8.2001953125, 8.47412109375, 8.748046875, 9.02197265625, 9.2958984375, 9.56982421875, 9.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 17.0, 23.0, 61.0, 3721.0, 150.0, 26.0, 17.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.20831298828125, -2.1314697265625, -2.05462646484375, -1.977783203125, -1.90093994140625, -1.8240966796875, -1.74725341796875, -1.67041015625, -1.59356689453125, -1.5167236328125, -1.43988037109375, -1.363037109375, -1.28619384765625, -1.2093505859375, -1.13250732421875, -1.0556640625, -0.97882080078125, -0.9019775390625, -0.82513427734375, -0.748291015625, -0.67144775390625, -0.5946044921875, -0.51776123046875, -0.44091796875, -0.36407470703125, -0.2872314453125, -0.21038818359375, -0.133544921875, -0.05670166015625, 0.0201416015625, 0.09698486328125, 0.173828125, 0.25067138671875, 0.3275146484375, 0.40435791015625, 0.481201171875, 0.55804443359375, 0.6348876953125, 0.71173095703125, 0.78857421875, 0.86541748046875, 0.9422607421875, 1.01910400390625, 1.095947265625, 1.17279052734375, 1.2496337890625, 1.32647705078125, 1.4033203125, 1.48016357421875, 1.5570068359375, 1.63385009765625, 1.710693359375, 1.78753662109375, 1.8643798828125, 1.94122314453125, 2.01806640625, 2.09490966796875, 2.1717529296875, 2.24859619140625, 2.325439453125, 2.40228271484375, 2.4791259765625, 2.55596923828125, 2.6328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 8.0, 9.0, 31.0, 67.0, 177.0, 192.0, 211.0, 134.0, 81.0, 47.0, 20.0, 10.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.363758087158203, -17.943307876586914, -17.522857666015625, -17.10240936279297, -16.68195915222168, -16.26150894165039, -15.841058731079102, -15.420608520507812, -15.000158309936523, -14.579708099365234, -14.159258842468262, -13.738808631896973, -13.318358421325684, -12.897909164428711, -12.477458953857422, -12.057008743286133, -11.63655948638916, -11.216109275817871, -10.795660018920898, -10.37520980834961, -9.95475959777832, -9.534309387207031, -9.113860130310059, -8.69340991973877, -8.272960662841797, -7.852510929107666, -7.432060718536377, -7.011610984802246, -6.591160774230957, -6.170711040496826, -5.750261306762695, -5.329811096191406, -4.909359931945801, -4.48891019821167, -4.068459987640381, -3.64801025390625, -3.22756028175354, -2.80711030960083, -2.386660575866699, -1.9662106037139893, -1.5457606315612793, -1.1253106594085693, -0.7048608064651489, -0.2844109535217285, 0.13603901863098145, 0.5564889907836914, 0.9769387245178223, 1.3973886966705322, 1.8178386688232422, 2.238288640975952, 2.658738613128662, 3.079188346862793, 3.499638319015503, 3.920088291168213, 4.340538024902344, 4.760988235473633, 5.181437969207764, 5.6018877029418945, 6.022337913513184, 6.4427876472473145, 6.863237380981445, 7.283687591552734, 7.704137325286865, 8.124587059020996, 8.545037269592285]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 8.0, 8.0, 12.0, 9.0, 16.0, 18.0, 21.0, 24.0, 17.0, 27.0, 26.0, 32.0, 28.0, 36.0, 32.0, 37.0, 45.0, 29.0, 34.0, 33.0, 49.0, 41.0, 37.0, 40.0, 29.0, 38.0, 29.0, 24.0, 29.0, 33.0, 19.0, 21.0, 12.0, 16.0, 16.0, 10.0, 5.0, 9.0, 6.0, 3.0, 3.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0], "bins": [-4.406777858734131, -4.285886764526367, -4.1649956703186035, -4.04410457611084, -3.923213481903076, -3.8023223876953125, -3.681431293487549, -3.560540199279785, -3.4396491050720215, -3.318758010864258, -3.197866916656494, -3.0769758224487305, -2.956084728240967, -2.835193634033203, -2.7143025398254395, -2.593411445617676, -2.472520351409912, -2.3516292572021484, -2.2307381629943848, -2.109847068786621, -1.9889559745788574, -1.8680648803710938, -1.74717378616333, -1.6262826919555664, -1.5053918361663818, -1.3845007419586182, -1.2636096477508545, -1.1427185535430908, -1.0218274593353271, -0.9009364247322083, -0.7800453305244446, -0.6591542363166809, -0.5382630825042725, -0.4173719882965088, -0.2964808940887451, -0.17558982968330383, -0.05469873547554016, 0.06619232892990112, 0.1870834231376648, 0.30797451734542847, 0.42886561155319214, 0.5497567057609558, 0.6706477999687195, 0.7915388345718384, 0.912429928779602, 1.0333210229873657, 1.1542121171951294, 1.275103211402893, 1.3959943056106567, 1.5168853998184204, 1.637776494026184, 1.7586675882339478, 1.8795586824417114, 2.0004496574401855, 2.121340751647949, 2.242231845855713, 2.3631229400634766, 2.4840140342712402, 2.604905128479004, 2.7257962226867676, 2.8466873168945312, 2.967578411102295, 3.0884695053100586, 3.2093605995178223, 3.330251693725586]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 13.0, 10.0, 19.0, 34.0, 52.0, 98.0, 130.0, 274.0, 407.0, 820.0, 1864.0, 4650.0, 13536.0, 46968.0, 199232.0, 529657.0, 185852.0, 44070.0, 12881.0, 4278.0, 1850.0, 854.0, 413.0, 213.0, 125.0, 76.0, 49.0, 34.0, 19.0, 15.0, 15.0, 14.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-6.4453125, -6.26861572265625, -6.0919189453125, -5.91522216796875, -5.738525390625, -5.56182861328125, -5.3851318359375, -5.20843505859375, -5.03173828125, -4.85504150390625, -4.6783447265625, -4.50164794921875, -4.324951171875, -4.14825439453125, -3.9715576171875, -3.79486083984375, -3.6181640625, -3.44146728515625, -3.2647705078125, -3.08807373046875, -2.911376953125, -2.73468017578125, -2.5579833984375, -2.38128662109375, -2.20458984375, -2.02789306640625, -1.8511962890625, -1.67449951171875, -1.497802734375, -1.32110595703125, -1.1444091796875, -0.96771240234375, -0.791015625, -0.61431884765625, -0.4376220703125, -0.26092529296875, -0.084228515625, 0.09246826171875, 0.2691650390625, 0.44586181640625, 0.62255859375, 0.79925537109375, 0.9759521484375, 1.15264892578125, 1.329345703125, 1.50604248046875, 1.6827392578125, 1.85943603515625, 2.0361328125, 2.21282958984375, 2.3895263671875, 2.56622314453125, 2.742919921875, 2.91961669921875, 3.0963134765625, 3.27301025390625, 3.44970703125, 3.62640380859375, 3.8031005859375, 3.97979736328125, 4.156494140625, 4.33319091796875, 4.5098876953125, 4.68658447265625, 4.86328125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 15.0, 15.0, 23.0, 22.0, 32.0, 41.0, 55.0, 75.0, 80.0, 89.0, 98.0, 75.0, 69.0, 75.0, 61.0, 46.0, 38.0, 26.0, 11.0, 9.0, 15.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.173828125, -3.08428955078125, -2.9947509765625, -2.90521240234375, -2.815673828125, -2.72613525390625, -2.6365966796875, -2.54705810546875, -2.45751953125, -2.36798095703125, -2.2784423828125, -2.18890380859375, -2.099365234375, -2.00982666015625, -1.9202880859375, -1.83074951171875, -1.7412109375, -1.65167236328125, -1.5621337890625, -1.47259521484375, -1.383056640625, -1.29351806640625, -1.2039794921875, -1.11444091796875, -1.02490234375, -0.93536376953125, -0.8458251953125, -0.75628662109375, -0.666748046875, -0.57720947265625, -0.4876708984375, -0.39813232421875, -0.30859375, -0.21905517578125, -0.1295166015625, -0.03997802734375, 0.049560546875, 0.13909912109375, 0.2286376953125, 0.31817626953125, 0.40771484375, 0.49725341796875, 0.5867919921875, 0.67633056640625, 0.765869140625, 0.85540771484375, 0.9449462890625, 1.03448486328125, 1.1240234375, 1.21356201171875, 1.3031005859375, 1.39263916015625, 1.482177734375, 1.57171630859375, 1.6612548828125, 1.75079345703125, 1.84033203125, 1.92987060546875, 2.0194091796875, 2.10894775390625, 2.198486328125, 2.28802490234375, 2.3775634765625, 2.46710205078125, 2.556640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 8.0, 7.0, 5.0, 4.0, 7.0, 15.0, 13.0, 17.0, 25.0, 36.0, 49.0, 88.0, 137.0, 238.0, 439.0, 885.0, 2101.0, 5518.0, 19177.0, 93377.0, 551613.0, 306183.0, 50048.0, 11862.0, 3650.0, 1455.0, 685.0, 344.0, 188.0, 116.0, 68.0, 43.0, 43.0, 34.0, 15.0, 8.0, 15.0, 3.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.33984375, -6.13409423828125, -5.9283447265625, -5.72259521484375, -5.516845703125, -5.31109619140625, -5.1053466796875, -4.89959716796875, -4.69384765625, -4.48809814453125, -4.2823486328125, -4.07659912109375, -3.870849609375, -3.66510009765625, -3.4593505859375, -3.25360107421875, -3.0478515625, -2.84210205078125, -2.6363525390625, -2.43060302734375, -2.224853515625, -2.01910400390625, -1.8133544921875, -1.60760498046875, -1.40185546875, -1.19610595703125, -0.9903564453125, -0.78460693359375, -0.578857421875, -0.37310791015625, -0.1673583984375, 0.03839111328125, 0.244140625, 0.44989013671875, 0.6556396484375, 0.86138916015625, 1.067138671875, 1.27288818359375, 1.4786376953125, 1.68438720703125, 1.89013671875, 2.09588623046875, 2.3016357421875, 2.50738525390625, 2.713134765625, 2.91888427734375, 3.1246337890625, 3.33038330078125, 3.5361328125, 3.74188232421875, 3.9476318359375, 4.15338134765625, 4.359130859375, 4.56488037109375, 4.7706298828125, 4.97637939453125, 5.18212890625, 5.38787841796875, 5.5936279296875, 5.79937744140625, 6.005126953125, 6.21087646484375, 6.4166259765625, 6.62237548828125, 6.828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 9.0, 11.0, 13.0, 16.0, 19.0, 17.0, 26.0, 25.0, 32.0, 31.0, 55.0, 50.0, 62.0, 50.0, 44.0, 59.0, 53.0, 48.0, 46.0, 55.0, 42.0, 41.0, 34.0, 35.0, 29.0, 20.0, 12.0, 18.0, 13.0, 4.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.1458740234375, -7.838623046875, -7.5313720703125, -7.22412109375, -6.9168701171875, -6.609619140625, -6.3023681640625, -5.9951171875, -5.6878662109375, -5.380615234375, -5.0733642578125, -4.76611328125, -4.4588623046875, -4.151611328125, -3.8443603515625, -3.537109375, -3.2298583984375, -2.922607421875, -2.6153564453125, -2.30810546875, -2.0008544921875, -1.693603515625, -1.3863525390625, -1.0791015625, -0.7718505859375, -0.464599609375, -0.1573486328125, 0.14990234375, 0.4571533203125, 0.764404296875, 1.0716552734375, 1.37890625, 1.6861572265625, 1.993408203125, 2.3006591796875, 2.60791015625, 2.9151611328125, 3.222412109375, 3.5296630859375, 3.8369140625, 4.1441650390625, 4.451416015625, 4.7586669921875, 5.06591796875, 5.3731689453125, 5.680419921875, 5.9876708984375, 6.294921875, 6.6021728515625, 6.909423828125, 7.2166748046875, 7.52392578125, 7.8311767578125, 8.138427734375, 8.4456787109375, 8.7529296875, 9.0601806640625, 9.367431640625, 9.6746826171875, 9.98193359375, 10.2891845703125, 10.596435546875, 10.9036865234375, 11.2109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 15.0, 35.0, 66.0, 127.0, 273.0, 677.0, 3172.0, 39592.0, 972174.0, 28585.0, 2668.0, 651.0, 266.0, 95.0, 52.0, 30.0, 24.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.880859375, -7.55859375, -7.236328125, -6.9140625, -6.591796875, -6.26953125, -5.947265625, -5.625, -5.302734375, -4.98046875, -4.658203125, -4.3359375, -4.013671875, -3.69140625, -3.369140625, -3.046875, -2.724609375, -2.40234375, -2.080078125, -1.7578125, -1.435546875, -1.11328125, -0.791015625, -0.46875, -0.146484375, 0.17578125, 0.498046875, 0.8203125, 1.142578125, 1.46484375, 1.787109375, 2.109375, 2.431640625, 2.75390625, 3.076171875, 3.3984375, 3.720703125, 4.04296875, 4.365234375, 4.6875, 5.009765625, 5.33203125, 5.654296875, 5.9765625, 6.298828125, 6.62109375, 6.943359375, 7.265625, 7.587890625, 7.91015625, 8.232421875, 8.5546875, 8.876953125, 9.19921875, 9.521484375, 9.84375, 10.166015625, 10.48828125, 10.810546875, 11.1328125, 11.455078125, 11.77734375, 12.099609375, 12.421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 9.0, 23.0, 45.0, 111.0, 252.0, 284.0, 143.0, 57.0, 31.0, 21.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001247406005859375, -0.0012013912200927734, -0.0011553764343261719, -0.0011093616485595703, -0.0010633468627929688, -0.0010173320770263672, -0.0009713172912597656, -0.0009253025054931641, -0.0008792877197265625, -0.0008332729339599609, -0.0007872581481933594, -0.0007412433624267578, -0.0006952285766601562, -0.0006492137908935547, -0.0006031990051269531, -0.0005571842193603516, -0.00051116943359375, -0.00046515464782714844, -0.0004191398620605469, -0.0003731250762939453, -0.00032711029052734375, -0.0002810955047607422, -0.00023508071899414062, -0.00018906593322753906, -0.0001430511474609375, -9.703636169433594e-05, -5.1021575927734375e-05, -5.0067901611328125e-06, 4.100799560546875e-05, 8.702278137207031e-05, 0.00013303756713867188, 0.00017905235290527344, 0.000225067138671875, 0.00027108192443847656, 0.0003170967102050781, 0.0003631114959716797, 0.00040912628173828125, 0.0004551410675048828, 0.0005011558532714844, 0.0005471706390380859, 0.0005931854248046875, 0.0006392002105712891, 0.0006852149963378906, 0.0007312297821044922, 0.0007772445678710938, 0.0008232593536376953, 0.0008692741394042969, 0.0009152889251708984, 0.0009613037109375, 0.0010073184967041016, 0.0010533332824707031, 0.0010993480682373047, 0.0011453628540039062, 0.0011913776397705078, 0.0012373924255371094, 0.001283407211303711, 0.0013294219970703125, 0.001375436782836914, 0.0014214515686035156, 0.0014674663543701172, 0.0015134811401367188, 0.0015594959259033203, 0.0016055107116699219, 0.0016515254974365234, 0.001697540283203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 1.0, 9.0, 9.0, 13.0, 16.0, 14.0, 28.0, 49.0, 63.0, 93.0, 188.0, 359.0, 817.0, 1945.0, 5804.0, 30985.0, 829497.0, 160679.0, 12253.0, 3240.0, 1259.0, 547.0, 283.0, 157.0, 87.0, 55.0, 31.0, 25.0, 11.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0543212890625, -7.835205078125, -7.6160888671875, -7.39697265625, -7.1778564453125, -6.958740234375, -6.7396240234375, -6.5205078125, -6.3013916015625, -6.082275390625, -5.8631591796875, -5.64404296875, -5.4249267578125, -5.205810546875, -4.9866943359375, -4.767578125, -4.5484619140625, -4.329345703125, -4.1102294921875, -3.89111328125, -3.6719970703125, -3.452880859375, -3.2337646484375, -3.0146484375, -2.7955322265625, -2.576416015625, -2.3572998046875, -2.13818359375, -1.9190673828125, -1.699951171875, -1.4808349609375, -1.26171875, -1.0426025390625, -0.823486328125, -0.6043701171875, -0.38525390625, -0.1661376953125, 0.052978515625, 0.2720947265625, 0.4912109375, 0.7103271484375, 0.929443359375, 1.1485595703125, 1.36767578125, 1.5867919921875, 1.805908203125, 2.0250244140625, 2.244140625, 2.4632568359375, 2.682373046875, 2.9014892578125, 3.12060546875, 3.3397216796875, 3.558837890625, 3.7779541015625, 3.9970703125, 4.2161865234375, 4.435302734375, 4.6544189453125, 4.87353515625, 5.0926513671875, 5.311767578125, 5.5308837890625, 5.75]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 6.0, 17.0, 22.0, 38.0, 56.0, 101.0, 129.0, 148.0, 138.0, 132.0, 67.0, 31.0, 21.0, 17.0, 15.0, 14.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.8836669921875, -5.685302734375, -5.4869384765625, -5.28857421875, -5.0902099609375, -4.891845703125, -4.6934814453125, -4.4951171875, -4.2967529296875, -4.098388671875, -3.9000244140625, -3.70166015625, -3.5032958984375, -3.304931640625, -3.1065673828125, -2.908203125, -2.7098388671875, -2.511474609375, -2.3131103515625, -2.11474609375, -1.9163818359375, -1.718017578125, -1.5196533203125, -1.3212890625, -1.1229248046875, -0.924560546875, -0.7261962890625, -0.52783203125, -0.3294677734375, -0.131103515625, 0.0672607421875, 0.265625, 0.4639892578125, 0.662353515625, 0.8607177734375, 1.05908203125, 1.2574462890625, 1.455810546875, 1.6541748046875, 1.8525390625, 2.0509033203125, 2.249267578125, 2.4476318359375, 2.64599609375, 2.8443603515625, 3.042724609375, 3.2410888671875, 3.439453125, 3.6378173828125, 3.836181640625, 4.0345458984375, 4.23291015625, 4.4312744140625, 4.629638671875, 4.8280029296875, 5.0263671875, 5.2247314453125, 5.423095703125, 5.6214599609375, 5.81982421875, 6.0181884765625, 6.216552734375, 6.4149169921875, 6.61328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 17.0, 18.0, 53.0, 60.0, 98.0, 119.0, 151.0, 144.0, 118.0, 73.0, 61.0, 30.0, 16.0, 11.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.47226333618164, -26.52532958984375, -24.578393936157227, -22.631458282470703, -20.684524536132812, -18.737590789794922, -16.7906551361084, -14.843720436096191, -12.896785736083984, -10.949851036071777, -9.00291633605957, -7.055981636047363, -5.109046936035156, -3.162112236022949, -1.2151775360107422, 0.7317571640014648, 2.678691864013672, 4.625626564025879, 6.572561264038086, 8.519495964050293, 10.4664306640625, 12.413365364074707, 14.360300064086914, 16.307235717773438, 18.254169464111328, 20.20110321044922, 22.148038864135742, 24.094974517822266, 26.041908264160156, 27.988842010498047, 29.93577766418457, 31.882713317871094, 33.82964324951172, 35.77657699584961, 37.7235107421875, 39.670448303222656, 41.61738204956055, 43.56431579589844, 45.511253356933594, 47.458187103271484, 49.405120849609375, 51.352054595947266, 53.298988342285156, 55.24592590332031, 57.1928596496582, 59.139793395996094, 61.08673095703125, 63.03366470336914, 64.98059844970703, 66.92753601074219, 68.87446594238281, 70.82140350341797, 72.76834106445312, 74.71527099609375, 76.6622085571289, 78.60913848876953, 80.55607604980469, 82.50301361083984, 84.44994354248047, 86.39688110351562, 88.34381103515625, 90.2907485961914, 92.23768615722656, 94.18461608886719, 96.13155364990234]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 5.0, 10.0, 12.0, 20.0, 29.0, 25.0, 30.0, 24.0, 57.0, 61.0, 65.0, 88.0, 76.0, 86.0, 82.0, 72.0, 39.0, 49.0, 45.0, 22.0, 24.0, 21.0, 13.0, 13.0, 7.0, 10.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.255859375, -76.07733154296875, -73.89879608154297, -71.72026062011719, -69.54173278808594, -67.36320495605469, -65.1846694946289, -63.00613784790039, -60.827606201171875, -58.64907455444336, -56.470542907714844, -54.29201126098633, -52.11347961425781, -49.9349479675293, -47.75641632080078, -45.577884674072266, -43.39935302734375, -41.220821380615234, -39.04228973388672, -36.8637580871582, -34.68522644042969, -32.50669479370117, -30.328163146972656, -28.14963150024414, -25.971099853515625, -23.79256820678711, -21.614036560058594, -19.435504913330078, -17.256973266601562, -15.078441619873047, -12.899909973144531, -10.721378326416016, -8.5428466796875, -6.364315032958984, -4.185783386230469, -2.007251739501953, 0.1712799072265625, 2.349811553955078, 4.528343200683594, 6.706874847412109, 8.885406494140625, 11.06393814086914, 13.242469787597656, 15.421001434326172, 17.599533081054688, 19.778064727783203, 21.95659637451172, 24.135128021240234, 26.31365966796875, 28.492191314697266, 30.67072296142578, 32.8492546081543, 35.02778625488281, 37.20631790161133, 39.384849548339844, 41.56338119506836, 43.741912841796875, 45.92044448852539, 48.098976135253906, 50.27750778198242, 52.45603942871094, 54.63457107543945, 56.81310272216797, 58.991634368896484, 61.170166015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 11.0, 3.0, 17.0, 28.0, 20.0, 36.0, 49.0, 76.0, 118.0, 244.0, 421.0, 814.0, 1747.0, 4674.0, 17104.0, 3677397.0, 467188.0, 16345.0, 4448.0, 1730.0, 844.0, 385.0, 200.0, 127.0, 84.0, 58.0, 27.0, 27.0, 12.0, 13.0, 7.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.2520751953125, -6.972900390625, -6.6937255859375, -6.41455078125, -6.1353759765625, -5.856201171875, -5.5770263671875, -5.2978515625, -5.0186767578125, -4.739501953125, -4.4603271484375, -4.18115234375, -3.9019775390625, -3.622802734375, -3.3436279296875, -3.064453125, -2.7852783203125, -2.506103515625, -2.2269287109375, -1.94775390625, -1.6685791015625, -1.389404296875, -1.1102294921875, -0.8310546875, -0.5518798828125, -0.272705078125, 0.0064697265625, 0.28564453125, 0.5648193359375, 0.843994140625, 1.1231689453125, 1.40234375, 1.6815185546875, 1.960693359375, 2.2398681640625, 2.51904296875, 2.7982177734375, 3.077392578125, 3.3565673828125, 3.6357421875, 3.9149169921875, 4.194091796875, 4.4732666015625, 4.75244140625, 5.0316162109375, 5.310791015625, 5.5899658203125, 5.869140625, 6.1483154296875, 6.427490234375, 6.7066650390625, 6.98583984375, 7.2650146484375, 7.544189453125, 7.8233642578125, 8.1025390625, 8.3817138671875, 8.660888671875, 8.9400634765625, 9.21923828125, 9.4984130859375, 9.777587890625, 10.0567626953125, 10.3359375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 8.0, 13.0, 23.0, 20.0, 36.0, 65.0, 80.0, 84.0, 100.0, 108.0, 98.0, 117.0, 61.0, 44.0, 32.0, 20.0, 20.0, 14.0, 12.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96875, -2.860198974609375, -2.75164794921875, -2.643096923828125, -2.5345458984375, -2.425994873046875, -2.31744384765625, -2.208892822265625, -2.100341796875, -1.991790771484375, -1.88323974609375, -1.774688720703125, -1.6661376953125, -1.557586669921875, -1.44903564453125, -1.340484619140625, -1.23193359375, -1.123382568359375, -1.01483154296875, -0.906280517578125, -0.7977294921875, -0.689178466796875, -0.58062744140625, -0.472076416015625, -0.363525390625, -0.254974365234375, -0.14642333984375, -0.037872314453125, 0.0706787109375, 0.179229736328125, 0.28778076171875, 0.396331787109375, 0.5048828125, 0.613433837890625, 0.72198486328125, 0.830535888671875, 0.9390869140625, 1.047637939453125, 1.15618896484375, 1.264739990234375, 1.373291015625, 1.481842041015625, 1.59039306640625, 1.698944091796875, 1.8074951171875, 1.916046142578125, 2.02459716796875, 2.133148193359375, 2.24169921875, 2.350250244140625, 2.45880126953125, 2.567352294921875, 2.6759033203125, 2.784454345703125, 2.89300537109375, 3.001556396484375, 3.110107421875, 3.218658447265625, 3.32720947265625, 3.435760498046875, 3.5443115234375, 3.652862548828125, 3.76141357421875, 3.869964599609375, 3.978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 4.0, 7.0, 15.0, 21.0, 23.0, 34.0, 33.0, 46.0, 76.0, 124.0, 241.0, 447.0, 933.0, 2490.0, 14842.0, 4123935.0, 44556.0, 3873.0, 1320.0, 553.0, 235.0, 144.0, 90.0, 44.0, 47.0, 35.0, 26.0, 14.0, 10.0, 14.0, 12.0, 7.0, 2.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.26513671875, -21.5146484375, -20.76416015625, -20.013671875, -19.26318359375, -18.5126953125, -17.76220703125, -17.01171875, -16.26123046875, -15.5107421875, -14.76025390625, -14.009765625, -13.25927734375, -12.5087890625, -11.75830078125, -11.0078125, -10.25732421875, -9.5068359375, -8.75634765625, -8.005859375, -7.25537109375, -6.5048828125, -5.75439453125, -5.00390625, -4.25341796875, -3.5029296875, -2.75244140625, -2.001953125, -1.25146484375, -0.5009765625, 0.24951171875, 1.0, 1.75048828125, 2.5009765625, 3.25146484375, 4.001953125, 4.75244140625, 5.5029296875, 6.25341796875, 7.00390625, 7.75439453125, 8.5048828125, 9.25537109375, 10.005859375, 10.75634765625, 11.5068359375, 12.25732421875, 13.0078125, 13.75830078125, 14.5087890625, 15.25927734375, 16.009765625, 16.76025390625, 17.5107421875, 18.26123046875, 19.01171875, 19.76220703125, 20.5126953125, 21.26318359375, 22.013671875, 22.76416015625, 23.5146484375, 24.26513671875, 25.015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 26.0, 42.0, 144.0, 3498.0, 253.0, 48.0, 22.0, 6.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.85882568359375, -6.6199951171875, -6.38116455078125, -6.142333984375, -5.90350341796875, -5.6646728515625, -5.42584228515625, -5.18701171875, -4.94818115234375, -4.7093505859375, -4.47052001953125, -4.231689453125, -3.99285888671875, -3.7540283203125, -3.51519775390625, -3.2763671875, -3.03753662109375, -2.7987060546875, -2.55987548828125, -2.321044921875, -2.08221435546875, -1.8433837890625, -1.60455322265625, -1.36572265625, -1.12689208984375, -0.8880615234375, -0.64923095703125, -0.410400390625, -0.17156982421875, 0.0672607421875, 0.30609130859375, 0.544921875, 0.78375244140625, 1.0225830078125, 1.26141357421875, 1.500244140625, 1.73907470703125, 1.9779052734375, 2.21673583984375, 2.45556640625, 2.69439697265625, 2.9332275390625, 3.17205810546875, 3.410888671875, 3.64971923828125, 3.8885498046875, 4.12738037109375, 4.3662109375, 4.60504150390625, 4.8438720703125, 5.08270263671875, 5.321533203125, 5.56036376953125, 5.7991943359375, 6.03802490234375, 6.27685546875, 6.51568603515625, 6.7545166015625, 6.99334716796875, 7.232177734375, 7.47100830078125, 7.7098388671875, 7.94866943359375, 8.1875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 9.0, 7.0, 19.0, 22.0, 48.0, 63.0, 139.0, 175.0, 183.0, 121.0, 109.0, 53.0, 26.0, 15.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.48661422729492, -37.54632568359375, -36.60603713989258, -35.66575241088867, -34.7254638671875, -33.78517532348633, -32.844886779785156, -31.904598236083984, -30.964311599731445, -30.024023056030273, -29.083736419677734, -28.143447875976562, -27.20315933227539, -26.26287269592285, -25.32258415222168, -24.38229751586914, -23.44200897216797, -22.501720428466797, -21.561433792114258, -20.621145248413086, -19.680858612060547, -18.740570068359375, -17.800281524658203, -16.85999298095703, -15.919706344604492, -14.979418754577637, -14.039131164550781, -13.09884262084961, -12.158555030822754, -11.218267440795898, -10.277978897094727, -9.337691307067871, -8.397401809692383, -7.457114219665527, -6.516826152801514, -5.5765380859375, -4.6362504959106445, -3.695962905883789, -2.7556748390197754, -1.8153867721557617, -0.8750991821289062, 0.06518864631652832, 1.005476474761963, 1.9457643032073975, 2.886052131652832, 3.8263397216796875, 4.766627788543701, 5.706915855407715, 6.64720344543457, 7.587491035461426, 8.527778625488281, 9.468067169189453, 10.408354759216309, 11.348642349243164, 12.288930892944336, 13.229218482971191, 14.169506072998047, 15.109793663024902, 16.050081253051758, 16.99036979675293, 17.93065643310547, 18.87094497680664, 19.811233520507812, 20.751522064208984, 21.691808700561523]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 12.0, 10.0, 27.0, 19.0, 23.0, 28.0, 41.0, 43.0, 57.0, 50.0, 54.0, 36.0, 62.0, 62.0, 51.0, 58.0, 46.0, 51.0, 57.0, 41.0, 28.0, 20.0, 21.0, 20.0, 18.0, 14.0, 9.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.763521194458008, -19.256900787353516, -18.750280380249023, -18.24365997314453, -17.73703956604004, -17.230419158935547, -16.723798751831055, -16.217178344726562, -15.71055793762207, -15.203937530517578, -14.697317123413086, -14.190696716308594, -13.684076309204102, -13.17745590209961, -12.670835494995117, -12.164215087890625, -11.657593727111816, -11.150973320007324, -10.644352912902832, -10.13773250579834, -9.631112098693848, -9.124491691589355, -8.617870330810547, -8.111249923706055, -7.604629993438721, -7.0980095863342285, -6.591389179229736, -6.084768295288086, -5.578147888183594, -5.071527481079102, -4.564907073974609, -4.058286666870117, -3.5516672134399414, -3.045046806335449, -2.538426399230957, -2.0318057537078857, -1.5251853466033936, -1.0185649394989014, -0.5119442939758301, -0.005323886871337891, 0.5012965202331543, 1.0079169273376465, 1.5145374536514282, 2.02115797996521, 2.527778387069702, 3.0343987941741943, 3.5410194396972656, 4.047639846801758, 4.55426025390625, 5.060880661010742, 5.567501068115234, 6.074121475219727, 6.580741882324219, 7.087362289428711, 7.593983173370361, 8.100603103637695, 8.607223510742188, 9.11384391784668, 9.620464324951172, 10.127084732055664, 10.633705139160156, 11.140325546264648, 11.64694595336914, 12.153566360473633, 12.660187721252441]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 12.0, 19.0, 23.0, 37.0, 40.0, 84.0, 137.0, 247.0, 543.0, 1012.0, 2379.0, 6516.0, 21460.0, 91978.0, 454655.0, 369855.0, 72226.0, 17711.0, 5567.0, 2106.0, 922.0, 449.0, 247.0, 138.0, 87.0, 32.0, 24.0, 18.0, 11.0, 9.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25, -6.0089111328125, -5.767822265625, -5.5267333984375, -5.28564453125, -5.0445556640625, -4.803466796875, -4.5623779296875, -4.3212890625, -4.0802001953125, -3.839111328125, -3.5980224609375, -3.35693359375, -3.1158447265625, -2.874755859375, -2.6336669921875, -2.392578125, -2.1514892578125, -1.910400390625, -1.6693115234375, -1.42822265625, -1.1871337890625, -0.946044921875, -0.7049560546875, -0.4638671875, -0.2227783203125, 0.018310546875, 0.2593994140625, 0.50048828125, 0.7415771484375, 0.982666015625, 1.2237548828125, 1.46484375, 1.7059326171875, 1.947021484375, 2.1881103515625, 2.42919921875, 2.6702880859375, 2.911376953125, 3.1524658203125, 3.3935546875, 3.6346435546875, 3.875732421875, 4.1168212890625, 4.35791015625, 4.5989990234375, 4.840087890625, 5.0811767578125, 5.322265625, 5.5633544921875, 5.804443359375, 6.0455322265625, 6.28662109375, 6.5277099609375, 6.768798828125, 7.0098876953125, 7.2509765625, 7.4920654296875, 7.733154296875, 7.9742431640625, 8.21533203125, 8.4564208984375, 8.697509765625, 8.9385986328125, 9.1796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 13.0, 14.0, 19.0, 23.0, 29.0, 34.0, 38.0, 55.0, 53.0, 64.0, 72.0, 86.0, 74.0, 78.0, 68.0, 52.0, 45.0, 30.0, 39.0, 25.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.850555419921875, -2.74798583984375, -2.645416259765625, -2.5428466796875, -2.440277099609375, -2.33770751953125, -2.235137939453125, -2.132568359375, -2.029998779296875, -1.92742919921875, -1.824859619140625, -1.7222900390625, -1.619720458984375, -1.51715087890625, -1.414581298828125, -1.31201171875, -1.209442138671875, -1.10687255859375, -1.004302978515625, -0.9017333984375, -0.799163818359375, -0.69659423828125, -0.594024658203125, -0.491455078125, -0.388885498046875, -0.28631591796875, -0.183746337890625, -0.0811767578125, 0.021392822265625, 0.12396240234375, 0.226531982421875, 0.3291015625, 0.431671142578125, 0.53424072265625, 0.636810302734375, 0.7393798828125, 0.841949462890625, 0.94451904296875, 1.047088623046875, 1.149658203125, 1.252227783203125, 1.35479736328125, 1.457366943359375, 1.5599365234375, 1.662506103515625, 1.76507568359375, 1.867645263671875, 1.97021484375, 2.072784423828125, 2.17535400390625, 2.277923583984375, 2.3804931640625, 2.483062744140625, 2.58563232421875, 2.688201904296875, 2.790771484375, 2.893341064453125, 2.99591064453125, 3.098480224609375, 3.2010498046875, 3.303619384765625, 3.40618896484375, 3.508758544921875, 3.611328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 7.0, 18.0, 25.0, 39.0, 70.0, 156.0, 252.0, 673.0, 2140.0, 15117.0, 732073.0, 287307.0, 8046.0, 1540.0, 540.0, 230.0, 125.0, 78.0, 37.0, 26.0, 13.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.875, -21.209716796875, -20.54443359375, -19.879150390625, -19.2138671875, -18.548583984375, -17.88330078125, -17.218017578125, -16.552734375, -15.887451171875, -15.22216796875, -14.556884765625, -13.8916015625, -13.226318359375, -12.56103515625, -11.895751953125, -11.23046875, -10.565185546875, -9.89990234375, -9.234619140625, -8.5693359375, -7.904052734375, -7.23876953125, -6.573486328125, -5.908203125, -5.242919921875, -4.57763671875, -3.912353515625, -3.2470703125, -2.581787109375, -1.91650390625, -1.251220703125, -0.5859375, 0.079345703125, 0.74462890625, 1.409912109375, 2.0751953125, 2.740478515625, 3.40576171875, 4.071044921875, 4.736328125, 5.401611328125, 6.06689453125, 6.732177734375, 7.3974609375, 8.062744140625, 8.72802734375, 9.393310546875, 10.05859375, 10.723876953125, 11.38916015625, 12.054443359375, 12.7197265625, 13.385009765625, 14.05029296875, 14.715576171875, 15.380859375, 16.046142578125, 16.71142578125, 17.376708984375, 18.0419921875, 18.707275390625, 19.37255859375, 20.037841796875, 20.703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 5.0, 10.0, 13.0, 13.0, 27.0, 49.0, 60.0, 98.0, 110.0, 98.0, 100.0, 98.0, 99.0, 77.0, 49.0, 34.0, 26.0, 15.0, 8.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.4287109375, -23.669921875, -22.9111328125, -22.15234375, -21.3935546875, -20.634765625, -19.8759765625, -19.1171875, -18.3583984375, -17.599609375, -16.8408203125, -16.08203125, -15.3232421875, -14.564453125, -13.8056640625, -13.046875, -12.2880859375, -11.529296875, -10.7705078125, -10.01171875, -9.2529296875, -8.494140625, -7.7353515625, -6.9765625, -6.2177734375, -5.458984375, -4.7001953125, -3.94140625, -3.1826171875, -2.423828125, -1.6650390625, -0.90625, -0.1474609375, 0.611328125, 1.3701171875, 2.12890625, 2.8876953125, 3.646484375, 4.4052734375, 5.1640625, 5.9228515625, 6.681640625, 7.4404296875, 8.19921875, 8.9580078125, 9.716796875, 10.4755859375, 11.234375, 11.9931640625, 12.751953125, 13.5107421875, 14.26953125, 15.0283203125, 15.787109375, 16.5458984375, 17.3046875, 18.0634765625, 18.822265625, 19.5810546875, 20.33984375, 21.0986328125, 21.857421875, 22.6162109375, 23.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 12.0, 9.0, 19.0, 31.0, 51.0, 69.0, 142.0, 269.0, 586.0, 1461.0, 4445.0, 20054.0, 198979.0, 736943.0, 70577.0, 10270.0, 2705.0, 988.0, 433.0, 192.0, 117.0, 65.0, 42.0, 20.0, 18.0, 8.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.469207763671875, -3.34661865234375, -3.224029541015625, -3.1014404296875, -2.978851318359375, -2.85626220703125, -2.733673095703125, -2.611083984375, -2.488494873046875, -2.36590576171875, -2.243316650390625, -2.1207275390625, -1.998138427734375, -1.87554931640625, -1.752960205078125, -1.63037109375, -1.507781982421875, -1.38519287109375, -1.262603759765625, -1.1400146484375, -1.017425537109375, -0.89483642578125, -0.772247314453125, -0.649658203125, -0.527069091796875, -0.40447998046875, -0.281890869140625, -0.1593017578125, -0.036712646484375, 0.08587646484375, 0.208465576171875, 0.3310546875, 0.453643798828125, 0.57623291015625, 0.698822021484375, 0.8214111328125, 0.944000244140625, 1.06658935546875, 1.189178466796875, 1.311767578125, 1.434356689453125, 1.55694580078125, 1.679534912109375, 1.8021240234375, 1.924713134765625, 2.04730224609375, 2.169891357421875, 2.29248046875, 2.415069580078125, 2.53765869140625, 2.660247802734375, 2.7828369140625, 2.905426025390625, 3.02801513671875, 3.150604248046875, 3.273193359375, 3.395782470703125, 3.51837158203125, 3.640960693359375, 3.7635498046875, 3.886138916015625, 4.00872802734375, 4.131317138671875, 4.25390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 2.0, 7.0, 9.0, 6.0, 14.0, 25.0, 25.0, 33.0, 53.0, 90.0, 140.0, 160.0, 126.0, 104.0, 57.0, 39.0, 37.0, 25.0, 12.0, 11.0, 3.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006809234619140625, -0.0006562992930412292, -0.000631675124168396, -0.0006070509552955627, -0.0005824267864227295, -0.0005578026175498962, -0.000533178448677063, -0.0005085542798042297, -0.0004839301109313965, -0.00045930594205856323, -0.00043468177318573, -0.00041005760431289673, -0.0003854334354400635, -0.0003608092665672302, -0.00033618509769439697, -0.0003115609288215637, -0.00028693675994873047, -0.0002623125910758972, -0.00023768842220306396, -0.0002130642533302307, -0.00018844008445739746, -0.0001638159155845642, -0.00013919174671173096, -0.0001145675778388977, -8.994340896606445e-05, -6.53192400932312e-05, -4.069507122039795e-05, -1.6070902347564697e-05, 8.553266525268555e-06, 3.317743539810181e-05, 5.780160427093506e-05, 8.242577314376831e-05, 0.00010704994201660156, 0.00013167411088943481, 0.00015629827976226807, 0.00018092244863510132, 0.00020554661750793457, 0.00023017078638076782, 0.0002547949552536011, 0.0002794191241264343, 0.0003040432929992676, 0.00032866746187210083, 0.0003532916307449341, 0.00037791579961776733, 0.0004025399684906006, 0.00042716413736343384, 0.0004517883062362671, 0.00047641247510910034, 0.0005010366439819336, 0.0005256608128547668, 0.0005502849817276001, 0.0005749091506004333, 0.0005995333194732666, 0.0006241574883460999, 0.0006487816572189331, 0.0006734058260917664, 0.0006980299949645996, 0.0007226541638374329, 0.0007472783327102661, 0.0007719025015830994, 0.0007965266704559326, 0.0008211508393287659, 0.0008457750082015991, 0.0008703991770744324, 0.0008950233459472656]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 10.0, 7.0, 10.0, 17.0, 20.0, 38.0, 63.0, 77.0, 135.0, 218.0, 451.0, 787.0, 2104.0, 6673.0, 29826.0, 263574.0, 652906.0, 73096.0, 12510.0, 3459.0, 1271.0, 551.0, 277.0, 181.0, 105.0, 47.0, 44.0, 21.0, 24.0, 17.0, 11.0, 10.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.21875, -4.1112060546875, -4.003662109375, -3.8961181640625, -3.78857421875, -3.6810302734375, -3.573486328125, -3.4659423828125, -3.3583984375, -3.2508544921875, -3.143310546875, -3.0357666015625, -2.92822265625, -2.8206787109375, -2.713134765625, -2.6055908203125, -2.498046875, -2.3905029296875, -2.282958984375, -2.1754150390625, -2.06787109375, -1.9603271484375, -1.852783203125, -1.7452392578125, -1.6376953125, -1.5301513671875, -1.422607421875, -1.3150634765625, -1.20751953125, -1.0999755859375, -0.992431640625, -0.8848876953125, -0.77734375, -0.6697998046875, -0.562255859375, -0.4547119140625, -0.34716796875, -0.2396240234375, -0.132080078125, -0.0245361328125, 0.0830078125, 0.1905517578125, 0.298095703125, 0.4056396484375, 0.51318359375, 0.6207275390625, 0.728271484375, 0.8358154296875, 0.943359375, 1.0509033203125, 1.158447265625, 1.2659912109375, 1.37353515625, 1.4810791015625, 1.588623046875, 1.6961669921875, 1.8037109375, 1.9112548828125, 2.018798828125, 2.1263427734375, 2.23388671875, 2.3414306640625, 2.448974609375, 2.5565185546875, 2.6640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 20.0, 27.0, 26.0, 32.0, 50.0, 55.0, 55.0, 83.0, 73.0, 84.0, 72.0, 79.0, 56.0, 48.0, 34.0, 35.0, 37.0, 21.0, 20.0, 11.0, 16.0, 5.0, 8.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.8328857421875, -2.739990234375, -2.6470947265625, -2.55419921875, -2.4613037109375, -2.368408203125, -2.2755126953125, -2.1826171875, -2.0897216796875, -1.996826171875, -1.9039306640625, -1.81103515625, -1.7181396484375, -1.625244140625, -1.5323486328125, -1.439453125, -1.3465576171875, -1.253662109375, -1.1607666015625, -1.06787109375, -0.9749755859375, -0.882080078125, -0.7891845703125, -0.6962890625, -0.6033935546875, -0.510498046875, -0.4176025390625, -0.32470703125, -0.2318115234375, -0.138916015625, -0.0460205078125, 0.046875, 0.1397705078125, 0.232666015625, 0.3255615234375, 0.41845703125, 0.5113525390625, 0.604248046875, 0.6971435546875, 0.7900390625, 0.8829345703125, 0.975830078125, 1.0687255859375, 1.16162109375, 1.2545166015625, 1.347412109375, 1.4403076171875, 1.533203125, 1.6260986328125, 1.718994140625, 1.8118896484375, 1.90478515625, 1.9976806640625, 2.090576171875, 2.1834716796875, 2.2763671875, 2.3692626953125, 2.462158203125, 2.5550537109375, 2.64794921875, 2.7408447265625, 2.833740234375, 2.9266357421875, 3.01953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 12.0, 19.0, 23.0, 37.0, 54.0, 77.0, 111.0, 119.0, 123.0, 98.0, 104.0, 64.0, 44.0, 29.0, 21.0, 13.0, 13.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.66254425048828, -61.568138122558594, -59.473731994628906, -57.37932586669922, -55.28491973876953, -53.190513610839844, -51.09611129760742, -49.001705169677734, -46.90729904174805, -44.81289291381836, -42.71848678588867, -40.624080657958984, -38.52967834472656, -36.435272216796875, -34.34086608886719, -32.2464599609375, -30.152053833007812, -28.057647705078125, -25.963241577148438, -23.868837356567383, -21.774431228637695, -19.680025100708008, -17.585620880126953, -15.491214752197266, -13.396808624267578, -11.30240249633789, -9.20799732208252, -7.11359167098999, -5.019186019897461, -2.9247798919677734, -0.8303747177124023, 1.2640304565429688, 3.3584442138671875, 5.452849864959717, 7.547255516052246, 9.641660690307617, 11.736066818237305, 13.830472946166992, 15.924878120422363, 18.019283294677734, 20.113689422607422, 22.20809555053711, 24.302501678466797, 26.39690589904785, 28.49131202697754, 30.585718154907227, 32.68012237548828, 34.77452850341797, 36.868934631347656, 38.963340759277344, 41.05774688720703, 43.15215301513672, 45.246559143066406, 47.340965270996094, 49.435367584228516, 51.5297737121582, 53.62417984008789, 55.71858596801758, 57.812992095947266, 59.90739822387695, 62.001800537109375, 64.09620666503906, 66.19061279296875, 68.28501892089844, 70.37942504882812]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 12.0, 12.0, 12.0, 18.0, 11.0, 15.0, 18.0, 21.0, 21.0, 28.0, 38.0, 25.0, 35.0, 46.0, 49.0, 57.0, 49.0, 56.0, 48.0, 43.0, 47.0, 45.0, 43.0, 42.0, 21.0, 25.0, 27.0, 29.0, 16.0, 19.0, 14.0, 10.0, 11.0, 5.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.69361114501953, -59.840736389160156, -57.98786163330078, -56.134986877441406, -54.282108306884766, -52.42923355102539, -50.576358795166016, -48.72348403930664, -46.87060546875, -45.017730712890625, -43.16485595703125, -41.311981201171875, -39.459102630615234, -37.60622787475586, -35.753353118896484, -33.90047836303711, -32.047603607177734, -30.19472885131836, -28.34185218811035, -26.488977432250977, -24.63610076904297, -22.783226013183594, -20.93035125732422, -19.077476501464844, -17.224599838256836, -15.371724128723145, -13.518848419189453, -11.665973663330078, -9.813097953796387, -7.960222244262695, -6.10734748840332, -4.254471778869629, -2.4015960693359375, -0.5487205982208252, 1.304154872894287, 3.1570301055908203, 5.009905815124512, 6.862781524658203, 8.715656280517578, 10.56853199005127, 12.421407699584961, 14.274283409118652, 16.127159118652344, 17.98003387451172, 19.832908630371094, 21.6857852935791, 23.538660049438477, 25.391536712646484, 27.24441146850586, 29.097286224365234, 30.950162887573242, 32.80303955078125, 34.655914306640625, 36.5087890625, 38.361663818359375, 40.21453857421875, 42.067413330078125, 43.9202880859375, 45.773162841796875, 47.62603759765625, 49.47891616821289, 51.331790924072266, 53.18466567993164, 55.037540435791016, 56.890419006347656]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 14.0, 9.0, 23.0, 25.0, 35.0, 37.0, 79.0, 141.0, 285.0, 631.0, 1663.0, 5177.0, 23568.0, 350871.0, 3745020.0, 52511.0, 9500.0, 2728.0, 1002.0, 432.0, 220.0, 109.0, 81.0, 45.0, 25.0, 19.0, 11.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.777099609375, -10.45263671875, -10.128173828125, -9.8037109375, -9.479248046875, -9.15478515625, -8.830322265625, -8.505859375, -8.181396484375, -7.85693359375, -7.532470703125, -7.2080078125, -6.883544921875, -6.55908203125, -6.234619140625, -5.91015625, -5.585693359375, -5.26123046875, -4.936767578125, -4.6123046875, -4.287841796875, -3.96337890625, -3.638916015625, -3.314453125, -2.989990234375, -2.66552734375, -2.341064453125, -2.0166015625, -1.692138671875, -1.36767578125, -1.043212890625, -0.71875, -0.394287109375, -0.06982421875, 0.254638671875, 0.5791015625, 0.903564453125, 1.22802734375, 1.552490234375, 1.876953125, 2.201416015625, 2.52587890625, 2.850341796875, 3.1748046875, 3.499267578125, 3.82373046875, 4.148193359375, 4.47265625, 4.797119140625, 5.12158203125, 5.446044921875, 5.7705078125, 6.094970703125, 6.41943359375, 6.743896484375, 7.068359375, 7.392822265625, 7.71728515625, 8.041748046875, 8.3662109375, 8.690673828125, 9.01513671875, 9.339599609375, 9.6640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 13.0, 14.0, 11.0, 21.0, 19.0, 31.0, 40.0, 41.0, 71.0, 73.0, 75.0, 67.0, 72.0, 54.0, 61.0, 44.0, 59.0, 40.0, 36.0, 29.0, 31.0, 9.0, 20.0, 8.0, 6.0, 10.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.82659912109375, -1.7410888671875, -1.65557861328125, -1.570068359375, -1.48455810546875, -1.3990478515625, -1.31353759765625, -1.22802734375, -1.14251708984375, -1.0570068359375, -0.97149658203125, -0.885986328125, -0.80047607421875, -0.7149658203125, -0.62945556640625, -0.5439453125, -0.45843505859375, -0.3729248046875, -0.28741455078125, -0.201904296875, -0.11639404296875, -0.0308837890625, 0.05462646484375, 0.14013671875, 0.22564697265625, 0.3111572265625, 0.39666748046875, 0.482177734375, 0.56768798828125, 0.6531982421875, 0.73870849609375, 0.82421875, 0.90972900390625, 0.9952392578125, 1.08074951171875, 1.166259765625, 1.25177001953125, 1.3372802734375, 1.42279052734375, 1.50830078125, 1.59381103515625, 1.6793212890625, 1.76483154296875, 1.850341796875, 1.93585205078125, 2.0213623046875, 2.10687255859375, 2.1923828125, 2.27789306640625, 2.3634033203125, 2.44891357421875, 2.534423828125, 2.61993408203125, 2.7054443359375, 2.79095458984375, 2.87646484375, 2.96197509765625, 3.0474853515625, 3.13299560546875, 3.218505859375, 3.30401611328125, 3.3895263671875, 3.47503662109375, 3.560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 16.0, 12.0, 39.0, 47.0, 92.0, 187.0, 352.0, 822.0, 2071.0, 6299.0, 27731.0, 290372.0, 3758649.0, 87092.0, 14182.0, 3829.0, 1319.0, 568.0, 251.0, 142.0, 73.0, 44.0, 22.0, 21.0, 7.0, 10.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.775634765625, -10.44189453125, -10.108154296875, -9.7744140625, -9.440673828125, -9.10693359375, -8.773193359375, -8.439453125, -8.105712890625, -7.77197265625, -7.438232421875, -7.1044921875, -6.770751953125, -6.43701171875, -6.103271484375, -5.76953125, -5.435791015625, -5.10205078125, -4.768310546875, -4.4345703125, -4.100830078125, -3.76708984375, -3.433349609375, -3.099609375, -2.765869140625, -2.43212890625, -2.098388671875, -1.7646484375, -1.430908203125, -1.09716796875, -0.763427734375, -0.4296875, -0.095947265625, 0.23779296875, 0.571533203125, 0.9052734375, 1.239013671875, 1.57275390625, 1.906494140625, 2.240234375, 2.573974609375, 2.90771484375, 3.241455078125, 3.5751953125, 3.908935546875, 4.24267578125, 4.576416015625, 4.91015625, 5.243896484375, 5.57763671875, 5.911376953125, 6.2451171875, 6.578857421875, 6.91259765625, 7.246337890625, 7.580078125, 7.913818359375, 8.24755859375, 8.581298828125, 8.9150390625, 9.248779296875, 9.58251953125, 9.916259765625, 10.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 8.0, 9.0, 8.0, 5.0, 15.0, 16.0, 26.0, 32.0, 40.0, 73.0, 181.0, 637.0, 1777.0, 698.0, 222.0, 102.0, 79.0, 35.0, 30.0, 22.0, 13.0, 10.0, 4.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.8203125, -11.49755859375, -11.1748046875, -10.85205078125, -10.529296875, -10.20654296875, -9.8837890625, -9.56103515625, -9.23828125, -8.91552734375, -8.5927734375, -8.27001953125, -7.947265625, -7.62451171875, -7.3017578125, -6.97900390625, -6.65625, -6.33349609375, -6.0107421875, -5.68798828125, -5.365234375, -5.04248046875, -4.7197265625, -4.39697265625, -4.07421875, -3.75146484375, -3.4287109375, -3.10595703125, -2.783203125, -2.46044921875, -2.1376953125, -1.81494140625, -1.4921875, -1.16943359375, -0.8466796875, -0.52392578125, -0.201171875, 0.12158203125, 0.4443359375, 0.76708984375, 1.08984375, 1.41259765625, 1.7353515625, 2.05810546875, 2.380859375, 2.70361328125, 3.0263671875, 3.34912109375, 3.671875, 3.99462890625, 4.3173828125, 4.64013671875, 4.962890625, 5.28564453125, 5.6083984375, 5.93115234375, 6.25390625, 6.57666015625, 6.8994140625, 7.22216796875, 7.544921875, 7.86767578125, 8.1904296875, 8.51318359375, 8.8359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 30.0, 81.0, 197.0, 300.0, 212.0, 96.0, 32.0, 21.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.21401977539062, -91.74302673339844, -88.27204132080078, -84.8010482788086, -81.33006286621094, -77.85906982421875, -74.38807678222656, -70.9170913696289, -67.44610595703125, -63.97511672973633, -60.504127502441406, -57.03313446044922, -53.56214904785156, -50.091156005859375, -46.62016677856445, -43.14917755126953, -39.678184509277344, -36.20719528198242, -32.7362060546875, -29.265214920043945, -25.794225692749023, -22.3232364654541, -18.852245330810547, -15.381256103515625, -11.910266876220703, -8.439277648925781, -4.968287467956543, -1.4972972869873047, 1.9736919403076172, 5.444681167602539, 8.915672302246094, 12.386661529541016, 15.857650756835938, 19.32863998413086, 22.79962921142578, 26.270620346069336, 29.741609573364258, 33.21260070800781, 36.683589935302734, 40.154579162597656, 43.62556838989258, 47.0965576171875, 50.56754684448242, 54.038536071777344, 57.50952911376953, 60.98051452636719, 64.45150756835938, 67.92250061035156, 71.39348602294922, 74.8644790649414, 78.33546447753906, 81.80645751953125, 85.2774429321289, 88.7484359741211, 92.21942138671875, 95.69041442871094, 99.16140747070312, 102.63240051269531, 106.10338592529297, 109.57437896728516, 113.04536437988281, 116.516357421875, 119.98735046386719, 123.45833587646484, 126.9293212890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 11.0, 16.0, 19.0, 30.0, 23.0, 30.0, 41.0, 41.0, 58.0, 57.0, 61.0, 58.0, 63.0, 59.0, 69.0, 58.0, 44.0, 64.0, 43.0, 36.0, 28.0, 19.0, 18.0, 9.0, 6.0, 7.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-61.09820556640625, -59.50714874267578, -57.91608810424805, -56.32503128051758, -54.733970642089844, -53.142913818359375, -51.551856994628906, -49.96080017089844, -48.3697395324707, -46.778682708740234, -45.1876220703125, -43.59656524658203, -42.00550842285156, -40.41444778442383, -38.82339096069336, -37.232330322265625, -35.641273498535156, -34.05021667480469, -32.45915603637695, -30.868099212646484, -29.277040481567383, -27.68598175048828, -26.094924926757812, -24.50386619567871, -22.91280746459961, -21.321748733520508, -19.730690002441406, -18.139633178710938, -16.548574447631836, -14.957515716552734, -13.36645793914795, -11.775400161743164, -10.184341430664062, -8.593282699584961, -7.002224922180176, -5.411166667938232, -3.820108413696289, -2.2290501594543457, -0.6379919052124023, 0.9530658721923828, 2.5441246032714844, 4.135182857513428, 5.726241111755371, 7.3172993659973145, 8.908357620239258, 10.49941635131836, 12.090474128723145, 13.68153190612793, 15.272590637207031, 16.863649368286133, 18.454708099365234, 20.045764923095703, 21.636823654174805, 23.227882385253906, 24.818939208984375, 26.409997940063477, 28.001056671142578, 29.59211540222168, 31.18317413330078, 32.77423095703125, 34.36528778076172, 35.95634841918945, 37.54740524291992, 39.138465881347656, 40.729522705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 10.0, 22.0, 20.0, 42.0, 67.0, 120.0, 231.0, 444.0, 886.0, 1977.0, 4788.0, 13314.0, 41276.0, 140151.0, 405813.0, 304824.0, 91087.0, 27507.0, 9486.0, 3560.0, 1479.0, 667.0, 322.0, 188.0, 107.0, 60.0, 35.0, 28.0, 7.0, 12.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.71649169921875, -5.5423583984375, -5.36822509765625, -5.194091796875, -5.01995849609375, -4.8458251953125, -4.67169189453125, -4.49755859375, -4.32342529296875, -4.1492919921875, -3.97515869140625, -3.801025390625, -3.62689208984375, -3.4527587890625, -3.27862548828125, -3.1044921875, -2.93035888671875, -2.7562255859375, -2.58209228515625, -2.407958984375, -2.23382568359375, -2.0596923828125, -1.88555908203125, -1.71142578125, -1.53729248046875, -1.3631591796875, -1.18902587890625, -1.014892578125, -0.84075927734375, -0.6666259765625, -0.49249267578125, -0.318359375, -0.14422607421875, 0.0299072265625, 0.20404052734375, 0.378173828125, 0.55230712890625, 0.7264404296875, 0.90057373046875, 1.07470703125, 1.24884033203125, 1.4229736328125, 1.59710693359375, 1.771240234375, 1.94537353515625, 2.1195068359375, 2.29364013671875, 2.4677734375, 2.64190673828125, 2.8160400390625, 2.99017333984375, 3.164306640625, 3.33843994140625, 3.5125732421875, 3.68670654296875, 3.86083984375, 4.03497314453125, 4.2091064453125, 4.38323974609375, 4.557373046875, 4.73150634765625, 4.9056396484375, 5.07977294921875, 5.25390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 11.0, 9.0, 19.0, 17.0, 22.0, 45.0, 35.0, 30.0, 41.0, 43.0, 54.0, 53.0, 58.0, 57.0, 67.0, 63.0, 48.0, 51.0, 38.0, 35.0, 30.0, 29.0, 35.0, 26.0, 7.0, 9.0, 10.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8853912353515625, -1.808868408203125, -1.7323455810546875, -1.65582275390625, -1.5792999267578125, -1.502777099609375, -1.4262542724609375, -1.3497314453125, -1.2732086181640625, -1.196685791015625, -1.1201629638671875, -1.04364013671875, -0.9671173095703125, -0.890594482421875, -0.8140716552734375, -0.737548828125, -0.6610260009765625, -0.584503173828125, -0.5079803466796875, -0.43145751953125, -0.3549346923828125, -0.278411865234375, -0.2018890380859375, -0.1253662109375, -0.0488433837890625, 0.027679443359375, 0.1042022705078125, 0.18072509765625, 0.2572479248046875, 0.333770751953125, 0.4102935791015625, 0.48681640625, 0.5633392333984375, 0.639862060546875, 0.7163848876953125, 0.79290771484375, 0.8694305419921875, 0.945953369140625, 1.0224761962890625, 1.0989990234375, 1.1755218505859375, 1.252044677734375, 1.3285675048828125, 1.40509033203125, 1.4816131591796875, 1.558135986328125, 1.6346588134765625, 1.711181640625, 1.7877044677734375, 1.864227294921875, 1.9407501220703125, 2.01727294921875, 2.0937957763671875, 2.170318603515625, 2.2468414306640625, 2.3233642578125, 2.3998870849609375, 2.476409912109375, 2.5529327392578125, 2.62945556640625, 2.7059783935546875, 2.782501220703125, 2.8590240478515625, 2.935546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 11.0, 12.0, 14.0, 26.0, 20.0, 34.0, 59.0, 86.0, 153.0, 246.0, 389.0, 767.0, 1541.0, 3799.0, 12757.0, 75978.0, 643619.0, 265829.0, 31230.0, 6957.0, 2496.0, 1107.0, 576.0, 339.0, 195.0, 104.0, 77.0, 40.0, 28.0, 23.0, 11.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.3304443359375, -12.012451171875, -11.6944580078125, -11.37646484375, -11.0584716796875, -10.740478515625, -10.4224853515625, -10.1044921875, -9.7864990234375, -9.468505859375, -9.1505126953125, -8.83251953125, -8.5145263671875, -8.196533203125, -7.8785400390625, -7.560546875, -7.2425537109375, -6.924560546875, -6.6065673828125, -6.28857421875, -5.9705810546875, -5.652587890625, -5.3345947265625, -5.0166015625, -4.6986083984375, -4.380615234375, -4.0626220703125, -3.74462890625, -3.4266357421875, -3.108642578125, -2.7906494140625, -2.47265625, -2.1546630859375, -1.836669921875, -1.5186767578125, -1.20068359375, -0.8826904296875, -0.564697265625, -0.2467041015625, 0.0712890625, 0.3892822265625, 0.707275390625, 1.0252685546875, 1.34326171875, 1.6612548828125, 1.979248046875, 2.2972412109375, 2.615234375, 2.9332275390625, 3.251220703125, 3.5692138671875, 3.88720703125, 4.2052001953125, 4.523193359375, 4.8411865234375, 5.1591796875, 5.4771728515625, 5.795166015625, 6.1131591796875, 6.43115234375, 6.7491455078125, 7.067138671875, 7.3851318359375, 7.703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 11.0, 11.0, 23.0, 25.0, 21.0, 28.0, 30.0, 35.0, 47.0, 44.0, 61.0, 57.0, 44.0, 45.0, 46.0, 58.0, 49.0, 53.0, 39.0, 37.0, 29.0, 39.0, 30.0, 24.0, 22.0, 15.0, 10.0, 8.0, 7.0, 10.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.6724853515625, -13.290283203125, -12.9080810546875, -12.52587890625, -12.1436767578125, -11.761474609375, -11.3792724609375, -10.9970703125, -10.6148681640625, -10.232666015625, -9.8504638671875, -9.46826171875, -9.0860595703125, -8.703857421875, -8.3216552734375, -7.939453125, -7.5572509765625, -7.175048828125, -6.7928466796875, -6.41064453125, -6.0284423828125, -5.646240234375, -5.2640380859375, -4.8818359375, -4.4996337890625, -4.117431640625, -3.7352294921875, -3.35302734375, -2.9708251953125, -2.588623046875, -2.2064208984375, -1.82421875, -1.4420166015625, -1.059814453125, -0.6776123046875, -0.29541015625, 0.0867919921875, 0.468994140625, 0.8511962890625, 1.2333984375, 1.6156005859375, 1.997802734375, 2.3800048828125, 2.76220703125, 3.1444091796875, 3.526611328125, 3.9088134765625, 4.291015625, 4.6732177734375, 5.055419921875, 5.4376220703125, 5.81982421875, 6.2020263671875, 6.584228515625, 6.9664306640625, 7.3486328125, 7.7308349609375, 8.113037109375, 8.4952392578125, 8.87744140625, 9.2596435546875, 9.641845703125, 10.0240478515625, 10.40625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 4.0, 11.0, 17.0, 25.0, 42.0, 82.0, 141.0, 280.0, 741.0, 2503.0, 17173.0, 877408.0, 141491.0, 6318.0, 1362.0, 512.0, 202.0, 102.0, 57.0, 17.0, 19.0, 11.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2578125, -9.9788818359375, -9.699951171875, -9.4210205078125, -9.14208984375, -8.8631591796875, -8.584228515625, -8.3052978515625, -8.0263671875, -7.7474365234375, -7.468505859375, -7.1895751953125, -6.91064453125, -6.6317138671875, -6.352783203125, -6.0738525390625, -5.794921875, -5.5159912109375, -5.237060546875, -4.9581298828125, -4.67919921875, -4.4002685546875, -4.121337890625, -3.8424072265625, -3.5634765625, -3.2845458984375, -3.005615234375, -2.7266845703125, -2.44775390625, -2.1688232421875, -1.889892578125, -1.6109619140625, -1.33203125, -1.0531005859375, -0.774169921875, -0.4952392578125, -0.21630859375, 0.0626220703125, 0.341552734375, 0.6204833984375, 0.8994140625, 1.1783447265625, 1.457275390625, 1.7362060546875, 2.01513671875, 2.2940673828125, 2.572998046875, 2.8519287109375, 3.130859375, 3.4097900390625, 3.688720703125, 3.9676513671875, 4.24658203125, 4.5255126953125, 4.804443359375, 5.0833740234375, 5.3623046875, 5.6412353515625, 5.920166015625, 6.1990966796875, 6.47802734375, 6.7569580078125, 7.035888671875, 7.3148193359375, 7.59375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 7.0, 11.0, 11.0, 24.0, 49.0, 80.0, 104.0, 134.0, 170.0, 111.0, 95.0, 76.0, 32.0, 33.0, 18.0, 9.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013856887817382812, -0.0013529956340789795, -0.0013203024864196777, -0.001287609338760376, -0.0012549161911010742, -0.0012222230434417725, -0.0011895298957824707, -0.001156836748123169, -0.0011241436004638672, -0.0010914504528045654, -0.0010587573051452637, -0.001026064157485962, -0.0009933710098266602, -0.0009606778621673584, -0.0009279847145080566, -0.0008952915668487549, -0.0008625984191894531, -0.0008299052715301514, -0.0007972121238708496, -0.0007645189762115479, -0.0007318258285522461, -0.0006991326808929443, -0.0006664395332336426, -0.0006337463855743408, -0.0006010532379150391, -0.0005683600902557373, -0.0005356669425964355, -0.0005029737949371338, -0.00047028064727783203, -0.0004375874996185303, -0.0004048943519592285, -0.00037220120429992676, -0.000339508056640625, -0.00030681490898132324, -0.0002741217613220215, -0.00024142861366271973, -0.00020873546600341797, -0.0001760423183441162, -0.00014334917068481445, -0.0001106560230255127, -7.796287536621094e-05, -4.526972770690918e-05, -1.2576580047607422e-05, 2.0116567611694336e-05, 5.2809715270996094e-05, 8.550286293029785e-05, 0.00011819601058959961, 0.00015088915824890137, 0.00018358230590820312, 0.00021627545356750488, 0.00024896860122680664, 0.0002816617488861084, 0.00031435489654541016, 0.0003470480442047119, 0.00037974119186401367, 0.00041243433952331543, 0.0004451274871826172, 0.00047782063484191895, 0.0005105137825012207, 0.0005432069301605225, 0.0005759000778198242, 0.000608593225479126, 0.0006412863731384277, 0.0006739795207977295, 0.0007066726684570312]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 11.0, 5.0, 11.0, 23.0, 23.0, 49.0, 71.0, 140.0, 312.0, 724.0, 2030.0, 8497.0, 87483.0, 857080.0, 80792.0, 8088.0, 1924.0, 676.0, 268.0, 140.0, 91.0, 43.0, 19.0, 17.0, 10.0, 6.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.7265625, -6.55621337890625, -6.3858642578125, -6.21551513671875, -6.045166015625, -5.87481689453125, -5.7044677734375, -5.53411865234375, -5.36376953125, -5.19342041015625, -5.0230712890625, -4.85272216796875, -4.682373046875, -4.51202392578125, -4.3416748046875, -4.17132568359375, -4.0009765625, -3.83062744140625, -3.6602783203125, -3.48992919921875, -3.319580078125, -3.14923095703125, -2.9788818359375, -2.80853271484375, -2.63818359375, -2.46783447265625, -2.2974853515625, -2.12713623046875, -1.956787109375, -1.78643798828125, -1.6160888671875, -1.44573974609375, -1.275390625, -1.10504150390625, -0.9346923828125, -0.76434326171875, -0.593994140625, -0.42364501953125, -0.2532958984375, -0.08294677734375, 0.08740234375, 0.25775146484375, 0.4281005859375, 0.59844970703125, 0.768798828125, 0.93914794921875, 1.1094970703125, 1.27984619140625, 1.4501953125, 1.62054443359375, 1.7908935546875, 1.96124267578125, 2.131591796875, 2.30194091796875, 2.4722900390625, 2.64263916015625, 2.81298828125, 2.98333740234375, 3.1536865234375, 3.32403564453125, 3.494384765625, 3.66473388671875, 3.8350830078125, 4.00543212890625, 4.17578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 6.0, 9.0, 17.0, 21.0, 21.0, 35.0, 65.0, 65.0, 97.0, 100.0, 101.0, 99.0, 88.0, 74.0, 47.0, 39.0, 23.0, 25.0, 16.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.48046875, -6.3350830078125, -6.189697265625, -6.0443115234375, -5.89892578125, -5.7535400390625, -5.608154296875, -5.4627685546875, -5.3173828125, -5.1719970703125, -5.026611328125, -4.8812255859375, -4.73583984375, -4.5904541015625, -4.445068359375, -4.2996826171875, -4.154296875, -4.0089111328125, -3.863525390625, -3.7181396484375, -3.57275390625, -3.4273681640625, -3.281982421875, -3.1365966796875, -2.9912109375, -2.8458251953125, -2.700439453125, -2.5550537109375, -2.40966796875, -2.2642822265625, -2.118896484375, -1.9735107421875, -1.828125, -1.6827392578125, -1.537353515625, -1.3919677734375, -1.24658203125, -1.1011962890625, -0.955810546875, -0.8104248046875, -0.6650390625, -0.5196533203125, -0.374267578125, -0.2288818359375, -0.08349609375, 0.0618896484375, 0.207275390625, 0.3526611328125, 0.498046875, 0.6434326171875, 0.788818359375, 0.9342041015625, 1.07958984375, 1.2249755859375, 1.370361328125, 1.5157470703125, 1.6611328125, 1.8065185546875, 1.951904296875, 2.0972900390625, 2.24267578125, 2.3880615234375, 2.533447265625, 2.6788330078125, 2.82421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 18.0, 53.0, 80.0, 163.0, 219.0, 203.0, 99.0, 63.0, 36.0, 15.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.42872619628906, -96.5566635131836, -93.68460083007812, -90.81254577636719, -87.94048309326172, -85.06842041015625, -82.19635772705078, -79.32429504394531, -76.45223999023438, -73.5801773071289, -70.70811462402344, -67.8360595703125, -64.96399688720703, -62.09193420410156, -59.219871520996094, -56.347808837890625, -53.475746154785156, -50.60368347167969, -47.731624603271484, -44.859561920166016, -41.98750305175781, -39.115440368652344, -36.243377685546875, -33.371315002441406, -30.499256134033203, -27.627195358276367, -24.75513458251953, -21.883071899414062, -19.011011123657227, -16.13895034790039, -13.266887664794922, -10.394826889038086, -7.522773742675781, -4.650712490081787, -1.778651237487793, 1.0934104919433594, 3.9654712677001953, 6.837532043457031, 9.7095947265625, 12.581655502319336, 15.453716278076172, 18.325777053833008, 21.197837829589844, 24.069900512695312, 26.94196128845215, 29.814022064208984, 32.68608474731445, 35.558143615722656, 38.430206298828125, 41.302268981933594, 44.1743278503418, 47.046390533447266, 49.91844940185547, 52.79051208496094, 55.662574768066406, 58.534637451171875, 61.40669631958008, 64.27875518798828, 67.15081787109375, 70.02288055419922, 72.89494323730469, 75.76699829101562, 78.63906860351562, 81.51112365722656, 84.38318634033203]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 8.0, 20.0, 24.0, 13.0, 23.0, 35.0, 35.0, 37.0, 38.0, 40.0, 51.0, 66.0, 56.0, 83.0, 62.0, 66.0, 42.0, 42.0, 39.0, 36.0, 42.0, 28.0, 23.0, 27.0, 12.0, 8.0, 4.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.788604736328125, -62.07896423339844, -60.36932373046875, -58.6596794128418, -56.95003890991211, -55.24039840698242, -53.530757904052734, -51.82111358642578, -50.111473083496094, -48.401832580566406, -46.69219207763672, -44.982547760009766, -43.27290725708008, -41.56326675415039, -39.8536262512207, -38.14398193359375, -36.43434143066406, -34.724700927734375, -33.01506042480469, -31.305418014526367, -29.595775604248047, -27.88613510131836, -26.176494598388672, -24.46685218811035, -22.757213592529297, -21.04757308959961, -19.33793067932129, -17.6282901763916, -15.918647766113281, -14.209007263183594, -12.49936580657959, -10.789724349975586, -9.080081939697266, -7.370440483093262, -5.660799026489258, -3.951158046722412, -2.241516590118408, -0.5318756103515625, 1.1777658462524414, 2.8874073028564453, 4.597048759460449, 6.306690216064453, 8.016331672668457, 9.725973129272461, 11.435613632202148, 13.145255088806152, 14.854896545410156, 16.564537048339844, 18.274179458618164, 19.98381996154785, 21.693462371826172, 23.40310287475586, 25.11274528503418, 26.822385787963867, 28.532028198242188, 30.241668701171875, 31.951309204101562, 33.66094970703125, 35.37059020996094, 37.08023452758789, 38.78987503051758, 40.499515533447266, 42.20915603637695, 43.918800354003906, 45.628440856933594]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 8.0, 8.0, 11.0, 9.0, 19.0, 19.0, 28.0, 33.0, 75.0, 113.0, 274.0, 710.0, 2794.0, 14757.0, 318398.0, 3810465.0, 38923.0, 5519.0, 1255.0, 402.0, 196.0, 98.0, 55.0, 37.0, 25.0, 15.0, 13.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.421875, -11.0673828125, -10.712890625, -10.3583984375, -10.00390625, -9.6494140625, -9.294921875, -8.9404296875, -8.5859375, -8.2314453125, -7.876953125, -7.5224609375, -7.16796875, -6.8134765625, -6.458984375, -6.1044921875, -5.75, -5.3955078125, -5.041015625, -4.6865234375, -4.33203125, -3.9775390625, -3.623046875, -3.2685546875, -2.9140625, -2.5595703125, -2.205078125, -1.8505859375, -1.49609375, -1.1416015625, -0.787109375, -0.4326171875, -0.078125, 0.2763671875, 0.630859375, 0.9853515625, 1.33984375, 1.6943359375, 2.048828125, 2.4033203125, 2.7578125, 3.1123046875, 3.466796875, 3.8212890625, 4.17578125, 4.5302734375, 4.884765625, 5.2392578125, 5.59375, 5.9482421875, 6.302734375, 6.6572265625, 7.01171875, 7.3662109375, 7.720703125, 8.0751953125, 8.4296875, 8.7841796875, 9.138671875, 9.4931640625, 9.84765625, 10.2021484375, 10.556640625, 10.9111328125, 11.265625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 5.0, 9.0, 19.0, 27.0, 27.0, 43.0, 53.0, 75.0, 98.0, 108.0, 77.0, 106.0, 84.0, 67.0, 58.0, 44.0, 31.0, 17.0, 16.0, 10.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.498992919921875, -3.37103271484375, -3.243072509765625, -3.1151123046875, -2.987152099609375, -2.85919189453125, -2.731231689453125, -2.603271484375, -2.475311279296875, -2.34735107421875, -2.219390869140625, -2.0914306640625, -1.963470458984375, -1.83551025390625, -1.707550048828125, -1.57958984375, -1.451629638671875, -1.32366943359375, -1.195709228515625, -1.0677490234375, -0.939788818359375, -0.81182861328125, -0.683868408203125, -0.555908203125, -0.427947998046875, -0.29998779296875, -0.172027587890625, -0.0440673828125, 0.083892822265625, 0.21185302734375, 0.339813232421875, 0.4677734375, 0.595733642578125, 0.72369384765625, 0.851654052734375, 0.9796142578125, 1.107574462890625, 1.23553466796875, 1.363494873046875, 1.491455078125, 1.619415283203125, 1.74737548828125, 1.875335693359375, 2.0032958984375, 2.131256103515625, 2.25921630859375, 2.387176513671875, 2.51513671875, 2.643096923828125, 2.77105712890625, 2.899017333984375, 3.0269775390625, 3.154937744140625, 3.28289794921875, 3.410858154296875, 3.538818359375, 3.666778564453125, 3.79473876953125, 3.922698974609375, 4.0506591796875, 4.178619384765625, 4.30657958984375, 4.434539794921875, 4.5625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 8.0, 10.0, 8.0, 12.0, 21.0, 32.0, 48.0, 67.0, 116.0, 186.0, 402.0, 856.0, 1786.0, 4993.0, 17614.0, 99467.0, 3604564.0, 415762.0, 34951.0, 8239.0, 2732.0, 1081.0, 543.0, 259.0, 146.0, 118.0, 63.0, 45.0, 36.0, 25.0, 13.0, 17.0, 14.0, 6.0, 12.0, 6.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.82568359375, -8.5185546875, -8.21142578125, -7.904296875, -7.59716796875, -7.2900390625, -6.98291015625, -6.67578125, -6.36865234375, -6.0615234375, -5.75439453125, -5.447265625, -5.14013671875, -4.8330078125, -4.52587890625, -4.21875, -3.91162109375, -3.6044921875, -3.29736328125, -2.990234375, -2.68310546875, -2.3759765625, -2.06884765625, -1.76171875, -1.45458984375, -1.1474609375, -0.84033203125, -0.533203125, -0.22607421875, 0.0810546875, 0.38818359375, 0.6953125, 1.00244140625, 1.3095703125, 1.61669921875, 1.923828125, 2.23095703125, 2.5380859375, 2.84521484375, 3.15234375, 3.45947265625, 3.7666015625, 4.07373046875, 4.380859375, 4.68798828125, 4.9951171875, 5.30224609375, 5.609375, 5.91650390625, 6.2236328125, 6.53076171875, 6.837890625, 7.14501953125, 7.4521484375, 7.75927734375, 8.06640625, 8.37353515625, 8.6806640625, 8.98779296875, 9.294921875, 9.60205078125, 9.9091796875, 10.21630859375, 10.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 14.0, 31.0, 36.0, 60.0, 149.0, 435.0, 1861.0, 1003.0, 238.0, 107.0, 39.0, 33.0, 19.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.181396484375, -6.75341796875, -6.325439453125, -5.8974609375, -5.469482421875, -5.04150390625, -4.613525390625, -4.185546875, -3.757568359375, -3.32958984375, -2.901611328125, -2.4736328125, -2.045654296875, -1.61767578125, -1.189697265625, -0.76171875, -0.333740234375, 0.09423828125, 0.522216796875, 0.9501953125, 1.378173828125, 1.80615234375, 2.234130859375, 2.662109375, 3.090087890625, 3.51806640625, 3.946044921875, 4.3740234375, 4.802001953125, 5.22998046875, 5.657958984375, 6.0859375, 6.513916015625, 6.94189453125, 7.369873046875, 7.7978515625, 8.225830078125, 8.65380859375, 9.081787109375, 9.509765625, 9.937744140625, 10.36572265625, 10.793701171875, 11.2216796875, 11.649658203125, 12.07763671875, 12.505615234375, 12.93359375, 13.361572265625, 13.78955078125, 14.217529296875, 14.6455078125, 15.073486328125, 15.50146484375, 15.929443359375, 16.357421875, 16.785400390625, 17.21337890625, 17.641357421875, 18.0693359375, 18.497314453125, 18.92529296875, 19.353271484375, 19.78125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 13.0, 35.0, 74.0, 162.0, 249.0, 246.0, 115.0, 42.0, 23.0, 15.0, 8.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.06118774414062, -95.5317153930664, -93.00223541259766, -90.47276306152344, -87.94329071044922, -85.413818359375, -82.88433837890625, -80.35486602783203, -77.82539367675781, -75.2959213256836, -72.76644134521484, -70.23696899414062, -67.7074966430664, -65.17802429199219, -62.64854431152344, -60.11907196044922, -57.58959197998047, -55.060115814208984, -52.530643463134766, -50.00116729736328, -47.47169494628906, -44.94221878051758, -42.412742614746094, -39.883270263671875, -37.35379409790039, -34.824317932128906, -32.29484558105469, -29.765369415283203, -27.23589515686035, -24.7064208984375, -22.176944732666016, -19.647470474243164, -17.117996215820312, -14.588521957397461, -12.059046745300293, -9.529571533203125, -7.000097274780273, -4.470623016357422, -1.941147804260254, 0.5883274078369141, 3.1178016662597656, 5.647276401519775, 8.176751136779785, 10.706226348876953, 13.235700607299805, 15.765174865722656, 18.29465103149414, 20.824125289916992, 23.353599548339844, 25.883073806762695, 28.412548065185547, 30.94202423095703, 33.47149658203125, 36.000972747802734, 38.53044891357422, 41.05992126464844, 43.58939743041992, 46.118873596191406, 48.648345947265625, 51.17782211303711, 53.707298278808594, 56.23677062988281, 58.7662467956543, 61.29572296142578, 63.8251953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 12.0, 14.0, 13.0, 16.0, 19.0, 25.0, 25.0, 27.0, 27.0, 44.0, 51.0, 52.0, 47.0, 45.0, 51.0, 47.0, 45.0, 65.0, 47.0, 36.0, 31.0, 36.0, 25.0, 27.0, 25.0, 22.0, 22.0, 17.0, 15.0, 15.0, 10.0, 8.0, 3.0, 5.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.665313720703125, -30.710559844970703, -29.75580406188965, -28.801048278808594, -27.846294403076172, -26.89154052734375, -25.936784744262695, -24.98202896118164, -24.02727508544922, -23.072521209716797, -22.117765426635742, -21.163009643554688, -20.208255767822266, -19.253501892089844, -18.29874610900879, -17.343990325927734, -16.389236450195312, -15.434481620788574, -14.479726791381836, -13.524971961975098, -12.57021713256836, -11.615462303161621, -10.660707473754883, -9.705952644348145, -8.751197814941406, -7.796442985534668, -6.84168815612793, -5.886933326721191, -4.932178497314453, -3.977423667907715, -3.0226688385009766, -2.0679140090942383, -1.1131591796875, -0.15840435028076172, 0.7963504791259766, 1.7511053085327148, 2.705860137939453, 3.6606149673461914, 4.61536979675293, 5.570124626159668, 6.524879455566406, 7.4796342849731445, 8.434389114379883, 9.389143943786621, 10.34389877319336, 11.298653602600098, 12.253408432006836, 13.208163261413574, 14.162918090820312, 15.11767292022705, 16.07242774963379, 17.027183532714844, 17.981937408447266, 18.936691284179688, 19.891447067260742, 20.846202850341797, 21.80095672607422, 22.75571060180664, 23.710466384887695, 24.66522216796875, 25.619976043701172, 26.574729919433594, 27.52948570251465, 28.484241485595703, 29.438995361328125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 10.0, 17.0, 19.0, 23.0, 36.0, 80.0, 74.0, 122.0, 191.0, 327.0, 474.0, 793.0, 1232.0, 2173.0, 3746.0, 6908.0, 12439.0, 24460.0, 48435.0, 99127.0, 203729.0, 292361.0, 177847.0, 85469.0, 41327.0, 21264.0, 11109.0, 6151.0, 3470.0, 1938.0, 1170.0, 681.0, 451.0, 303.0, 202.0, 124.0, 82.0, 64.0, 43.0, 23.0, 9.0, 14.0, 10.0, 3.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.80078125, -3.6834716796875, -3.566162109375, -3.4488525390625, -3.33154296875, -3.2142333984375, -3.096923828125, -2.9796142578125, -2.8623046875, -2.7449951171875, -2.627685546875, -2.5103759765625, -2.39306640625, -2.2757568359375, -2.158447265625, -2.0411376953125, -1.923828125, -1.8065185546875, -1.689208984375, -1.5718994140625, -1.45458984375, -1.3372802734375, -1.219970703125, -1.1026611328125, -0.9853515625, -0.8680419921875, -0.750732421875, -0.6334228515625, -0.51611328125, -0.3988037109375, -0.281494140625, -0.1641845703125, -0.046875, 0.0704345703125, 0.187744140625, 0.3050537109375, 0.42236328125, 0.5396728515625, 0.656982421875, 0.7742919921875, 0.8916015625, 1.0089111328125, 1.126220703125, 1.2435302734375, 1.36083984375, 1.4781494140625, 1.595458984375, 1.7127685546875, 1.830078125, 1.9473876953125, 2.064697265625, 2.1820068359375, 2.29931640625, 2.4166259765625, 2.533935546875, 2.6512451171875, 2.7685546875, 2.8858642578125, 3.003173828125, 3.1204833984375, 3.23779296875, 3.3551025390625, 3.472412109375, 3.5897216796875, 3.70703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 9.0, 10.0, 16.0, 17.0, 29.0, 24.0, 22.0, 22.0, 34.0, 38.0, 50.0, 32.0, 31.0, 50.0, 53.0, 43.0, 40.0, 55.0, 50.0, 35.0, 31.0, 48.0, 34.0, 28.0, 26.0, 22.0, 19.0, 20.0, 12.0, 10.0, 8.0, 8.0, 9.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.3125, -2.24298095703125, -2.1734619140625, -2.10394287109375, -2.034423828125, -1.96490478515625, -1.8953857421875, -1.82586669921875, -1.75634765625, -1.68682861328125, -1.6173095703125, -1.54779052734375, -1.478271484375, -1.40875244140625, -1.3392333984375, -1.26971435546875, -1.2001953125, -1.13067626953125, -1.0611572265625, -0.99163818359375, -0.922119140625, -0.85260009765625, -0.7830810546875, -0.71356201171875, -0.64404296875, -0.57452392578125, -0.5050048828125, -0.43548583984375, -0.365966796875, -0.29644775390625, -0.2269287109375, -0.15740966796875, -0.087890625, -0.01837158203125, 0.0511474609375, 0.12066650390625, 0.190185546875, 0.25970458984375, 0.3292236328125, 0.39874267578125, 0.46826171875, 0.53778076171875, 0.6072998046875, 0.67681884765625, 0.746337890625, 0.81585693359375, 0.8853759765625, 0.95489501953125, 1.0244140625, 1.09393310546875, 1.1634521484375, 1.23297119140625, 1.302490234375, 1.37200927734375, 1.4415283203125, 1.51104736328125, 1.58056640625, 1.65008544921875, 1.7196044921875, 1.78912353515625, 1.858642578125, 1.92816162109375, 1.9976806640625, 2.06719970703125, 2.13671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 16.0, 27.0, 26.0, 39.0, 50.0, 79.0, 106.0, 165.0, 259.0, 476.0, 843.0, 1832.0, 4579.0, 15859.0, 77060.0, 524742.0, 345651.0, 57077.0, 12561.0, 3754.0, 1514.0, 716.0, 372.0, 249.0, 135.0, 99.0, 65.0, 45.0, 44.0, 27.0, 13.0, 19.0, 4.0, 6.0, 7.0, 6.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0], "bins": [-11.375, -11.074951171875, -10.77490234375, -10.474853515625, -10.1748046875, -9.874755859375, -9.57470703125, -9.274658203125, -8.974609375, -8.674560546875, -8.37451171875, -8.074462890625, -7.7744140625, -7.474365234375, -7.17431640625, -6.874267578125, -6.57421875, -6.274169921875, -5.97412109375, -5.674072265625, -5.3740234375, -5.073974609375, -4.77392578125, -4.473876953125, -4.173828125, -3.873779296875, -3.57373046875, -3.273681640625, -2.9736328125, -2.673583984375, -2.37353515625, -2.073486328125, -1.7734375, -1.473388671875, -1.17333984375, -0.873291015625, -0.5732421875, -0.273193359375, 0.02685546875, 0.326904296875, 0.626953125, 0.927001953125, 1.22705078125, 1.527099609375, 1.8271484375, 2.127197265625, 2.42724609375, 2.727294921875, 3.02734375, 3.327392578125, 3.62744140625, 3.927490234375, 4.2275390625, 4.527587890625, 4.82763671875, 5.127685546875, 5.427734375, 5.727783203125, 6.02783203125, 6.327880859375, 6.6279296875, 6.927978515625, 7.22802734375, 7.528076171875, 7.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 15.0, 11.0, 13.0, 19.0, 32.0, 24.0, 33.0, 41.0, 35.0, 53.0, 51.0, 55.0, 52.0, 78.0, 37.0, 49.0, 50.0, 33.0, 45.0, 54.0, 29.0, 29.0, 23.0, 23.0, 17.0, 9.0, 14.0, 7.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.796875, -13.4326171875, -13.068359375, -12.7041015625, -12.33984375, -11.9755859375, -11.611328125, -11.2470703125, -10.8828125, -10.5185546875, -10.154296875, -9.7900390625, -9.42578125, -9.0615234375, -8.697265625, -8.3330078125, -7.96875, -7.6044921875, -7.240234375, -6.8759765625, -6.51171875, -6.1474609375, -5.783203125, -5.4189453125, -5.0546875, -4.6904296875, -4.326171875, -3.9619140625, -3.59765625, -3.2333984375, -2.869140625, -2.5048828125, -2.140625, -1.7763671875, -1.412109375, -1.0478515625, -0.68359375, -0.3193359375, 0.044921875, 0.4091796875, 0.7734375, 1.1376953125, 1.501953125, 1.8662109375, 2.23046875, 2.5947265625, 2.958984375, 3.3232421875, 3.6875, 4.0517578125, 4.416015625, 4.7802734375, 5.14453125, 5.5087890625, 5.873046875, 6.2373046875, 6.6015625, 6.9658203125, 7.330078125, 7.6943359375, 8.05859375, 8.4228515625, 8.787109375, 9.1513671875, 9.515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 11.0, 20.0, 20.0, 38.0, 47.0, 83.0, 155.0, 275.0, 556.0, 1418.0, 5189.0, 37326.0, 647456.0, 328863.0, 21122.0, 3785.0, 1109.0, 465.0, 222.0, 128.0, 72.0, 52.0, 27.0, 18.0, 15.0, 12.0, 15.0, 5.0, 6.0, 0.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.0078125, -5.857177734375, -5.70654296875, -5.555908203125, -5.4052734375, -5.254638671875, -5.10400390625, -4.953369140625, -4.802734375, -4.652099609375, -4.50146484375, -4.350830078125, -4.2001953125, -4.049560546875, -3.89892578125, -3.748291015625, -3.59765625, -3.447021484375, -3.29638671875, -3.145751953125, -2.9951171875, -2.844482421875, -2.69384765625, -2.543212890625, -2.392578125, -2.241943359375, -2.09130859375, -1.940673828125, -1.7900390625, -1.639404296875, -1.48876953125, -1.338134765625, -1.1875, -1.036865234375, -0.88623046875, -0.735595703125, -0.5849609375, -0.434326171875, -0.28369140625, -0.133056640625, 0.017578125, 0.168212890625, 0.31884765625, 0.469482421875, 0.6201171875, 0.770751953125, 0.92138671875, 1.072021484375, 1.22265625, 1.373291015625, 1.52392578125, 1.674560546875, 1.8251953125, 1.975830078125, 2.12646484375, 2.277099609375, 2.427734375, 2.578369140625, 2.72900390625, 2.879638671875, 3.0302734375, 3.180908203125, 3.33154296875, 3.482177734375, 3.6328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 13.0, 18.0, 15.0, 24.0, 30.0, 40.0, 26.0, 44.0, 48.0, 64.0, 62.0, 82.0, 66.0, 62.0, 52.0, 43.0, 55.0, 34.0, 38.0, 34.0, 24.0, 17.0, 18.0, 10.0, 15.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0005655288696289062, -0.0005498901009559631, -0.00053425133228302, -0.0005186125636100769, -0.0005029737949371338, -0.0004873350262641907, -0.00047169625759124756, -0.00045605748891830444, -0.00044041872024536133, -0.0004247799515724182, -0.0004091411828994751, -0.000393502414226532, -0.00037786364555358887, -0.00036222487688064575, -0.00034658610820770264, -0.0003309473395347595, -0.0003153085708618164, -0.0002996698021888733, -0.0002840310335159302, -0.00026839226484298706, -0.00025275349617004395, -0.00023711472749710083, -0.00022147595882415771, -0.0002058371901512146, -0.00019019842147827148, -0.00017455965280532837, -0.00015892088413238525, -0.00014328211545944214, -0.00012764334678649902, -0.00011200457811355591, -9.636580944061279e-05, -8.072704076766968e-05, -6.508827209472656e-05, -4.944950342178345e-05, -3.381073474884033e-05, -1.8171966075897217e-05, -2.5331974029541016e-06, 1.3105571269989014e-05, 2.874433994293213e-05, 4.4383108615875244e-05, 6.002187728881836e-05, 7.566064596176147e-05, 9.129941463470459e-05, 0.0001069381833076477, 0.00012257695198059082, 0.00013821572065353394, 0.00015385448932647705, 0.00016949325799942017, 0.00018513202667236328, 0.0002007707953453064, 0.0002164095640182495, 0.00023204833269119263, 0.00024768710136413574, 0.00026332587003707886, 0.00027896463871002197, 0.0002946034073829651, 0.0003102421760559082, 0.0003258809447288513, 0.00034151971340179443, 0.00035715848207473755, 0.00037279725074768066, 0.0003884360194206238, 0.0004040747880935669, 0.00041971355676651, 0.0004353523254394531]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 6.0, 3.0, 5.0, 8.0, 14.0, 10.0, 28.0, 39.0, 59.0, 104.0, 230.0, 464.0, 1294.0, 4355.0, 26271.0, 399355.0, 575381.0, 33314.0, 5115.0, 1422.0, 520.0, 238.0, 119.0, 62.0, 42.0, 32.0, 20.0, 9.0, 11.0, 6.0, 7.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.1015625, -4.960052490234375, -4.81854248046875, -4.677032470703125, -4.5355224609375, -4.394012451171875, -4.25250244140625, -4.110992431640625, -3.969482421875, -3.827972412109375, -3.68646240234375, -3.544952392578125, -3.4034423828125, -3.261932373046875, -3.12042236328125, -2.978912353515625, -2.83740234375, -2.695892333984375, -2.55438232421875, -2.412872314453125, -2.2713623046875, -2.129852294921875, -1.98834228515625, -1.846832275390625, -1.705322265625, -1.563812255859375, -1.42230224609375, -1.280792236328125, -1.1392822265625, -0.997772216796875, -0.85626220703125, -0.714752197265625, -0.5732421875, -0.431732177734375, -0.29022216796875, -0.148712158203125, -0.0072021484375, 0.134307861328125, 0.27581787109375, 0.417327880859375, 0.558837890625, 0.700347900390625, 0.84185791015625, 0.983367919921875, 1.1248779296875, 1.266387939453125, 1.40789794921875, 1.549407958984375, 1.69091796875, 1.832427978515625, 1.97393798828125, 2.115447998046875, 2.2569580078125, 2.398468017578125, 2.53997802734375, 2.681488037109375, 2.822998046875, 2.964508056640625, 3.10601806640625, 3.247528076171875, 3.3890380859375, 3.530548095703125, 3.67205810546875, 3.813568115234375, 3.955078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 17.0, 35.0, 28.0, 45.0, 56.0, 62.0, 73.0, 100.0, 99.0, 113.0, 84.0, 71.0, 45.0, 47.0, 35.0, 21.0, 22.0, 8.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.15277099609375, -3.0242919921875, -2.89581298828125, -2.767333984375, -2.63885498046875, -2.5103759765625, -2.38189697265625, -2.25341796875, -2.12493896484375, -1.9964599609375, -1.86798095703125, -1.739501953125, -1.61102294921875, -1.4825439453125, -1.35406494140625, -1.2255859375, -1.09710693359375, -0.9686279296875, -0.84014892578125, -0.711669921875, -0.58319091796875, -0.4547119140625, -0.32623291015625, -0.19775390625, -0.06927490234375, 0.0592041015625, 0.18768310546875, 0.316162109375, 0.44464111328125, 0.5731201171875, 0.70159912109375, 0.830078125, 0.95855712890625, 1.0870361328125, 1.21551513671875, 1.343994140625, 1.47247314453125, 1.6009521484375, 1.72943115234375, 1.85791015625, 1.98638916015625, 2.1148681640625, 2.24334716796875, 2.371826171875, 2.50030517578125, 2.6287841796875, 2.75726318359375, 2.8857421875, 3.01422119140625, 3.1427001953125, 3.27117919921875, 3.399658203125, 3.52813720703125, 3.6566162109375, 3.78509521484375, 3.91357421875, 4.04205322265625, 4.1705322265625, 4.29901123046875, 4.427490234375, 4.55596923828125, 4.6844482421875, 4.81292724609375, 4.94140625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 16.0, 54.0, 101.0, 148.0, 221.0, 187.0, 120.0, 58.0, 28.0, 17.0, 12.0, 7.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.37223815917969, -67.91392517089844, -65.45560455322266, -62.997291564941406, -60.53897476196289, -58.080657958984375, -55.622344970703125, -53.16402816772461, -50.705711364746094, -48.24739456176758, -45.78908157348633, -43.33076477050781, -40.8724479675293, -38.41413116455078, -35.95581817626953, -33.497501373291016, -31.039188385009766, -28.580873489379883, -26.122556686401367, -23.664241790771484, -21.20592498779297, -18.747610092163086, -16.289295196533203, -13.830978393554688, -11.372663497924805, -8.914347648620605, -6.4560322761535645, -3.9977169036865234, -1.5394010543823242, 0.918914794921875, 3.377229690551758, 5.835546493530273, 8.293861389160156, 10.752177238464355, 13.210493087768555, 15.668807983398438, 18.127124786376953, 20.585439682006836, 23.04375457763672, 25.502071380615234, 27.960386276245117, 30.418701171875, 32.877017974853516, 35.33533477783203, 37.79364776611328, 40.2519645690918, 42.71028137207031, 45.16859436035156, 47.62691116333008, 50.085227966308594, 52.543540954589844, 55.00185775756836, 57.460174560546875, 59.918487548828125, 62.37680435180664, 64.83512115478516, 67.2934341430664, 69.75174713134766, 72.21006774902344, 74.66838073730469, 77.12669372558594, 79.58501434326172, 82.04332733154297, 84.50164794921875, 86.9599609375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 8.0, 2.0, 8.0, 13.0, 18.0, 14.0, 8.0, 26.0, 25.0, 27.0, 26.0, 33.0, 42.0, 30.0, 44.0, 36.0, 43.0, 54.0, 46.0, 54.0, 47.0, 53.0, 36.0, 35.0, 36.0, 29.0, 27.0, 30.0, 13.0, 21.0, 14.0, 19.0, 11.0, 12.0, 9.0, 6.0, 10.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-38.6396369934082, -37.434715270996094, -36.22979736328125, -35.02487564086914, -33.81995391845703, -32.61503219604492, -31.410112380981445, -30.20519256591797, -29.00027084350586, -27.79534912109375, -26.590429306030273, -25.385509490966797, -24.180587768554688, -22.975666046142578, -21.7707462310791, -20.565826416015625, -19.360904693603516, -18.155982971191406, -16.95106315612793, -15.746142387390137, -14.541221618652344, -13.33630084991455, -12.131380081176758, -10.926459312438965, -9.721538543701172, -8.516617774963379, -7.311697006225586, -6.106776237487793, -4.90185546875, -3.696934700012207, -2.492013931274414, -1.287093162536621, -0.08217620849609375, 1.1227445602416992, 2.327665328979492, 3.532586097717285, 4.737506866455078, 5.942427635192871, 7.147348403930664, 8.352269172668457, 9.55718994140625, 10.762110710144043, 11.967031478881836, 13.171952247619629, 14.376873016357422, 15.581793785095215, 16.786714553833008, 17.991634368896484, 19.196556091308594, 20.401477813720703, 21.60639762878418, 22.811317443847656, 24.016239166259766, 25.221160888671875, 26.42608070373535, 27.631000518798828, 28.835922241210938, 30.040843963623047, 31.245763778686523, 32.45068359375, 33.65560531616211, 34.86052703857422, 36.06544494628906, 37.27036666870117, 38.47528839111328]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 6.0, 3.0, 12.0, 10.0, 14.0, 28.0, 27.0, 57.0, 88.0, 127.0, 227.0, 347.0, 639.0, 1210.0, 2231.0, 4367.0, 9172.0, 21649.0, 63123.0, 280219.0, 1704031.0, 1703465.0, 297035.0, 65839.0, 21883.0, 9246.0, 4316.0, 2223.0, 1132.0, 617.0, 372.0, 216.0, 110.0, 89.0, 51.0, 28.0, 26.0, 17.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-3.310546875, -3.225677490234375, -3.14080810546875, -3.055938720703125, -2.9710693359375, -2.886199951171875, -2.80133056640625, -2.716461181640625, -2.631591796875, -2.546722412109375, -2.46185302734375, -2.376983642578125, -2.2921142578125, -2.207244873046875, -2.12237548828125, -2.037506103515625, -1.95263671875, -1.867767333984375, -1.78289794921875, -1.698028564453125, -1.6131591796875, -1.528289794921875, -1.44342041015625, -1.358551025390625, -1.273681640625, -1.188812255859375, -1.10394287109375, -1.019073486328125, -0.9342041015625, -0.849334716796875, -0.76446533203125, -0.679595947265625, -0.5947265625, -0.509857177734375, -0.42498779296875, -0.340118408203125, -0.2552490234375, -0.170379638671875, -0.08551025390625, -0.000640869140625, 0.084228515625, 0.169097900390625, 0.25396728515625, 0.338836669921875, 0.4237060546875, 0.508575439453125, 0.59344482421875, 0.678314208984375, 0.76318359375, 0.848052978515625, 0.93292236328125, 1.017791748046875, 1.1026611328125, 1.187530517578125, 1.27239990234375, 1.357269287109375, 1.442138671875, 1.527008056640625, 1.61187744140625, 1.696746826171875, 1.7816162109375, 1.866485595703125, 1.95135498046875, 2.036224365234375, 2.12109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 10.0, 4.0, 16.0, 12.0, 16.0, 17.0, 19.0, 14.0, 32.0, 26.0, 21.0, 35.0, 32.0, 44.0, 46.0, 44.0, 35.0, 49.0, 58.0, 47.0, 49.0, 50.0, 37.0, 45.0, 34.0, 27.0, 29.0, 19.0, 28.0, 19.0, 12.0, 16.0, 9.0, 11.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.708984375, -1.642852783203125, -1.57672119140625, -1.510589599609375, -1.4444580078125, -1.378326416015625, -1.31219482421875, -1.246063232421875, -1.179931640625, -1.113800048828125, -1.04766845703125, -0.981536865234375, -0.9154052734375, -0.849273681640625, -0.78314208984375, -0.717010498046875, -0.65087890625, -0.584747314453125, -0.51861572265625, -0.452484130859375, -0.3863525390625, -0.320220947265625, -0.25408935546875, -0.187957763671875, -0.121826171875, -0.055694580078125, 0.01043701171875, 0.076568603515625, 0.1427001953125, 0.208831787109375, 0.27496337890625, 0.341094970703125, 0.4072265625, 0.473358154296875, 0.53948974609375, 0.605621337890625, 0.6717529296875, 0.737884521484375, 0.80401611328125, 0.870147705078125, 0.936279296875, 1.002410888671875, 1.06854248046875, 1.134674072265625, 1.2008056640625, 1.266937255859375, 1.33306884765625, 1.399200439453125, 1.46533203125, 1.531463623046875, 1.59759521484375, 1.663726806640625, 1.7298583984375, 1.795989990234375, 1.86212158203125, 1.928253173828125, 1.994384765625, 2.060516357421875, 2.12664794921875, 2.192779541015625, 2.2589111328125, 2.325042724609375, 2.39117431640625, 2.457305908203125, 2.5234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 14.0, 13.0, 19.0, 33.0, 28.0, 55.0, 85.0, 126.0, 193.0, 375.0, 728.0, 1579.0, 3799.0, 10193.0, 35871.0, 187886.0, 3011319.0, 832088.0, 79997.0, 18960.0, 6155.0, 2373.0, 1042.0, 527.0, 298.0, 182.0, 91.0, 64.0, 51.0, 28.0, 21.0, 22.0, 13.0, 12.0, 6.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.7374267578125, -5.556884765625, -5.3763427734375, -5.19580078125, -5.0152587890625, -4.834716796875, -4.6541748046875, -4.4736328125, -4.2930908203125, -4.112548828125, -3.9320068359375, -3.75146484375, -3.5709228515625, -3.390380859375, -3.2098388671875, -3.029296875, -2.8487548828125, -2.668212890625, -2.4876708984375, -2.30712890625, -2.1265869140625, -1.946044921875, -1.7655029296875, -1.5849609375, -1.4044189453125, -1.223876953125, -1.0433349609375, -0.86279296875, -0.6822509765625, -0.501708984375, -0.3211669921875, -0.140625, 0.0399169921875, 0.220458984375, 0.4010009765625, 0.58154296875, 0.7620849609375, 0.942626953125, 1.1231689453125, 1.3037109375, 1.4842529296875, 1.664794921875, 1.8453369140625, 2.02587890625, 2.2064208984375, 2.386962890625, 2.5675048828125, 2.748046875, 2.9285888671875, 3.109130859375, 3.2896728515625, 3.47021484375, 3.6507568359375, 3.831298828125, 4.0118408203125, 4.1923828125, 4.3729248046875, 4.553466796875, 4.7340087890625, 4.91455078125, 5.0950927734375, 5.275634765625, 5.4561767578125, 5.63671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 5.0, 7.0, 8.0, 9.0, 15.0, 13.0, 21.0, 23.0, 36.0, 56.0, 70.0, 106.0, 165.0, 276.0, 460.0, 716.0, 780.0, 503.0, 282.0, 151.0, 95.0, 81.0, 52.0, 44.0, 20.0, 20.0, 6.0, 12.0, 8.0, 6.0, 3.0, 10.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9375, -5.740234375, -5.54296875, -5.345703125, -5.1484375, -4.951171875, -4.75390625, -4.556640625, -4.359375, -4.162109375, -3.96484375, -3.767578125, -3.5703125, -3.373046875, -3.17578125, -2.978515625, -2.78125, -2.583984375, -2.38671875, -2.189453125, -1.9921875, -1.794921875, -1.59765625, -1.400390625, -1.203125, -1.005859375, -0.80859375, -0.611328125, -0.4140625, -0.216796875, -0.01953125, 0.177734375, 0.375, 0.572265625, 0.76953125, 0.966796875, 1.1640625, 1.361328125, 1.55859375, 1.755859375, 1.953125, 2.150390625, 2.34765625, 2.544921875, 2.7421875, 2.939453125, 3.13671875, 3.333984375, 3.53125, 3.728515625, 3.92578125, 4.123046875, 4.3203125, 4.517578125, 4.71484375, 4.912109375, 5.109375, 5.306640625, 5.50390625, 5.701171875, 5.8984375, 6.095703125, 6.29296875, 6.490234375, 6.6875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 12.0, 20.0, 88.0, 193.0, 289.0, 246.0, 88.0, 32.0, 11.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.10240936279297, -63.84999465942383, -60.59757995605469, -57.34516143798828, -54.092750549316406, -50.84033203125, -47.58791732788086, -44.33550262451172, -41.08308792114258, -37.83067321777344, -34.5782585144043, -31.325841903686523, -28.073427200317383, -24.821012496948242, -21.56859588623047, -18.316181182861328, -15.063766479492188, -11.811351776123047, -8.55893611907959, -5.306520462036133, -2.054105758666992, 1.1983089447021484, 4.450725555419922, 7.7031402587890625, 10.955554962158203, 14.207969665527344, 17.460384368896484, 20.712800979614258, 23.9652156829834, 27.21763038635254, 30.470046997070312, 33.72246170043945, 36.97486877441406, 40.2272834777832, 43.479698181152344, 46.73211669921875, 49.984527587890625, 53.23694610595703, 56.48936080932617, 59.74177551269531, 62.99419021606445, 66.2466049194336, 69.4990234375, 72.75143432617188, 76.00385284423828, 79.25626373291016, 82.50868225097656, 85.76109313964844, 89.01351165771484, 92.26593017578125, 95.51834106445312, 98.77075958251953, 102.0231704711914, 105.27558898925781, 108.52799987792969, 111.7804183959961, 115.0328369140625, 118.2852554321289, 121.53766632080078, 124.79008483886719, 128.04249572753906, 131.29490661621094, 134.54733276367188, 137.79974365234375, 141.05215454101562]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 3.0, 3.0, 6.0, 8.0, 14.0, 9.0, 13.0, 26.0, 31.0, 38.0, 43.0, 41.0, 38.0, 45.0, 67.0, 62.0, 68.0, 58.0, 55.0, 48.0, 59.0, 40.0, 55.0, 37.0, 28.0, 23.0, 25.0, 20.0, 15.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.968656539916992, -25.84511375427246, -24.72157096862793, -23.59803009033203, -22.4744873046875, -21.35094451904297, -20.227401733398438, -19.103858947753906, -17.980316162109375, -16.856773376464844, -15.733231544494629, -14.609688758850098, -13.486146926879883, -12.362604141235352, -11.23906135559082, -10.115518569946289, -8.99197769165039, -7.868435382843018, -6.7448930740356445, -5.621350288391113, -4.49780797958374, -3.374265670776367, -2.250722885131836, -1.127180576324463, -0.0036382675170898438, 1.1199041604995728, 2.2434465885162354, 3.3669891357421875, 4.4905314445495605, 5.614073753356934, 6.737616539001465, 7.861158847808838, 8.984699249267578, 10.10824203491211, 11.231783866882324, 12.355326652526855, 13.47886848449707, 14.602411270141602, 15.725954055786133, 16.849496841430664, 17.973037719726562, 19.096580505371094, 20.220123291015625, 21.343666076660156, 22.467206954956055, 23.590749740600586, 24.714292526245117, 25.83783531188965, 26.96137809753418, 28.08492088317871, 29.208463668823242, 30.33200454711914, 31.455547332763672, 32.5790901184082, 33.702632904052734, 34.826175689697266, 35.9497184753418, 37.07326126098633, 38.19680404663086, 39.32034683227539, 40.44388961791992, 41.56742858886719, 42.69097137451172, 43.81451416015625, 44.93805694580078]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 9.0, 8.0, 30.0, 46.0, 64.0, 98.0, 122.0, 194.0, 366.0, 505.0, 840.0, 1494.0, 2527.0, 4274.0, 7604.0, 13225.0, 23319.0, 40756.0, 70203.0, 116426.0, 179661.0, 206315.0, 153024.0, 94577.0, 56564.0, 32489.0, 18455.0, 10796.0, 6017.0, 3516.0, 2028.0, 1175.0, 667.0, 424.0, 262.0, 166.0, 105.0, 69.0, 46.0, 33.0, 22.0, 13.0, 8.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.31640625, -2.237335205078125, -2.15826416015625, -2.079193115234375, -2.0001220703125, -1.921051025390625, -1.84197998046875, -1.762908935546875, -1.683837890625, -1.604766845703125, -1.52569580078125, -1.446624755859375, -1.3675537109375, -1.288482666015625, -1.20941162109375, -1.130340576171875, -1.05126953125, -0.972198486328125, -0.89312744140625, -0.814056396484375, -0.7349853515625, -0.655914306640625, -0.57684326171875, -0.497772216796875, -0.418701171875, -0.339630126953125, -0.26055908203125, -0.181488037109375, -0.1024169921875, -0.023345947265625, 0.05572509765625, 0.134796142578125, 0.2138671875, 0.292938232421875, 0.37200927734375, 0.451080322265625, 0.5301513671875, 0.609222412109375, 0.68829345703125, 0.767364501953125, 0.846435546875, 0.925506591796875, 1.00457763671875, 1.083648681640625, 1.1627197265625, 1.241790771484375, 1.32086181640625, 1.399932861328125, 1.47900390625, 1.558074951171875, 1.63714599609375, 1.716217041015625, 1.7952880859375, 1.874359130859375, 1.95343017578125, 2.032501220703125, 2.111572265625, 2.190643310546875, 2.26971435546875, 2.348785400390625, 2.4278564453125, 2.506927490234375, 2.58599853515625, 2.665069580078125, 2.744140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 12.0, 12.0, 18.0, 26.0, 20.0, 28.0, 25.0, 31.0, 36.0, 28.0, 32.0, 39.0, 39.0, 41.0, 69.0, 50.0, 45.0, 57.0, 33.0, 41.0, 37.0, 35.0, 26.0, 33.0, 22.0, 31.0, 20.0, 15.0, 11.0, 14.0, 9.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7544097900390625, -1.689483642578125, -1.6245574951171875, -1.55963134765625, -1.4947052001953125, -1.429779052734375, -1.3648529052734375, -1.2999267578125, -1.2350006103515625, -1.170074462890625, -1.1051483154296875, -1.04022216796875, -0.9752960205078125, -0.910369873046875, -0.8454437255859375, -0.780517578125, -0.7155914306640625, -0.650665283203125, -0.5857391357421875, -0.52081298828125, -0.4558868408203125, -0.390960693359375, -0.3260345458984375, -0.2611083984375, -0.1961822509765625, -0.131256103515625, -0.0663299560546875, -0.00140380859375, 0.0635223388671875, 0.128448486328125, 0.1933746337890625, 0.25830078125, 0.3232269287109375, 0.388153076171875, 0.4530792236328125, 0.51800537109375, 0.5829315185546875, 0.647857666015625, 0.7127838134765625, 0.7777099609375, 0.8426361083984375, 0.907562255859375, 0.9724884033203125, 1.03741455078125, 1.1023406982421875, 1.167266845703125, 1.2321929931640625, 1.297119140625, 1.3620452880859375, 1.426971435546875, 1.4918975830078125, 1.55682373046875, 1.6217498779296875, 1.686676025390625, 1.7516021728515625, 1.8165283203125, 1.8814544677734375, 1.946380615234375, 2.0113067626953125, 2.07623291015625, 2.1411590576171875, 2.206085205078125, 2.2710113525390625, 2.3359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 13.0, 17.0, 28.0, 35.0, 27.0, 51.0, 87.0, 106.0, 136.0, 206.0, 278.0, 466.0, 697.0, 1061.0, 1975.0, 4467.0, 14969.0, 70633.0, 452920.0, 407743.0, 68157.0, 14622.0, 4571.0, 1995.0, 1133.0, 690.0, 433.0, 280.0, 222.0, 151.0, 106.0, 76.0, 46.0, 41.0, 27.0, 27.0, 12.0, 11.0, 6.0, 6.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-8.0390625, -7.809326171875, -7.57958984375, -7.349853515625, -7.1201171875, -6.890380859375, -6.66064453125, -6.430908203125, -6.201171875, -5.971435546875, -5.74169921875, -5.511962890625, -5.2822265625, -5.052490234375, -4.82275390625, -4.593017578125, -4.36328125, -4.133544921875, -3.90380859375, -3.674072265625, -3.4443359375, -3.214599609375, -2.98486328125, -2.755126953125, -2.525390625, -2.295654296875, -2.06591796875, -1.836181640625, -1.6064453125, -1.376708984375, -1.14697265625, -0.917236328125, -0.6875, -0.457763671875, -0.22802734375, 0.001708984375, 0.2314453125, 0.461181640625, 0.69091796875, 0.920654296875, 1.150390625, 1.380126953125, 1.60986328125, 1.839599609375, 2.0693359375, 2.299072265625, 2.52880859375, 2.758544921875, 2.98828125, 3.218017578125, 3.44775390625, 3.677490234375, 3.9072265625, 4.136962890625, 4.36669921875, 4.596435546875, 4.826171875, 5.055908203125, 5.28564453125, 5.515380859375, 5.7451171875, 5.974853515625, 6.20458984375, 6.434326171875, 6.6640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 9.0, 6.0, 7.0, 10.0, 11.0, 22.0, 30.0, 20.0, 38.0, 27.0, 37.0, 42.0, 49.0, 61.0, 44.0, 47.0, 32.0, 35.0, 47.0, 59.0, 54.0, 38.0, 41.0, 32.0, 36.0, 26.0, 22.0, 20.0, 19.0, 6.0, 7.0, 12.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3209228515625, -9.032470703125, -8.7440185546875, -8.45556640625, -8.1671142578125, -7.878662109375, -7.5902099609375, -7.3017578125, -7.0133056640625, -6.724853515625, -6.4364013671875, -6.14794921875, -5.8594970703125, -5.571044921875, -5.2825927734375, -4.994140625, -4.7056884765625, -4.417236328125, -4.1287841796875, -3.84033203125, -3.5518798828125, -3.263427734375, -2.9749755859375, -2.6865234375, -2.3980712890625, -2.109619140625, -1.8211669921875, -1.53271484375, -1.2442626953125, -0.955810546875, -0.6673583984375, -0.37890625, -0.0904541015625, 0.197998046875, 0.4864501953125, 0.77490234375, 1.0633544921875, 1.351806640625, 1.6402587890625, 1.9287109375, 2.2171630859375, 2.505615234375, 2.7940673828125, 3.08251953125, 3.3709716796875, 3.659423828125, 3.9478759765625, 4.236328125, 4.5247802734375, 4.813232421875, 5.1016845703125, 5.39013671875, 5.6785888671875, 5.967041015625, 6.2554931640625, 6.5439453125, 6.8323974609375, 7.120849609375, 7.4093017578125, 7.69775390625, 7.9862060546875, 8.274658203125, 8.5631103515625, 8.8515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 17.0, 18.0, 22.0, 33.0, 42.0, 79.0, 130.0, 234.0, 475.0, 992.0, 2734.0, 11207.0, 104560.0, 826899.0, 86518.0, 9986.0, 2594.0, 912.0, 441.0, 254.0, 142.0, 59.0, 47.0, 38.0, 18.0, 21.0, 13.0, 11.0, 13.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.765625, -3.64202880859375, -3.5184326171875, -3.39483642578125, -3.271240234375, -3.14764404296875, -3.0240478515625, -2.90045166015625, -2.77685546875, -2.65325927734375, -2.5296630859375, -2.40606689453125, -2.282470703125, -2.15887451171875, -2.0352783203125, -1.91168212890625, -1.7880859375, -1.66448974609375, -1.5408935546875, -1.41729736328125, -1.293701171875, -1.17010498046875, -1.0465087890625, -0.92291259765625, -0.79931640625, -0.67572021484375, -0.5521240234375, -0.42852783203125, -0.304931640625, -0.18133544921875, -0.0577392578125, 0.06585693359375, 0.189453125, 0.31304931640625, 0.4366455078125, 0.56024169921875, 0.683837890625, 0.80743408203125, 0.9310302734375, 1.05462646484375, 1.17822265625, 1.30181884765625, 1.4254150390625, 1.54901123046875, 1.672607421875, 1.79620361328125, 1.9197998046875, 2.04339599609375, 2.1669921875, 2.29058837890625, 2.4141845703125, 2.53778076171875, 2.661376953125, 2.78497314453125, 2.9085693359375, 3.03216552734375, 3.15576171875, 3.27935791015625, 3.4029541015625, 3.52655029296875, 3.650146484375, 3.77374267578125, 3.8973388671875, 4.02093505859375, 4.14453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 20.0, 23.0, 22.0, 43.0, 56.0, 81.0, 104.0, 119.0, 112.0, 106.0, 85.0, 54.0, 46.0, 31.0, 25.0, 21.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006494522094726562, -0.0006244927644729614, -0.0005995333194732666, -0.0005745738744735718, -0.000549614429473877, -0.0005246549844741821, -0.0004996955394744873, -0.0004747360944747925, -0.00044977664947509766, -0.00042481720447540283, -0.000399857759475708, -0.0003748983144760132, -0.00034993886947631836, -0.00032497942447662354, -0.0003000199794769287, -0.0002750605344772339, -0.00025010108947753906, -0.00022514164447784424, -0.00020018219947814941, -0.0001752227544784546, -0.00015026330947875977, -0.00012530386447906494, -0.00010034441947937012, -7.538497447967529e-05, -5.042552947998047e-05, -2.5466084480285645e-05, -5.066394805908203e-07, 2.4452805519104004e-05, 4.941225051879883e-05, 7.437169551849365e-05, 9.933114051818848e-05, 0.0001242905855178833, 0.00014925003051757812, 0.00017420947551727295, 0.00019916892051696777, 0.0002241283655166626, 0.0002490878105163574, 0.00027404725551605225, 0.00029900670051574707, 0.0003239661455154419, 0.0003489255905151367, 0.00037388503551483154, 0.00039884448051452637, 0.0004238039255142212, 0.000448763370513916, 0.00047372281551361084, 0.0004986822605133057, 0.0005236417055130005, 0.0005486011505126953, 0.0005735605955123901, 0.000598520040512085, 0.0006234794855117798, 0.0006484389305114746, 0.0006733983755111694, 0.0006983578205108643, 0.0007233172655105591, 0.0007482767105102539, 0.0007732361555099487, 0.0007981956005096436, 0.0008231550455093384, 0.0008481144905090332, 0.000873073935508728, 0.0008980333805084229, 0.0009229928255081177, 0.0009479522705078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 6.0, 11.0, 15.0, 16.0, 20.0, 27.0, 52.0, 67.0, 84.0, 136.0, 213.0, 354.0, 566.0, 1332.0, 3052.0, 8918.0, 40982.0, 370515.0, 556236.0, 48977.0, 10332.0, 3463.0, 1398.0, 705.0, 386.0, 214.0, 140.0, 102.0, 63.0, 43.0, 29.0, 21.0, 16.0, 19.0, 11.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0], "bins": [-3.33203125, -3.2488250732421875, -3.165618896484375, -3.0824127197265625, -2.99920654296875, -2.9160003662109375, -2.832794189453125, -2.7495880126953125, -2.6663818359375, -2.5831756591796875, -2.499969482421875, -2.4167633056640625, -2.33355712890625, -2.2503509521484375, -2.167144775390625, -2.0839385986328125, -2.000732421875, -1.9175262451171875, -1.834320068359375, -1.7511138916015625, -1.66790771484375, -1.5847015380859375, -1.501495361328125, -1.4182891845703125, -1.3350830078125, -1.2518768310546875, -1.168670654296875, -1.0854644775390625, -1.00225830078125, -0.9190521240234375, -0.835845947265625, -0.7526397705078125, -0.66943359375, -0.5862274169921875, -0.503021240234375, -0.4198150634765625, -0.33660888671875, -0.2534027099609375, -0.170196533203125, -0.0869903564453125, -0.0037841796875, 0.0794219970703125, 0.162628173828125, 0.2458343505859375, 0.32904052734375, 0.4122467041015625, 0.495452880859375, 0.5786590576171875, 0.661865234375, 0.7450714111328125, 0.828277587890625, 0.9114837646484375, 0.99468994140625, 1.0778961181640625, 1.161102294921875, 1.2443084716796875, 1.3275146484375, 1.4107208251953125, 1.493927001953125, 1.5771331787109375, 1.66033935546875, 1.7435455322265625, 1.826751708984375, 1.9099578857421875, 1.9931640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 9.0, 3.0, 16.0, 9.0, 17.0, 23.0, 33.0, 41.0, 38.0, 43.0, 55.0, 61.0, 70.0, 67.0, 61.0, 66.0, 63.0, 49.0, 72.0, 38.0, 37.0, 27.0, 26.0, 18.0, 18.0, 8.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.900390625, -2.82208251953125, -2.7437744140625, -2.66546630859375, -2.587158203125, -2.50885009765625, -2.4305419921875, -2.35223388671875, -2.27392578125, -2.19561767578125, -2.1173095703125, -2.03900146484375, -1.960693359375, -1.88238525390625, -1.8040771484375, -1.72576904296875, -1.6474609375, -1.56915283203125, -1.4908447265625, -1.41253662109375, -1.334228515625, -1.25592041015625, -1.1776123046875, -1.09930419921875, -1.02099609375, -0.94268798828125, -0.8643798828125, -0.78607177734375, -0.707763671875, -0.62945556640625, -0.5511474609375, -0.47283935546875, -0.39453125, -0.31622314453125, -0.2379150390625, -0.15960693359375, -0.081298828125, -0.00299072265625, 0.0753173828125, 0.15362548828125, 0.23193359375, 0.31024169921875, 0.3885498046875, 0.46685791015625, 0.545166015625, 0.62347412109375, 0.7017822265625, 0.78009033203125, 0.8583984375, 0.93670654296875, 1.0150146484375, 1.09332275390625, 1.171630859375, 1.24993896484375, 1.3282470703125, 1.40655517578125, 1.48486328125, 1.56317138671875, 1.6414794921875, 1.71978759765625, 1.798095703125, 1.87640380859375, 1.9547119140625, 2.03302001953125, 2.111328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 39.0, 58.0, 134.0, 248.0, 276.0, 140.0, 48.0, 17.0, 11.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.76946258544922, -73.69979858398438, -70.63014221191406, -67.56047821044922, -64.49081420898438, -61.42115783691406, -58.35149383544922, -55.28183364868164, -52.21217346191406, -49.142513275146484, -46.07284927368164, -43.00318908691406, -39.933528900146484, -36.863868713378906, -33.79420471191406, -30.724544525146484, -27.65488052368164, -24.58521842956543, -21.51555824279785, -18.44589614868164, -15.376235008239746, -12.306573867797852, -9.23691177368164, -6.1672515869140625, -3.0975894927978516, -0.02792811393737793, 3.0417332649230957, 6.111394882202148, 9.181056022644043, 12.250717163085938, 15.320379257202148, 18.390039443969727, 21.459701538085938, 24.52936363220215, 27.599023818969727, 30.668685913085938, 33.738346099853516, 36.808006286621094, 39.87767028808594, 42.947330474853516, 46.016990661621094, 49.08665084838867, 52.156314849853516, 55.225975036621094, 58.29563522338867, 61.36529541015625, 64.4349594116211, 67.50462341308594, 70.57427978515625, 73.6439437866211, 76.7136001586914, 79.78326416015625, 82.8529281616211, 85.9225845336914, 88.99224853515625, 92.06190490722656, 95.13157653808594, 98.20124053955078, 101.2708969116211, 104.34056091308594, 107.41022491455078, 110.4798812866211, 113.54954528808594, 116.61920166015625, 119.6888656616211]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 9.0, 11.0, 24.0, 19.0, 27.0, 23.0, 24.0, 35.0, 37.0, 41.0, 42.0, 50.0, 59.0, 85.0, 79.0, 64.0, 63.0, 42.0, 45.0, 31.0, 33.0, 23.0, 20.0, 21.0, 11.0, 16.0, 15.0, 14.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.24934005737305, -39.95686340332031, -38.66438293457031, -37.37190628051758, -36.07942581176758, -34.786949157714844, -33.494468688964844, -32.20199203491211, -30.909513473510742, -29.617034912109375, -28.324556350708008, -27.03207778930664, -25.739601135253906, -24.447120666503906, -23.154644012451172, -21.862165451049805, -20.569686889648438, -19.27720832824707, -17.984729766845703, -16.692251205444336, -15.399773597717285, -14.107295036315918, -12.814817428588867, -11.5223388671875, -10.229860305786133, -8.937381744384766, -7.644903659820557, -6.352425575256348, -5.0599470138549805, -3.7674684524536133, -2.4749903678894043, -1.1825122833251953, 0.10996246337890625, 1.4024407863616943, 2.6949191093444824, 3.9873974323272705, 5.279875755310059, 6.572354316711426, 7.864832401275635, 9.157310485839844, 10.449789047241211, 11.742267608642578, 13.034746170043945, 14.327223777770996, 15.619702339172363, 16.912181854248047, 18.20465850830078, 19.49713706970215, 20.789615631103516, 22.082094192504883, 23.37457275390625, 24.667051315307617, 25.959529876708984, 27.25200653076172, 28.544485092163086, 29.836963653564453, 31.12944221496582, 32.42192077636719, 33.71439743041992, 35.00687789916992, 36.299354553222656, 37.591835021972656, 38.88431167602539, 40.176788330078125, 41.469268798828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 10.0, 16.0, 27.0, 60.0, 43.0, 85.0, 130.0, 202.0, 289.0, 474.0, 831.0, 1450.0, 2663.0, 5006.0, 9986.0, 22732.0, 60458.0, 220949.0, 1099094.0, 2050605.0, 529648.0, 120425.0, 37642.0, 15765.0, 7131.0, 3609.0, 1997.0, 1135.0, 663.0, 367.0, 286.0, 179.0, 99.0, 72.0, 42.0, 32.0, 20.0, 16.0, 13.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.82421875, -2.7418212890625, -2.659423828125, -2.5770263671875, -2.49462890625, -2.4122314453125, -2.329833984375, -2.2474365234375, -2.1650390625, -2.0826416015625, -2.000244140625, -1.9178466796875, -1.83544921875, -1.7530517578125, -1.670654296875, -1.5882568359375, -1.505859375, -1.4234619140625, -1.341064453125, -1.2586669921875, -1.17626953125, -1.0938720703125, -1.011474609375, -0.9290771484375, -0.8466796875, -0.7642822265625, -0.681884765625, -0.5994873046875, -0.51708984375, -0.4346923828125, -0.352294921875, -0.2698974609375, -0.1875, -0.1051025390625, -0.022705078125, 0.0596923828125, 0.14208984375, 0.2244873046875, 0.306884765625, 0.3892822265625, 0.4716796875, 0.5540771484375, 0.636474609375, 0.7188720703125, 0.80126953125, 0.8836669921875, 0.966064453125, 1.0484619140625, 1.130859375, 1.2132568359375, 1.295654296875, 1.3780517578125, 1.46044921875, 1.5428466796875, 1.625244140625, 1.7076416015625, 1.7900390625, 1.8724365234375, 1.954833984375, 2.0372314453125, 2.11962890625, 2.2020263671875, 2.284423828125, 2.3668212890625, 2.44921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 6.0, 2.0, 13.0, 8.0, 9.0, 10.0, 16.0, 19.0, 18.0, 22.0, 24.0, 24.0, 31.0, 32.0, 34.0, 45.0, 37.0, 37.0, 33.0, 43.0, 40.0, 53.0, 47.0, 40.0, 42.0, 34.0, 25.0, 20.0, 27.0, 28.0, 34.0, 20.0, 24.0, 17.0, 17.0, 11.0, 17.0, 7.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.736328125, -1.67926025390625, -1.6221923828125, -1.56512451171875, -1.508056640625, -1.45098876953125, -1.3939208984375, -1.33685302734375, -1.27978515625, -1.22271728515625, -1.1656494140625, -1.10858154296875, -1.051513671875, -0.99444580078125, -0.9373779296875, -0.88031005859375, -0.8232421875, -0.76617431640625, -0.7091064453125, -0.65203857421875, -0.594970703125, -0.53790283203125, -0.4808349609375, -0.42376708984375, -0.36669921875, -0.30963134765625, -0.2525634765625, -0.19549560546875, -0.138427734375, -0.08135986328125, -0.0242919921875, 0.03277587890625, 0.08984375, 0.14691162109375, 0.2039794921875, 0.26104736328125, 0.318115234375, 0.37518310546875, 0.4322509765625, 0.48931884765625, 0.54638671875, 0.60345458984375, 0.6605224609375, 0.71759033203125, 0.774658203125, 0.83172607421875, 0.8887939453125, 0.94586181640625, 1.0029296875, 1.05999755859375, 1.1170654296875, 1.17413330078125, 1.231201171875, 1.28826904296875, 1.3453369140625, 1.40240478515625, 1.45947265625, 1.51654052734375, 1.5736083984375, 1.63067626953125, 1.687744140625, 1.74481201171875, 1.8018798828125, 1.85894775390625, 1.916015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 0.0, 6.0, 9.0, 6.0, 17.0, 13.0, 19.0, 27.0, 45.0, 57.0, 95.0, 133.0, 229.0, 368.0, 706.0, 1392.0, 2983.0, 7870.0, 25697.0, 112717.0, 1446766.0, 2400701.0, 149808.0, 30226.0, 8500.0, 3053.0, 1265.0, 616.0, 365.0, 219.0, 124.0, 82.0, 48.0, 36.0, 27.0, 13.0, 11.0, 7.0, 4.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.01953125, -5.84796142578125, -5.6763916015625, -5.50482177734375, -5.333251953125, -5.16168212890625, -4.9901123046875, -4.81854248046875, -4.64697265625, -4.47540283203125, -4.3038330078125, -4.13226318359375, -3.960693359375, -3.78912353515625, -3.6175537109375, -3.44598388671875, -3.2744140625, -3.10284423828125, -2.9312744140625, -2.75970458984375, -2.588134765625, -2.41656494140625, -2.2449951171875, -2.07342529296875, -1.90185546875, -1.73028564453125, -1.5587158203125, -1.38714599609375, -1.215576171875, -1.04400634765625, -0.8724365234375, -0.70086669921875, -0.529296875, -0.35772705078125, -0.1861572265625, -0.01458740234375, 0.156982421875, 0.32855224609375, 0.5001220703125, 0.67169189453125, 0.84326171875, 1.01483154296875, 1.1864013671875, 1.35797119140625, 1.529541015625, 1.70111083984375, 1.8726806640625, 2.04425048828125, 2.2158203125, 2.38739013671875, 2.5589599609375, 2.73052978515625, 2.902099609375, 3.07366943359375, 3.2452392578125, 3.41680908203125, 3.58837890625, 3.75994873046875, 3.9315185546875, 4.10308837890625, 4.274658203125, 4.44622802734375, 4.6177978515625, 4.78936767578125, 4.9609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 10.0, 12.0, 20.0, 24.0, 33.0, 50.0, 54.0, 94.0, 182.0, 306.0, 513.0, 883.0, 774.0, 447.0, 235.0, 120.0, 91.0, 48.0, 41.0, 27.0, 21.0, 25.0, 14.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.71160888671875, -5.4818115234375, -5.25201416015625, -5.022216796875, -4.79241943359375, -4.5626220703125, -4.33282470703125, -4.10302734375, -3.87322998046875, -3.6434326171875, -3.41363525390625, -3.183837890625, -2.95404052734375, -2.7242431640625, -2.49444580078125, -2.2646484375, -2.03485107421875, -1.8050537109375, -1.57525634765625, -1.345458984375, -1.11566162109375, -0.8858642578125, -0.65606689453125, -0.42626953125, -0.19647216796875, 0.0333251953125, 0.26312255859375, 0.492919921875, 0.72271728515625, 0.9525146484375, 1.18231201171875, 1.412109375, 1.64190673828125, 1.8717041015625, 2.10150146484375, 2.331298828125, 2.56109619140625, 2.7908935546875, 3.02069091796875, 3.25048828125, 3.48028564453125, 3.7100830078125, 3.93988037109375, 4.169677734375, 4.39947509765625, 4.6292724609375, 4.85906982421875, 5.0888671875, 5.31866455078125, 5.5484619140625, 5.77825927734375, 6.008056640625, 6.23785400390625, 6.4676513671875, 6.69744873046875, 6.92724609375, 7.15704345703125, 7.3868408203125, 7.61663818359375, 7.846435546875, 8.07623291015625, 8.3060302734375, 8.53582763671875, 8.765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 13.0, 26.0, 56.0, 109.0, 182.0, 224.0, 181.0, 98.0, 56.0, 19.0, 5.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.60877990722656, -88.32697296142578, -86.04515838623047, -83.76335144042969, -81.48153686523438, -79.1997299194336, -76.91792297363281, -74.6361083984375, -72.35430145263672, -70.07249450683594, -67.79067993164062, -65.50887298583984, -63.2270622253418, -60.94525146484375, -58.66344451904297, -56.38163375854492, -54.099822998046875, -51.81801223754883, -49.53620147705078, -47.25439453125, -44.97258377075195, -42.690773010253906, -40.408966064453125, -38.12715530395508, -35.84534454345703, -33.563533782958984, -31.28172492980957, -28.999916076660156, -26.71810531616211, -24.436294555664062, -22.15448570251465, -19.872676849365234, -17.590858459472656, -15.309048652648926, -13.027238845825195, -10.745429039001465, -8.463619232177734, -6.181809425354004, -3.8999996185302734, -1.618189811706543, 0.6636199951171875, 2.945429801940918, 5.227239608764648, 7.509049415588379, 9.79085922241211, 12.07266902923584, 14.35447883605957, 16.636287689208984, 18.91809844970703, 21.199909210205078, 23.481718063354492, 25.763526916503906, 28.045337677001953, 30.3271484375, 32.60895538330078, 34.89076614379883, 37.172576904296875, 39.45438766479492, 41.73619842529297, 44.01800537109375, 46.2998161315918, 48.581626892089844, 50.863433837890625, 53.14524459838867, 55.42705535888672]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 2.0, 6.0, 12.0, 18.0, 12.0, 15.0, 15.0, 25.0, 22.0, 38.0, 40.0, 32.0, 36.0, 38.0, 48.0, 48.0, 52.0, 54.0, 47.0, 52.0, 38.0, 46.0, 40.0, 33.0, 35.0, 26.0, 24.0, 21.0, 19.0, 17.0, 10.0, 14.0, 11.0, 7.0, 6.0, 9.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.809492111206055, -28.851871490478516, -27.89425277709961, -26.936634063720703, -25.979013442993164, -25.021392822265625, -24.06377410888672, -23.106155395507812, -22.148534774780273, -21.190914154052734, -20.233295440673828, -19.275676727294922, -18.318056106567383, -17.360435485839844, -16.402816772460938, -15.445197105407715, -14.487577438354492, -13.52995777130127, -12.572338104248047, -11.614718437194824, -10.657098770141602, -9.699479103088379, -8.741859436035156, -7.784239768981934, -6.826620101928711, -5.869000434875488, -4.911380767822266, -3.953761100769043, -2.9961414337158203, -2.0385217666625977, -1.080902099609375, -0.12328243255615234, 0.8343353271484375, 1.7919549942016602, 2.749574661254883, 3.7071943283081055, 4.664813995361328, 5.622433662414551, 6.580053329467773, 7.537672996520996, 8.495292663574219, 9.452912330627441, 10.410531997680664, 11.368151664733887, 12.32577133178711, 13.283390998840332, 14.241010665893555, 15.198630332946777, 16.15625, 17.113868713378906, 18.071489334106445, 19.029109954833984, 19.98672866821289, 20.944347381591797, 21.901968002319336, 22.859588623046875, 23.81720733642578, 24.774826049804688, 25.732446670532227, 26.690067291259766, 27.647686004638672, 28.605304718017578, 29.562925338745117, 30.520545959472656, 31.478164672851562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 14.0, 27.0, 36.0, 36.0, 65.0, 95.0, 108.0, 199.0, 261.0, 402.0, 601.0, 887.0, 1279.0, 1930.0, 3016.0, 4776.0, 7797.0, 12091.0, 19917.0, 32504.0, 53498.0, 86309.0, 138731.0, 196898.0, 179528.0, 117306.0, 72577.0, 44645.0, 27455.0, 16824.0, 10410.0, 6509.0, 4144.0, 2563.0, 1628.0, 1115.0, 757.0, 495.0, 347.0, 232.0, 155.0, 122.0, 80.0, 47.0, 51.0, 28.0, 20.0, 12.0, 11.0, 6.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.443359375, -2.3665771484375, -2.289794921875, -2.2130126953125, -2.13623046875, -2.0594482421875, -1.982666015625, -1.9058837890625, -1.8291015625, -1.7523193359375, -1.675537109375, -1.5987548828125, -1.52197265625, -1.4451904296875, -1.368408203125, -1.2916259765625, -1.21484375, -1.1380615234375, -1.061279296875, -0.9844970703125, -0.90771484375, -0.8309326171875, -0.754150390625, -0.6773681640625, -0.6005859375, -0.5238037109375, -0.447021484375, -0.3702392578125, -0.29345703125, -0.2166748046875, -0.139892578125, -0.0631103515625, 0.013671875, 0.0904541015625, 0.167236328125, 0.2440185546875, 0.32080078125, 0.3975830078125, 0.474365234375, 0.5511474609375, 0.6279296875, 0.7047119140625, 0.781494140625, 0.8582763671875, 0.93505859375, 1.0118408203125, 1.088623046875, 1.1654052734375, 1.2421875, 1.3189697265625, 1.395751953125, 1.4725341796875, 1.54931640625, 1.6260986328125, 1.702880859375, 1.7796630859375, 1.8564453125, 1.9332275390625, 2.010009765625, 2.0867919921875, 2.16357421875, 2.2403564453125, 2.317138671875, 2.3939208984375, 2.470703125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 3.0, 7.0, 12.0, 11.0, 18.0, 24.0, 23.0, 18.0, 32.0, 25.0, 23.0, 37.0, 33.0, 27.0, 46.0, 47.0, 46.0, 49.0, 47.0, 57.0, 39.0, 44.0, 34.0, 38.0, 32.0, 31.0, 26.0, 28.0, 28.0, 18.0, 15.0, 14.0, 13.0, 12.0, 6.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.821197509765625, -1.75567626953125, -1.690155029296875, -1.6246337890625, -1.559112548828125, -1.49359130859375, -1.428070068359375, -1.362548828125, -1.297027587890625, -1.23150634765625, -1.165985107421875, -1.1004638671875, -1.034942626953125, -0.96942138671875, -0.903900146484375, -0.83837890625, -0.772857666015625, -0.70733642578125, -0.641815185546875, -0.5762939453125, -0.510772705078125, -0.44525146484375, -0.379730224609375, -0.314208984375, -0.248687744140625, -0.18316650390625, -0.117645263671875, -0.0521240234375, 0.013397216796875, 0.07891845703125, 0.144439697265625, 0.2099609375, 0.275482177734375, 0.34100341796875, 0.406524658203125, 0.4720458984375, 0.537567138671875, 0.60308837890625, 0.668609619140625, 0.734130859375, 0.799652099609375, 0.86517333984375, 0.930694580078125, 0.9962158203125, 1.061737060546875, 1.12725830078125, 1.192779541015625, 1.25830078125, 1.323822021484375, 1.38934326171875, 1.454864501953125, 1.5203857421875, 1.585906982421875, 1.65142822265625, 1.716949462890625, 1.782470703125, 1.847991943359375, 1.91351318359375, 1.979034423828125, 2.0445556640625, 2.110076904296875, 2.17559814453125, 2.241119384765625, 2.306640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 12.0, 8.0, 21.0, 17.0, 22.0, 41.0, 55.0, 82.0, 97.0, 143.0, 216.0, 296.0, 438.0, 665.0, 1362.0, 2640.0, 7109.0, 27737.0, 151381.0, 663978.0, 151650.0, 27445.0, 7111.0, 2580.0, 1225.0, 757.0, 423.0, 315.0, 202.0, 159.0, 102.0, 71.0, 44.0, 33.0, 18.0, 23.0, 27.0, 13.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.4505615234375, -7.197998046875, -6.9454345703125, -6.69287109375, -6.4403076171875, -6.187744140625, -5.9351806640625, -5.6826171875, -5.4300537109375, -5.177490234375, -4.9249267578125, -4.67236328125, -4.4197998046875, -4.167236328125, -3.9146728515625, -3.662109375, -3.4095458984375, -3.156982421875, -2.9044189453125, -2.65185546875, -2.3992919921875, -2.146728515625, -1.8941650390625, -1.6416015625, -1.3890380859375, -1.136474609375, -0.8839111328125, -0.63134765625, -0.3787841796875, -0.126220703125, 0.1263427734375, 0.37890625, 0.6314697265625, 0.884033203125, 1.1365966796875, 1.38916015625, 1.6417236328125, 1.894287109375, 2.1468505859375, 2.3994140625, 2.6519775390625, 2.904541015625, 3.1571044921875, 3.40966796875, 3.6622314453125, 3.914794921875, 4.1673583984375, 4.419921875, 4.6724853515625, 4.925048828125, 5.1776123046875, 5.43017578125, 5.6827392578125, 5.935302734375, 6.1878662109375, 6.4404296875, 6.6929931640625, 6.945556640625, 7.1981201171875, 7.45068359375, 7.7032470703125, 7.955810546875, 8.2083740234375, 8.4609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 10.0, 12.0, 13.0, 10.0, 11.0, 30.0, 22.0, 21.0, 29.0, 33.0, 36.0, 45.0, 37.0, 40.0, 46.0, 44.0, 45.0, 50.0, 41.0, 46.0, 43.0, 39.0, 32.0, 40.0, 34.0, 27.0, 22.0, 19.0, 10.0, 25.0, 12.0, 11.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.671875, -8.4130859375, -8.154296875, -7.8955078125, -7.63671875, -7.3779296875, -7.119140625, -6.8603515625, -6.6015625, -6.3427734375, -6.083984375, -5.8251953125, -5.56640625, -5.3076171875, -5.048828125, -4.7900390625, -4.53125, -4.2724609375, -4.013671875, -3.7548828125, -3.49609375, -3.2373046875, -2.978515625, -2.7197265625, -2.4609375, -2.2021484375, -1.943359375, -1.6845703125, -1.42578125, -1.1669921875, -0.908203125, -0.6494140625, -0.390625, -0.1318359375, 0.126953125, 0.3857421875, 0.64453125, 0.9033203125, 1.162109375, 1.4208984375, 1.6796875, 1.9384765625, 2.197265625, 2.4560546875, 2.71484375, 2.9736328125, 3.232421875, 3.4912109375, 3.75, 4.0087890625, 4.267578125, 4.5263671875, 4.78515625, 5.0439453125, 5.302734375, 5.5615234375, 5.8203125, 6.0791015625, 6.337890625, 6.5966796875, 6.85546875, 7.1142578125, 7.373046875, 7.6318359375, 7.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 10.0, 11.0, 22.0, 33.0, 54.0, 100.0, 209.0, 443.0, 1286.0, 5292.0, 44436.0, 687968.0, 282725.0, 21314.0, 3080.0, 857.0, 348.0, 141.0, 75.0, 40.0, 25.0, 21.0, 13.0, 13.0, 2.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.852294921875, -2.75341796875, -2.654541015625, -2.5556640625, -2.456787109375, -2.35791015625, -2.259033203125, -2.16015625, -2.061279296875, -1.96240234375, -1.863525390625, -1.7646484375, -1.665771484375, -1.56689453125, -1.468017578125, -1.369140625, -1.270263671875, -1.17138671875, -1.072509765625, -0.9736328125, -0.874755859375, -0.77587890625, -0.677001953125, -0.578125, -0.479248046875, -0.38037109375, -0.281494140625, -0.1826171875, -0.083740234375, 0.01513671875, 0.114013671875, 0.212890625, 0.311767578125, 0.41064453125, 0.509521484375, 0.6083984375, 0.707275390625, 0.80615234375, 0.905029296875, 1.00390625, 1.102783203125, 1.20166015625, 1.300537109375, 1.3994140625, 1.498291015625, 1.59716796875, 1.696044921875, 1.794921875, 1.893798828125, 1.99267578125, 2.091552734375, 2.1904296875, 2.289306640625, 2.38818359375, 2.487060546875, 2.5859375, 2.684814453125, 2.78369140625, 2.882568359375, 2.9814453125, 3.080322265625, 3.17919921875, 3.278076171875, 3.376953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 8.0, 11.0, 10.0, 23.0, 22.0, 25.0, 25.0, 37.0, 34.0, 56.0, 64.0, 70.0, 64.0, 88.0, 80.0, 63.0, 76.0, 43.0, 39.0, 40.0, 26.0, 20.0, 8.0, 14.0, 14.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.00061798095703125, -0.00060218945145607, -0.0005863979458808899, -0.0005706064403057098, -0.0005548149347305298, -0.0005390234291553497, -0.0005232319235801697, -0.0005074404180049896, -0.0004916489124298096, -0.0004758574068546295, -0.00046006590127944946, -0.0004442743957042694, -0.00042848289012908936, -0.0004126913845539093, -0.00039689987897872925, -0.0003811083734035492, -0.00036531686782836914, -0.0003495253622531891, -0.00033373385667800903, -0.000317942351102829, -0.0003021508455276489, -0.00028635933995246887, -0.0002705678343772888, -0.00025477632880210876, -0.0002389848232269287, -0.00022319331765174866, -0.0002074018120765686, -0.00019161030650138855, -0.0001758188009262085, -0.00016002729535102844, -0.0001442357897758484, -0.00012844428420066833, -0.00011265277862548828, -9.686127305030823e-05, -8.106976747512817e-05, -6.527826189994812e-05, -4.9486756324768066e-05, -3.369525074958801e-05, -1.790374517440796e-05, -2.1122395992279053e-06, 1.3679265975952148e-05, 2.9470771551132202e-05, 4.5262277126312256e-05, 6.105378270149231e-05, 7.684528827667236e-05, 9.263679385185242e-05, 0.00010842829942703247, 0.00012421980500221252, 0.00014001131057739258, 0.00015580281615257263, 0.00017159432172775269, 0.00018738582730293274, 0.0002031773328781128, 0.00021896883845329285, 0.0002347603440284729, 0.00025055184960365295, 0.000266343355178833, 0.00028213486075401306, 0.0002979263663291931, 0.00031371787190437317, 0.0003295093774795532, 0.0003453008830547333, 0.00036109238862991333, 0.0003768838942050934, 0.00039267539978027344]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 13.0, 14.0, 19.0, 18.0, 19.0, 40.0, 68.0, 86.0, 122.0, 209.0, 376.0, 586.0, 1094.0, 2354.0, 6404.0, 24411.0, 136601.0, 629740.0, 197882.0, 34418.0, 8182.0, 2742.0, 1299.0, 677.0, 434.0, 252.0, 146.0, 106.0, 65.0, 57.0, 25.0, 20.0, 25.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0], "bins": [-2.068359375, -2.0118560791015625, -1.955352783203125, -1.8988494873046875, -1.84234619140625, -1.7858428955078125, -1.729339599609375, -1.6728363037109375, -1.6163330078125, -1.5598297119140625, -1.503326416015625, -1.4468231201171875, -1.39031982421875, -1.3338165283203125, -1.277313232421875, -1.2208099365234375, -1.164306640625, -1.1078033447265625, -1.051300048828125, -0.9947967529296875, -0.93829345703125, -0.8817901611328125, -0.825286865234375, -0.7687835693359375, -0.7122802734375, -0.6557769775390625, -0.599273681640625, -0.5427703857421875, -0.48626708984375, -0.4297637939453125, -0.373260498046875, -0.3167572021484375, -0.26025390625, -0.2037506103515625, -0.147247314453125, -0.0907440185546875, -0.03424072265625, 0.0222625732421875, 0.078765869140625, 0.1352691650390625, 0.1917724609375, 0.2482757568359375, 0.304779052734375, 0.3612823486328125, 0.41778564453125, 0.4742889404296875, 0.530792236328125, 0.5872955322265625, 0.643798828125, 0.7003021240234375, 0.756805419921875, 0.8133087158203125, 0.86981201171875, 0.9263153076171875, 0.982818603515625, 1.0393218994140625, 1.0958251953125, 1.1523284912109375, 1.208831787109375, 1.2653350830078125, 1.32183837890625, 1.3783416748046875, 1.434844970703125, 1.4913482666015625, 1.5478515625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 22.0, 19.0, 24.0, 42.0, 46.0, 58.0, 72.0, 74.0, 84.0, 84.0, 77.0, 64.0, 66.0, 41.0, 46.0, 31.0, 30.0, 19.0, 24.0, 16.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.963592529296875, -1.89593505859375, -1.828277587890625, -1.7606201171875, -1.692962646484375, -1.62530517578125, -1.557647705078125, -1.489990234375, -1.422332763671875, -1.35467529296875, -1.287017822265625, -1.2193603515625, -1.151702880859375, -1.08404541015625, -1.016387939453125, -0.94873046875, -0.881072998046875, -0.81341552734375, -0.745758056640625, -0.6781005859375, -0.610443115234375, -0.54278564453125, -0.475128173828125, -0.407470703125, -0.339813232421875, -0.27215576171875, -0.204498291015625, -0.1368408203125, -0.069183349609375, -0.00152587890625, 0.066131591796875, 0.1337890625, 0.201446533203125, 0.26910400390625, 0.336761474609375, 0.4044189453125, 0.472076416015625, 0.53973388671875, 0.607391357421875, 0.675048828125, 0.742706298828125, 0.81036376953125, 0.878021240234375, 0.9456787109375, 1.013336181640625, 1.08099365234375, 1.148651123046875, 1.21630859375, 1.283966064453125, 1.35162353515625, 1.419281005859375, 1.4869384765625, 1.554595947265625, 1.62225341796875, 1.689910888671875, 1.757568359375, 1.825225830078125, 1.89288330078125, 1.960540771484375, 2.0281982421875, 2.095855712890625, 2.16351318359375, 2.231170654296875, 2.298828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 13.0, 43.0, 87.0, 185.0, 329.0, 170.0, 98.0, 32.0, 22.0, 9.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.013771057128906, -39.45927047729492, -36.90476989746094, -34.35026931762695, -31.79576873779297, -29.241268157958984, -26.686769485473633, -24.13226890563965, -21.577768325805664, -19.02326774597168, -16.468767166137695, -13.914267539978027, -11.359766960144043, -8.805266380310059, -6.250766754150391, -3.6962661743164062, -1.1417655944824219, 1.4127347469329834, 3.9672350883483887, 6.521735191345215, 9.0762357711792, 11.630736351013184, 14.185235977172852, 16.739736557006836, 19.29423713684082, 21.848737716674805, 24.40323829650879, 26.95773696899414, 29.512237548828125, 32.06673812866211, 34.621238708496094, 37.17573928833008, 39.73023986816406, 42.28474044799805, 44.83924102783203, 47.393741607666016, 49.9482421875, 52.502742767333984, 55.05724334716797, 57.61174011230469, 60.16624450683594, 62.72074508666992, 65.2752456665039, 67.82974243164062, 70.38424682617188, 72.9387435913086, 75.49324798583984, 78.04774475097656, 80.60224914550781, 83.15674591064453, 85.71125030517578, 88.2657470703125, 90.82025146484375, 93.37474822998047, 95.92925262451172, 98.48374938964844, 101.03824615478516, 103.59274291992188, 106.14724731445312, 108.70174407958984, 111.2562484741211, 113.81074523925781, 116.36524963378906, 118.91974639892578, 121.47425079345703]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 6.0, 10.0, 12.0, 16.0, 22.0, 17.0, 14.0, 29.0, 19.0, 27.0, 23.0, 39.0, 32.0, 58.0, 57.0, 74.0, 74.0, 70.0, 57.0, 35.0, 27.0, 30.0, 21.0, 35.0, 23.0, 23.0, 22.0, 11.0, 25.0, 14.0, 14.0, 10.0, 5.0, 5.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.208620071411133, -28.090166091918945, -26.971712112426758, -25.853260040283203, -24.734806060791016, -23.616352081298828, -22.49789810180664, -21.379444122314453, -20.260990142822266, -19.142536163330078, -18.02408218383789, -16.905628204345703, -15.787176132202148, -14.668722152709961, -13.550268173217773, -12.431814193725586, -11.313362121582031, -10.194908142089844, -9.076455116271973, -7.958001136779785, -6.839547634124756, -5.721094131469727, -4.602640151977539, -3.4841866493225098, -2.3657331466674805, -1.2472795248031616, -0.12882590293884277, 0.9896278381347656, 2.108081340789795, 3.226534843444824, 4.344988822937012, 5.463442325592041, 6.581897735595703, 7.700351238250732, 8.818804740905762, 9.93725872039795, 11.05571174621582, 12.174165725708008, 13.292619705200195, 14.411073684692383, 15.529526710510254, 16.647979736328125, 17.766433715820312, 18.8848876953125, 20.003341674804688, 21.121795654296875, 22.240249633789062, 23.358701705932617, 24.477155685424805, 25.595609664916992, 26.71406364440918, 27.832515716552734, 28.950969696044922, 30.06942367553711, 31.187877655029297, 32.306331634521484, 33.42478561401367, 34.54323959350586, 35.66169357299805, 36.780147552490234, 37.89860153198242, 39.017051696777344, 40.13550567626953, 41.25395965576172, 42.372413635253906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 12.0, 10.0, 23.0, 21.0, 40.0, 36.0, 57.0, 89.0, 116.0, 175.0, 302.0, 411.0, 700.0, 1258.0, 2065.0, 4104.0, 8281.0, 19068.0, 55098.0, 199591.0, 816033.0, 1932890.0, 849982.0, 210382.0, 56008.0, 19383.0, 8455.0, 4236.0, 2175.0, 1248.0, 724.0, 411.0, 264.0, 185.0, 125.0, 101.0, 68.0, 49.0, 21.0, 25.0, 16.0, 9.0, 14.0, 8.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8740234375, -1.8083038330078125, -1.742584228515625, -1.6768646240234375, -1.61114501953125, -1.5454254150390625, -1.479705810546875, -1.4139862060546875, -1.3482666015625, -1.2825469970703125, -1.216827392578125, -1.1511077880859375, -1.08538818359375, -1.0196685791015625, -0.953948974609375, -0.8882293701171875, -0.822509765625, -0.7567901611328125, -0.691070556640625, -0.6253509521484375, -0.55963134765625, -0.4939117431640625, -0.428192138671875, -0.3624725341796875, -0.2967529296875, -0.2310333251953125, -0.165313720703125, -0.0995941162109375, -0.03387451171875, 0.0318450927734375, 0.097564697265625, 0.1632843017578125, 0.22900390625, 0.2947235107421875, 0.360443115234375, 0.4261627197265625, 0.49188232421875, 0.5576019287109375, 0.623321533203125, 0.6890411376953125, 0.7547607421875, 0.8204803466796875, 0.886199951171875, 0.9519195556640625, 1.01763916015625, 1.0833587646484375, 1.149078369140625, 1.2147979736328125, 1.280517578125, 1.3462371826171875, 1.411956787109375, 1.4776763916015625, 1.54339599609375, 1.6091156005859375, 1.674835205078125, 1.7405548095703125, 1.8062744140625, 1.8719940185546875, 1.937713623046875, 2.0034332275390625, 2.06915283203125, 2.1348724365234375, 2.200592041015625, 2.2663116455078125, 2.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 4.0, 5.0, 9.0, 9.0, 15.0, 15.0, 18.0, 11.0, 24.0, 20.0, 25.0, 23.0, 33.0, 44.0, 43.0, 43.0, 51.0, 35.0, 42.0, 36.0, 45.0, 39.0, 49.0, 43.0, 33.0, 32.0, 34.0, 36.0, 33.0, 24.0, 22.0, 17.0, 15.0, 17.0, 10.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.850738525390625, -1.79034423828125, -1.729949951171875, -1.6695556640625, -1.609161376953125, -1.54876708984375, -1.488372802734375, -1.427978515625, -1.367584228515625, -1.30718994140625, -1.246795654296875, -1.1864013671875, -1.126007080078125, -1.06561279296875, -1.005218505859375, -0.94482421875, -0.884429931640625, -0.82403564453125, -0.763641357421875, -0.7032470703125, -0.642852783203125, -0.58245849609375, -0.522064208984375, -0.461669921875, -0.401275634765625, -0.34088134765625, -0.280487060546875, -0.2200927734375, -0.159698486328125, -0.09930419921875, -0.038909912109375, 0.021484375, 0.081878662109375, 0.14227294921875, 0.202667236328125, 0.2630615234375, 0.323455810546875, 0.38385009765625, 0.444244384765625, 0.504638671875, 0.565032958984375, 0.62542724609375, 0.685821533203125, 0.7462158203125, 0.806610107421875, 0.86700439453125, 0.927398681640625, 0.98779296875, 1.048187255859375, 1.10858154296875, 1.168975830078125, 1.2293701171875, 1.289764404296875, 1.35015869140625, 1.410552978515625, 1.470947265625, 1.531341552734375, 1.59173583984375, 1.652130126953125, 1.7125244140625, 1.772918701171875, 1.83331298828125, 1.893707275390625, 1.9541015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 15.0, 15.0, 16.0, 38.0, 60.0, 87.0, 146.0, 264.0, 700.0, 3323.0, 33627.0, 3718555.0, 424765.0, 10185.0, 1583.0, 506.0, 184.0, 99.0, 46.0, 23.0, 20.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.783447265625, -12.42626953125, -12.069091796875, -11.7119140625, -11.354736328125, -10.99755859375, -10.640380859375, -10.283203125, -9.926025390625, -9.56884765625, -9.211669921875, -8.8544921875, -8.497314453125, -8.14013671875, -7.782958984375, -7.42578125, -7.068603515625, -6.71142578125, -6.354248046875, -5.9970703125, -5.639892578125, -5.28271484375, -4.925537109375, -4.568359375, -4.211181640625, -3.85400390625, -3.496826171875, -3.1396484375, -2.782470703125, -2.42529296875, -2.068115234375, -1.7109375, -1.353759765625, -0.99658203125, -0.639404296875, -0.2822265625, 0.074951171875, 0.43212890625, 0.789306640625, 1.146484375, 1.503662109375, 1.86083984375, 2.218017578125, 2.5751953125, 2.932373046875, 3.28955078125, 3.646728515625, 4.00390625, 4.361083984375, 4.71826171875, 5.075439453125, 5.4326171875, 5.789794921875, 6.14697265625, 6.504150390625, 6.861328125, 7.218505859375, 7.57568359375, 7.932861328125, 8.2900390625, 8.647216796875, 9.00439453125, 9.361572265625, 9.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 18.0, 36.0, 52.0, 99.0, 174.0, 366.0, 886.0, 1184.0, 652.0, 282.0, 131.0, 75.0, 45.0, 24.0, 12.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -12.072509765625, -11.79345703125, -11.514404296875, -11.2353515625, -10.956298828125, -10.67724609375, -10.398193359375, -10.119140625, -9.840087890625, -9.56103515625, -9.281982421875, -9.0029296875, -8.723876953125, -8.44482421875, -8.165771484375, -7.88671875, -7.607666015625, -7.32861328125, -7.049560546875, -6.7705078125, -6.491455078125, -6.21240234375, -5.933349609375, -5.654296875, -5.375244140625, -5.09619140625, -4.817138671875, -4.5380859375, -4.259033203125, -3.97998046875, -3.700927734375, -3.421875, -3.142822265625, -2.86376953125, -2.584716796875, -2.3056640625, -2.026611328125, -1.74755859375, -1.468505859375, -1.189453125, -0.910400390625, -0.63134765625, -0.352294921875, -0.0732421875, 0.205810546875, 0.48486328125, 0.763916015625, 1.04296875, 1.322021484375, 1.60107421875, 1.880126953125, 2.1591796875, 2.438232421875, 2.71728515625, 2.996337890625, 3.275390625, 3.554443359375, 3.83349609375, 4.112548828125, 4.3916015625, 4.670654296875, 4.94970703125, 5.228759765625, 5.5078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 27.0, 48.0, 80.0, 140.0, 183.0, 166.0, 136.0, 83.0, 40.0, 21.0, 13.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.324188232421875, -41.77286911010742, -40.221553802490234, -38.67023468017578, -37.118919372558594, -35.56760025024414, -34.01628112792969, -32.4649658203125, -30.913646697998047, -29.362329483032227, -27.811012268066406, -26.259693145751953, -24.708375930786133, -23.157058715820312, -21.60573959350586, -20.05442237854004, -18.50310516357422, -16.9517879486084, -15.400469779968262, -13.849151611328125, -12.297834396362305, -10.746517181396484, -9.195199012756348, -7.643880844116211, -6.092563629150391, -4.541245937347412, -2.9899282455444336, -1.438610553741455, 0.11270713806152344, 1.664024829864502, 3.2153425216674805, 4.766660690307617, 6.317981719970703, 7.869299411773682, 9.42061710357666, 10.971935272216797, 12.523252487182617, 14.074569702148438, 15.625887870788574, 17.17720603942871, 18.72852325439453, 20.27984046936035, 21.831157684326172, 23.382476806640625, 24.933794021606445, 26.485111236572266, 28.03643035888672, 29.58774757385254, 31.13906478881836, 32.69038391113281, 34.24169921875, 35.79301834106445, 37.344337463378906, 38.895652770996094, 40.44697189331055, 41.998291015625, 43.54960632324219, 45.10092544555664, 46.65224075317383, 48.20355987548828, 49.75487518310547, 51.30619430541992, 52.857513427734375, 54.40882873535156, 55.960147857666016]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 10.0, 10.0, 14.0, 23.0, 22.0, 32.0, 24.0, 32.0, 29.0, 36.0, 45.0, 56.0, 44.0, 47.0, 47.0, 41.0, 49.0, 55.0, 47.0, 33.0, 43.0, 27.0, 39.0, 19.0, 31.0, 19.0, 16.0, 24.0, 25.0, 18.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.42144012451172, -25.6193790435791, -24.81731605529785, -24.015254974365234, -23.213191986083984, -22.411130905151367, -21.609067916870117, -20.8070068359375, -20.00494384765625, -19.202882766723633, -18.400819778442383, -17.598758697509766, -16.796695709228516, -15.994634628295898, -15.192571640014648, -14.390510559082031, -13.588448524475098, -12.786386489868164, -11.98432445526123, -11.182262420654297, -10.380200386047363, -9.57813835144043, -8.776077270507812, -7.974014759063721, -7.171952724456787, -6.3698906898498535, -5.56782865524292, -4.7657670974731445, -3.963704824447632, -3.1616430282592773, -2.3595809936523438, -1.5575189590454102, -0.7554569244384766, 0.046605050563812256, 0.8486670255661011, 1.6507289409637451, 2.4527909755706787, 3.254852771759033, 4.056914806365967, 4.8589768409729, 5.661038875579834, 6.463100910186768, 7.265162944793701, 8.067224502563477, 8.86928653717041, 9.671348571777344, 10.473410606384277, 11.275472640991211, 12.077534675598145, 12.879596710205078, 13.681658744812012, 14.483720779418945, 15.285782814025879, 16.087844848632812, 16.88990592956543, 17.69196891784668, 18.494029998779297, 19.296091079711914, 20.098154067993164, 20.90021514892578, 21.70227813720703, 22.50433921813965, 23.3064022064209, 24.108463287353516, 24.910526275634766]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 6.0, 6.0, 8.0, 18.0, 21.0, 33.0, 33.0, 60.0, 111.0, 96.0, 160.0, 225.0, 305.0, 467.0, 726.0, 1139.0, 1686.0, 2800.0, 4729.0, 7978.0, 14478.0, 25257.0, 46886.0, 85028.0, 145542.0, 210906.0, 200240.0, 130592.0, 74240.0, 41281.0, 22597.0, 12663.0, 6899.0, 4187.0, 2535.0, 1560.0, 975.0, 613.0, 457.0, 267.0, 209.0, 155.0, 111.0, 71.0, 68.0, 37.0, 21.0, 15.0, 18.0, 11.0, 13.0, 12.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.578125, -2.497283935546875, -2.41644287109375, -2.335601806640625, -2.2547607421875, -2.173919677734375, -2.09307861328125, -2.012237548828125, -1.931396484375, -1.850555419921875, -1.76971435546875, -1.688873291015625, -1.6080322265625, -1.527191162109375, -1.44635009765625, -1.365509033203125, -1.28466796875, -1.203826904296875, -1.12298583984375, -1.042144775390625, -0.9613037109375, -0.880462646484375, -0.79962158203125, -0.718780517578125, -0.637939453125, -0.557098388671875, -0.47625732421875, -0.395416259765625, -0.3145751953125, -0.233734130859375, -0.15289306640625, -0.072052001953125, 0.0087890625, 0.089630126953125, 0.17047119140625, 0.251312255859375, 0.3321533203125, 0.412994384765625, 0.49383544921875, 0.574676513671875, 0.655517578125, 0.736358642578125, 0.81719970703125, 0.898040771484375, 0.9788818359375, 1.059722900390625, 1.14056396484375, 1.221405029296875, 1.30224609375, 1.383087158203125, 1.46392822265625, 1.544769287109375, 1.6256103515625, 1.706451416015625, 1.78729248046875, 1.868133544921875, 1.948974609375, 2.029815673828125, 2.11065673828125, 2.191497802734375, 2.2723388671875, 2.353179931640625, 2.43402099609375, 2.514862060546875, 2.595703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 2.0, 7.0, 11.0, 9.0, 6.0, 13.0, 17.0, 21.0, 19.0, 21.0, 25.0, 42.0, 21.0, 30.0, 37.0, 45.0, 45.0, 45.0, 47.0, 45.0, 41.0, 45.0, 47.0, 32.0, 48.0, 34.0, 39.0, 25.0, 24.0, 21.0, 23.0, 17.0, 18.0, 13.0, 14.0, 12.0, 10.0, 4.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.232421875, -2.1678924560546875, -2.103363037109375, -2.0388336181640625, -1.97430419921875, -1.9097747802734375, -1.845245361328125, -1.7807159423828125, -1.7161865234375, -1.6516571044921875, -1.587127685546875, -1.5225982666015625, -1.45806884765625, -1.3935394287109375, -1.329010009765625, -1.2644805908203125, -1.199951171875, -1.1354217529296875, -1.070892333984375, -1.0063629150390625, -0.94183349609375, -0.8773040771484375, -0.812774658203125, -0.7482452392578125, -0.6837158203125, -0.6191864013671875, -0.554656982421875, -0.4901275634765625, -0.42559814453125, -0.3610687255859375, -0.296539306640625, -0.2320098876953125, -0.16748046875, -0.1029510498046875, -0.038421630859375, 0.0261077880859375, 0.09063720703125, 0.1551666259765625, 0.219696044921875, 0.2842254638671875, 0.3487548828125, 0.4132843017578125, 0.477813720703125, 0.5423431396484375, 0.60687255859375, 0.6714019775390625, 0.735931396484375, 0.8004608154296875, 0.864990234375, 0.9295196533203125, 0.994049072265625, 1.0585784912109375, 1.12310791015625, 1.1876373291015625, 1.252166748046875, 1.3166961669921875, 1.3812255859375, 1.4457550048828125, 1.510284423828125, 1.5748138427734375, 1.63934326171875, 1.7038726806640625, 1.768402099609375, 1.8329315185546875, 1.8974609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 11.0, 7.0, 18.0, 15.0, 27.0, 38.0, 47.0, 55.0, 75.0, 128.0, 201.0, 350.0, 797.0, 2016.0, 6853.0, 28108.0, 149737.0, 642678.0, 173016.0, 32681.0, 7544.0, 2268.0, 853.0, 378.0, 212.0, 122.0, 75.0, 64.0, 42.0, 39.0, 22.0, 16.0, 15.0, 12.0, 2.0, 4.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.39288330078125, -7.1724853515625, -6.95208740234375, -6.731689453125, -6.51129150390625, -6.2908935546875, -6.07049560546875, -5.85009765625, -5.62969970703125, -5.4093017578125, -5.18890380859375, -4.968505859375, -4.74810791015625, -4.5277099609375, -4.30731201171875, -4.0869140625, -3.86651611328125, -3.6461181640625, -3.42572021484375, -3.205322265625, -2.98492431640625, -2.7645263671875, -2.54412841796875, -2.32373046875, -2.10333251953125, -1.8829345703125, -1.66253662109375, -1.442138671875, -1.22174072265625, -1.0013427734375, -0.78094482421875, -0.560546875, -0.34014892578125, -0.1197509765625, 0.10064697265625, 0.321044921875, 0.54144287109375, 0.7618408203125, 0.98223876953125, 1.20263671875, 1.42303466796875, 1.6434326171875, 1.86383056640625, 2.084228515625, 2.30462646484375, 2.5250244140625, 2.74542236328125, 2.9658203125, 3.18621826171875, 3.4066162109375, 3.62701416015625, 3.847412109375, 4.06781005859375, 4.2882080078125, 4.50860595703125, 4.72900390625, 4.94940185546875, 5.1697998046875, 5.39019775390625, 5.610595703125, 5.83099365234375, 6.0513916015625, 6.27178955078125, 6.4921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 8.0, 6.0, 7.0, 12.0, 9.0, 8.0, 17.0, 18.0, 23.0, 28.0, 18.0, 28.0, 39.0, 32.0, 41.0, 45.0, 40.0, 43.0, 46.0, 62.0, 50.0, 41.0, 46.0, 49.0, 39.0, 35.0, 36.0, 33.0, 14.0, 27.0, 17.0, 14.0, 12.0, 9.0, 13.0, 5.0, 6.0, 2.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.31939697265625, -6.0802001953125, -5.84100341796875, -5.601806640625, -5.36260986328125, -5.1234130859375, -4.88421630859375, -4.64501953125, -4.40582275390625, -4.1666259765625, -3.92742919921875, -3.688232421875, -3.44903564453125, -3.2098388671875, -2.97064208984375, -2.7314453125, -2.49224853515625, -2.2530517578125, -2.01385498046875, -1.774658203125, -1.53546142578125, -1.2962646484375, -1.05706787109375, -0.81787109375, -0.57867431640625, -0.3394775390625, -0.10028076171875, 0.138916015625, 0.37811279296875, 0.6173095703125, 0.85650634765625, 1.095703125, 1.33489990234375, 1.5740966796875, 1.81329345703125, 2.052490234375, 2.29168701171875, 2.5308837890625, 2.77008056640625, 3.00927734375, 3.24847412109375, 3.4876708984375, 3.72686767578125, 3.966064453125, 4.20526123046875, 4.4444580078125, 4.68365478515625, 4.9228515625, 5.16204833984375, 5.4012451171875, 5.64044189453125, 5.879638671875, 6.11883544921875, 6.3580322265625, 6.59722900390625, 6.83642578125, 7.07562255859375, 7.3148193359375, 7.55401611328125, 7.793212890625, 8.03240966796875, 8.2716064453125, 8.51080322265625, 8.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 17.0, 7.0, 21.0, 35.0, 41.0, 82.0, 150.0, 217.0, 490.0, 1176.0, 3156.0, 10361.0, 43110.0, 212763.0, 620685.0, 120487.0, 25110.0, 6671.0, 2265.0, 825.0, 390.0, 185.0, 87.0, 76.0, 34.0, 30.0, 16.0, 14.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.8433837890625, -1.780517578125, -1.7176513671875, -1.65478515625, -1.5919189453125, -1.529052734375, -1.4661865234375, -1.4033203125, -1.3404541015625, -1.277587890625, -1.2147216796875, -1.15185546875, -1.0889892578125, -1.026123046875, -0.9632568359375, -0.900390625, -0.8375244140625, -0.774658203125, -0.7117919921875, -0.64892578125, -0.5860595703125, -0.523193359375, -0.4603271484375, -0.3974609375, -0.3345947265625, -0.271728515625, -0.2088623046875, -0.14599609375, -0.0831298828125, -0.020263671875, 0.0426025390625, 0.10546875, 0.1683349609375, 0.231201171875, 0.2940673828125, 0.35693359375, 0.4197998046875, 0.482666015625, 0.5455322265625, 0.6083984375, 0.6712646484375, 0.734130859375, 0.7969970703125, 0.85986328125, 0.9227294921875, 0.985595703125, 1.0484619140625, 1.111328125, 1.1741943359375, 1.237060546875, 1.2999267578125, 1.36279296875, 1.4256591796875, 1.488525390625, 1.5513916015625, 1.6142578125, 1.6771240234375, 1.739990234375, 1.8028564453125, 1.86572265625, 1.9285888671875, 1.991455078125, 2.0543212890625, 2.1171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 7.0, 2.0, 11.0, 5.0, 12.0, 14.0, 29.0, 34.0, 53.0, 59.0, 64.0, 96.0, 95.0, 109.0, 91.0, 76.0, 63.0, 45.0, 41.0, 22.0, 19.0, 11.0, 9.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005116462707519531, -0.0004921108484268188, -0.00047257542610168457, -0.0004530400037765503, -0.000433504581451416, -0.00041396915912628174, -0.00039443373680114746, -0.0003748983144760132, -0.0003553628921508789, -0.00033582746982574463, -0.00031629204750061035, -0.0002967566251754761, -0.0002772212028503418, -0.0002576857805252075, -0.00023815035820007324, -0.00021861493587493896, -0.0001990795135498047, -0.0001795440912246704, -0.00016000866889953613, -0.00014047324657440186, -0.00012093782424926758, -0.0001014024019241333, -8.186697959899902e-05, -6.233155727386475e-05, -4.279613494873047e-05, -2.326071262359619e-05, -3.725290298461914e-06, 1.5810132026672363e-05, 3.534555435180664e-05, 5.488097667694092e-05, 7.44163990020752e-05, 9.395182132720947e-05, 0.00011348724365234375, 0.00013302266597747803, 0.0001525580883026123, 0.00017209351062774658, 0.00019162893295288086, 0.00021116435527801514, 0.00023069977760314941, 0.0002502351999282837, 0.00026977062225341797, 0.00028930604457855225, 0.0003088414669036865, 0.0003283768892288208, 0.0003479123115539551, 0.00036744773387908936, 0.00038698315620422363, 0.0004065185785293579, 0.0004260540008544922, 0.00044558942317962646, 0.00046512484550476074, 0.000484660267829895, 0.0005041956901550293, 0.0005237311124801636, 0.0005432665348052979, 0.0005628019571304321, 0.0005823373794555664, 0.0006018728017807007, 0.000621408224105835, 0.0006409436464309692, 0.0006604790687561035, 0.0006800144910812378, 0.0006995499134063721, 0.0007190853357315063, 0.0007386207580566406]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 27.0, 32.0, 79.0, 165.0, 538.0, 2321.0, 23084.0, 724625.0, 284034.0, 11426.0, 1546.0, 418.0, 138.0, 55.0, 33.0, 11.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -2.979034423828125, -2.84283447265625, -2.706634521484375, -2.5704345703125, -2.434234619140625, -2.29803466796875, -2.161834716796875, -2.025634765625, -1.889434814453125, -1.75323486328125, -1.617034912109375, -1.4808349609375, -1.344635009765625, -1.20843505859375, -1.072235107421875, -0.93603515625, -0.799835205078125, -0.66363525390625, -0.527435302734375, -0.3912353515625, -0.255035400390625, -0.11883544921875, 0.017364501953125, 0.153564453125, 0.289764404296875, 0.42596435546875, 0.562164306640625, 0.6983642578125, 0.834564208984375, 0.97076416015625, 1.106964111328125, 1.2431640625, 1.379364013671875, 1.51556396484375, 1.651763916015625, 1.7879638671875, 1.924163818359375, 2.06036376953125, 2.196563720703125, 2.332763671875, 2.468963623046875, 2.60516357421875, 2.741363525390625, 2.8775634765625, 3.013763427734375, 3.14996337890625, 3.286163330078125, 3.42236328125, 3.558563232421875, 3.69476318359375, 3.830963134765625, 3.9671630859375, 4.103363037109375, 4.23956298828125, 4.375762939453125, 4.511962890625, 4.648162841796875, 4.78436279296875, 4.920562744140625, 5.0567626953125, 5.192962646484375, 5.32916259765625, 5.465362548828125, 5.6015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 21.0, 25.0, 22.0, 27.0, 46.0, 52.0, 59.0, 66.0, 75.0, 79.0, 106.0, 85.0, 74.0, 59.0, 41.0, 46.0, 23.0, 14.0, 17.0, 10.0, 10.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.904296875, -2.82525634765625, -2.7462158203125, -2.66717529296875, -2.588134765625, -2.50909423828125, -2.4300537109375, -2.35101318359375, -2.27197265625, -2.19293212890625, -2.1138916015625, -2.03485107421875, -1.955810546875, -1.87677001953125, -1.7977294921875, -1.71868896484375, -1.6396484375, -1.56060791015625, -1.4815673828125, -1.40252685546875, -1.323486328125, -1.24444580078125, -1.1654052734375, -1.08636474609375, -1.00732421875, -0.92828369140625, -0.8492431640625, -0.77020263671875, -0.691162109375, -0.61212158203125, -0.5330810546875, -0.45404052734375, -0.375, -0.29595947265625, -0.2169189453125, -0.13787841796875, -0.058837890625, 0.02020263671875, 0.0992431640625, 0.17828369140625, 0.25732421875, 0.33636474609375, 0.4154052734375, 0.49444580078125, 0.573486328125, 0.65252685546875, 0.7315673828125, 0.81060791015625, 0.8896484375, 0.96868896484375, 1.0477294921875, 1.12677001953125, 1.205810546875, 1.28485107421875, 1.3638916015625, 1.44293212890625, 1.52197265625, 1.60101318359375, 1.6800537109375, 1.75909423828125, 1.838134765625, 1.91717529296875, 1.9962158203125, 2.07525634765625, 2.154296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 13.0, 18.0, 52.0, 76.0, 191.0, 257.0, 125.0, 84.0, 65.0, 35.0, 28.0, 17.0, 9.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.088706970214844, -31.371530532836914, -29.654354095458984, -27.937175750732422, -26.219999313354492, -24.502822875976562, -22.78564453125, -21.06846809387207, -19.35129165649414, -17.63411521911621, -15.916937828063965, -14.199760437011719, -12.482583999633789, -10.76540756225586, -9.048230171203613, -7.331052780151367, -5.6138763427734375, -3.8966994285583496, -2.1795225143432617, -0.46234560012817383, 1.254831314086914, 2.9720077514648438, 4.68918514251709, 6.406362533569336, 8.123538970947266, 9.840715408325195, 11.557892799377441, 13.275070190429688, 14.992246627807617, 16.709423065185547, 18.42660140991211, 20.14377784729004, 21.86095428466797, 23.5781307220459, 25.295307159423828, 27.01248550415039, 28.72966194152832, 30.44683837890625, 32.16401672363281, 33.881195068359375, 35.59836959838867, 37.315547943115234, 39.03272247314453, 40.749900817871094, 42.467079162597656, 44.18425369262695, 45.901432037353516, 47.61860656738281, 49.335784912109375, 51.05296325683594, 52.770137786865234, 54.4873161315918, 56.204490661621094, 57.921669006347656, 59.63884735107422, 61.35602569580078, 63.07320022583008, 64.79037475585938, 66.50755310058594, 68.2247314453125, 69.94190979003906, 71.65908813476562, 73.37625885009766, 75.09343719482422, 76.81061553955078]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 1.0, 7.0, 9.0, 7.0, 17.0, 8.0, 17.0, 21.0, 20.0, 27.0, 11.0, 29.0, 27.0, 28.0, 24.0, 36.0, 55.0, 64.0, 69.0, 77.0, 62.0, 46.0, 40.0, 30.0, 30.0, 35.0, 28.0, 21.0, 31.0, 20.0, 12.0, 18.0, 12.0, 4.0, 10.0, 13.0, 3.0, 2.0, 3.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-33.36609649658203, -32.365840911865234, -31.36558723449707, -30.365333557128906, -29.36507797241211, -28.364822387695312, -27.36456871032715, -26.364315032958984, -25.364059448242188, -24.36380386352539, -23.363550186157227, -22.363296508789062, -21.363040924072266, -20.36278533935547, -19.362531661987305, -18.36227798461914, -17.362022399902344, -16.361766815185547, -15.361513137817383, -14.361258506774902, -13.361003875732422, -12.360749244689941, -11.360494613647461, -10.36023998260498, -9.3599853515625, -8.35973072052002, -7.359476089477539, -6.359221458435059, -5.358966827392578, -4.358712196350098, -3.358457565307617, -2.3582029342651367, -1.357950210571289, -0.3576955795288086, 0.6425590515136719, 1.6428136825561523, 2.643068313598633, 3.6433229446411133, 4.643577575683594, 5.643832206726074, 6.644086837768555, 7.644341468811035, 8.644596099853516, 9.644850730895996, 10.645105361938477, 11.645359992980957, 12.645614624023438, 13.645869255065918, 14.646123886108398, 15.646378517150879, 16.64663314819336, 17.646888732910156, 18.64714241027832, 19.647396087646484, 20.64765167236328, 21.647907257080078, 22.648160934448242, 23.648414611816406, 24.648670196533203, 25.64892578125, 26.649179458618164, 27.649433135986328, 28.649688720703125, 29.649944305419922, 30.650197982788086]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 6.0, 13.0, 17.0, 14.0, 22.0, 36.0, 54.0, 105.0, 159.0, 211.0, 352.0, 583.0, 892.0, 1439.0, 2218.0, 3924.0, 7087.0, 14424.0, 32636.0, 87761.0, 255136.0, 723755.0, 1486221.0, 998094.0, 368632.0, 126250.0, 45366.0, 18497.0, 8629.0, 4642.0, 2674.0, 1583.0, 970.0, 657.0, 398.0, 277.0, 161.0, 135.0, 79.0, 61.0, 34.0, 21.0, 15.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.400390625, -1.3515472412109375, -1.302703857421875, -1.2538604736328125, -1.20501708984375, -1.1561737060546875, -1.107330322265625, -1.0584869384765625, -1.0096435546875, -0.9608001708984375, -0.911956787109375, -0.8631134033203125, -0.81427001953125, -0.7654266357421875, -0.716583251953125, -0.6677398681640625, -0.618896484375, -0.5700531005859375, -0.521209716796875, -0.4723663330078125, -0.42352294921875, -0.3746795654296875, -0.325836181640625, -0.2769927978515625, -0.2281494140625, -0.1793060302734375, -0.130462646484375, -0.0816192626953125, -0.03277587890625, 0.0160675048828125, 0.064910888671875, 0.1137542724609375, 0.16259765625, 0.2114410400390625, 0.260284423828125, 0.3091278076171875, 0.35797119140625, 0.4068145751953125, 0.455657958984375, 0.5045013427734375, 0.5533447265625, 0.6021881103515625, 0.651031494140625, 0.6998748779296875, 0.74871826171875, 0.7975616455078125, 0.846405029296875, 0.8952484130859375, 0.944091796875, 0.9929351806640625, 1.041778564453125, 1.0906219482421875, 1.13946533203125, 1.1883087158203125, 1.237152099609375, 1.2859954833984375, 1.3348388671875, 1.3836822509765625, 1.432525634765625, 1.4813690185546875, 1.53021240234375, 1.5790557861328125, 1.627899169921875, 1.6767425537109375, 1.7255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 7.0, 8.0, 9.0, 19.0, 19.0, 15.0, 15.0, 38.0, 27.0, 27.0, 29.0, 36.0, 36.0, 39.0, 46.0, 40.0, 50.0, 55.0, 52.0, 45.0, 42.0, 39.0, 37.0, 36.0, 26.0, 24.0, 27.0, 22.0, 16.0, 23.0, 16.0, 16.0, 5.0, 6.0, 13.0, 4.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09765625, -2.0348358154296875, -1.972015380859375, -1.9091949462890625, -1.84637451171875, -1.7835540771484375, -1.720733642578125, -1.6579132080078125, -1.5950927734375, -1.5322723388671875, -1.469451904296875, -1.4066314697265625, -1.34381103515625, -1.2809906005859375, -1.218170166015625, -1.1553497314453125, -1.092529296875, -1.0297088623046875, -0.966888427734375, -0.9040679931640625, -0.84124755859375, -0.7784271240234375, -0.715606689453125, -0.6527862548828125, -0.5899658203125, -0.5271453857421875, -0.464324951171875, -0.4015045166015625, -0.33868408203125, -0.2758636474609375, -0.213043212890625, -0.1502227783203125, -0.08740234375, -0.0245819091796875, 0.038238525390625, 0.1010589599609375, 0.16387939453125, 0.2266998291015625, 0.289520263671875, 0.3523406982421875, 0.4151611328125, 0.4779815673828125, 0.540802001953125, 0.6036224365234375, 0.66644287109375, 0.7292633056640625, 0.792083740234375, 0.8549041748046875, 0.917724609375, 0.9805450439453125, 1.043365478515625, 1.1061859130859375, 1.16900634765625, 1.2318267822265625, 1.294647216796875, 1.3574676513671875, 1.4202880859375, 1.4831085205078125, 1.545928955078125, 1.6087493896484375, 1.67156982421875, 1.7343902587890625, 1.797210693359375, 1.8600311279296875, 1.9228515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 12.0, 13.0, 25.0, 39.0, 71.0, 137.0, 278.0, 744.0, 2964.0, 38451.0, 3945973.0, 197471.0, 6354.0, 1033.0, 356.0, 171.0, 88.0, 44.0, 11.0, 16.0, 11.0, 6.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4886474609375, -12.117919921875, -11.7471923828125, -11.37646484375, -11.0057373046875, -10.635009765625, -10.2642822265625, -9.8935546875, -9.5228271484375, -9.152099609375, -8.7813720703125, -8.41064453125, -8.0399169921875, -7.669189453125, -7.2984619140625, -6.927734375, -6.5570068359375, -6.186279296875, -5.8155517578125, -5.44482421875, -5.0740966796875, -4.703369140625, -4.3326416015625, -3.9619140625, -3.5911865234375, -3.220458984375, -2.8497314453125, -2.47900390625, -2.1082763671875, -1.737548828125, -1.3668212890625, -0.99609375, -0.6253662109375, -0.254638671875, 0.1160888671875, 0.48681640625, 0.8575439453125, 1.228271484375, 1.5989990234375, 1.9697265625, 2.3404541015625, 2.711181640625, 3.0819091796875, 3.45263671875, 3.8233642578125, 4.194091796875, 4.5648193359375, 4.935546875, 5.3062744140625, 5.677001953125, 6.0477294921875, 6.41845703125, 6.7891845703125, 7.159912109375, 7.5306396484375, 7.9013671875, 8.2720947265625, 8.642822265625, 9.0135498046875, 9.38427734375, 9.7550048828125, 10.125732421875, 10.4964599609375, 10.8671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 10.0, 13.0, 21.0, 35.0, 52.0, 114.0, 194.0, 414.0, 895.0, 1156.0, 590.0, 283.0, 119.0, 63.0, 43.0, 26.0, 12.0, 7.0, 14.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.90625, -10.647705078125, -10.38916015625, -10.130615234375, -9.8720703125, -9.613525390625, -9.35498046875, -9.096435546875, -8.837890625, -8.579345703125, -8.32080078125, -8.062255859375, -7.8037109375, -7.545166015625, -7.28662109375, -7.028076171875, -6.76953125, -6.510986328125, -6.25244140625, -5.993896484375, -5.7353515625, -5.476806640625, -5.21826171875, -4.959716796875, -4.701171875, -4.442626953125, -4.18408203125, -3.925537109375, -3.6669921875, -3.408447265625, -3.14990234375, -2.891357421875, -2.6328125, -2.374267578125, -2.11572265625, -1.857177734375, -1.5986328125, -1.340087890625, -1.08154296875, -0.822998046875, -0.564453125, -0.305908203125, -0.04736328125, 0.211181640625, 0.4697265625, 0.728271484375, 0.98681640625, 1.245361328125, 1.50390625, 1.762451171875, 2.02099609375, 2.279541015625, 2.5380859375, 2.796630859375, 3.05517578125, 3.313720703125, 3.572265625, 3.830810546875, 4.08935546875, 4.347900390625, 4.6064453125, 4.864990234375, 5.12353515625, 5.382080078125, 5.640625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 33.0, 91.0, 164.0, 274.0, 226.0, 108.0, 47.0, 14.0, 10.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-105.82020568847656, -103.69187927246094, -101.56355285644531, -99.43522644042969, -97.30690002441406, -95.17857360839844, -93.05024719238281, -90.92192840576172, -88.7936019897461, -86.66527557373047, -84.53694915771484, -82.40862274169922, -80.2802963256836, -78.1519775390625, -76.02365112304688, -73.89532470703125, -71.76699829101562, -69.638671875, -67.51034545898438, -65.38201904296875, -63.25369644165039, -61.125370025634766, -58.99704360961914, -56.868717193603516, -54.740386962890625, -52.612060546875, -50.483734130859375, -48.35540771484375, -46.22708511352539, -44.098758697509766, -41.97043228149414, -39.842105865478516, -37.71377944946289, -35.585453033447266, -33.45712661743164, -31.32880210876465, -29.200477600097656, -27.07215118408203, -24.943824768066406, -22.81549835205078, -20.68717384338379, -18.558847427368164, -16.430522918701172, -14.302196502685547, -12.173871040344238, -10.04554557800293, -7.917219161987305, -5.788893699645996, -3.6605682373046875, -1.5322425365447998, 0.5960831642150879, 2.7244091033935547, 4.852734565734863, 6.981060028076172, 9.109386444091797, 11.237711906433105, 13.366037368774414, 15.494362831115723, 17.62268829345703, 19.751014709472656, 21.87934112548828, 24.007665634155273, 26.1359920501709, 28.26431655883789, 30.392642974853516]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 7.0, 7.0, 13.0, 16.0, 12.0, 23.0, 26.0, 22.0, 27.0, 21.0, 44.0, 28.0, 50.0, 46.0, 45.0, 51.0, 61.0, 51.0, 46.0, 45.0, 47.0, 42.0, 34.0, 35.0, 29.0, 27.0, 20.0, 25.0, 10.0, 13.0, 8.0, 7.0, 11.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.260395050048828, -24.523662567138672, -23.786930084228516, -23.05019760131836, -22.313465118408203, -21.576732635498047, -20.84000015258789, -20.103267669677734, -19.366535186767578, -18.629802703857422, -17.893070220947266, -17.15633773803711, -16.419605255126953, -15.682872772216797, -14.946139335632324, -14.209406852722168, -13.472673416137695, -12.735940933227539, -11.999208450317383, -11.262475967407227, -10.52574348449707, -9.789011001586914, -9.052277565002441, -8.315545082092285, -7.578812599182129, -6.842080116271973, -6.105347633361816, -5.368614673614502, -4.631882190704346, -3.8951497077941895, -3.158416748046875, -2.4216842651367188, -1.6849517822265625, -0.9482191801071167, -0.2114865779876709, 0.5252461433410645, 1.2619786262512207, 1.998711109161377, 2.7354440689086914, 3.4721765518188477, 4.208909034729004, 4.94564151763916, 5.682374000549316, 6.419106960296631, 7.155839443206787, 7.892571926116943, 8.629304885864258, 9.366037368774414, 10.10276985168457, 10.839502334594727, 11.576234817504883, 12.312967300415039, 13.049699783325195, 13.786432266235352, 14.523165702819824, 15.25989818572998, 15.996630668640137, 16.73336410522461, 17.470096588134766, 18.206829071044922, 18.943561553955078, 19.680294036865234, 20.41702651977539, 21.153759002685547, 21.890491485595703]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 0.0, 2.0, 5.0, 2.0, 10.0, 10.0, 5.0, 31.0, 30.0, 35.0, 40.0, 78.0, 105.0, 180.0, 261.0, 401.0, 633.0, 1008.0, 1650.0, 2936.0, 5005.0, 9037.0, 16491.0, 30895.0, 57524.0, 107641.0, 186691.0, 238431.0, 174253.0, 98800.0, 53375.0, 28063.0, 15171.0, 8185.0, 4666.0, 2691.0, 1564.0, 948.0, 609.0, 347.0, 272.0, 137.0, 94.0, 73.0, 47.0, 41.0, 31.0, 21.0, 18.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.291015625, -2.215728759765625, -2.14044189453125, -2.065155029296875, -1.9898681640625, -1.914581298828125, -1.83929443359375, -1.764007568359375, -1.688720703125, -1.613433837890625, -1.53814697265625, -1.462860107421875, -1.3875732421875, -1.312286376953125, -1.23699951171875, -1.161712646484375, -1.08642578125, -1.011138916015625, -0.93585205078125, -0.860565185546875, -0.7852783203125, -0.709991455078125, -0.63470458984375, -0.559417724609375, -0.484130859375, -0.408843994140625, -0.33355712890625, -0.258270263671875, -0.1829833984375, -0.107696533203125, -0.03240966796875, 0.042877197265625, 0.1181640625, 0.193450927734375, 0.26873779296875, 0.344024658203125, 0.4193115234375, 0.494598388671875, 0.56988525390625, 0.645172119140625, 0.720458984375, 0.795745849609375, 0.87103271484375, 0.946319580078125, 1.0216064453125, 1.096893310546875, 1.17218017578125, 1.247467041015625, 1.32275390625, 1.398040771484375, 1.47332763671875, 1.548614501953125, 1.6239013671875, 1.699188232421875, 1.77447509765625, 1.849761962890625, 1.925048828125, 2.000335693359375, 2.07562255859375, 2.150909423828125, 2.2261962890625, 2.301483154296875, 2.37677001953125, 2.452056884765625, 2.52734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 5.0, 13.0, 9.0, 9.0, 11.0, 13.0, 26.0, 28.0, 31.0, 29.0, 40.0, 40.0, 39.0, 44.0, 47.0, 42.0, 63.0, 50.0, 66.0, 32.0, 37.0, 41.0, 37.0, 40.0, 27.0, 21.0, 25.0, 25.0, 24.0, 11.0, 8.0, 11.0, 12.0, 14.0, 6.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.9774169921875, -1.904052734375, -1.8306884765625, -1.75732421875, -1.6839599609375, -1.610595703125, -1.5372314453125, -1.4638671875, -1.3905029296875, -1.317138671875, -1.2437744140625, -1.17041015625, -1.0970458984375, -1.023681640625, -0.9503173828125, -0.876953125, -0.8035888671875, -0.730224609375, -0.6568603515625, -0.58349609375, -0.5101318359375, -0.436767578125, -0.3634033203125, -0.2900390625, -0.2166748046875, -0.143310546875, -0.0699462890625, 0.00341796875, 0.0767822265625, 0.150146484375, 0.2235107421875, 0.296875, 0.3702392578125, 0.443603515625, 0.5169677734375, 0.59033203125, 0.6636962890625, 0.737060546875, 0.8104248046875, 0.8837890625, 0.9571533203125, 1.030517578125, 1.1038818359375, 1.17724609375, 1.2506103515625, 1.323974609375, 1.3973388671875, 1.470703125, 1.5440673828125, 1.617431640625, 1.6907958984375, 1.76416015625, 1.8375244140625, 1.910888671875, 1.9842529296875, 2.0576171875, 2.1309814453125, 2.204345703125, 2.2777099609375, 2.35107421875, 2.4244384765625, 2.497802734375, 2.5711669921875, 2.64453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 3.0, 12.0, 6.0, 17.0, 29.0, 22.0, 35.0, 48.0, 93.0, 128.0, 188.0, 334.0, 587.0, 1234.0, 3215.0, 13355.0, 81597.0, 715306.0, 196937.0, 26178.0, 5686.0, 1699.0, 793.0, 390.0, 237.0, 136.0, 99.0, 61.0, 41.0, 21.0, 26.0, 12.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.5859375, -7.33056640625, -7.0751953125, -6.81982421875, -6.564453125, -6.30908203125, -6.0537109375, -5.79833984375, -5.54296875, -5.28759765625, -5.0322265625, -4.77685546875, -4.521484375, -4.26611328125, -4.0107421875, -3.75537109375, -3.5, -3.24462890625, -2.9892578125, -2.73388671875, -2.478515625, -2.22314453125, -1.9677734375, -1.71240234375, -1.45703125, -1.20166015625, -0.9462890625, -0.69091796875, -0.435546875, -0.18017578125, 0.0751953125, 0.33056640625, 0.5859375, 0.84130859375, 1.0966796875, 1.35205078125, 1.607421875, 1.86279296875, 2.1181640625, 2.37353515625, 2.62890625, 2.88427734375, 3.1396484375, 3.39501953125, 3.650390625, 3.90576171875, 4.1611328125, 4.41650390625, 4.671875, 4.92724609375, 5.1826171875, 5.43798828125, 5.693359375, 5.94873046875, 6.2041015625, 6.45947265625, 6.71484375, 6.97021484375, 7.2255859375, 7.48095703125, 7.736328125, 7.99169921875, 8.2470703125, 8.50244140625, 8.7578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 9.0, 11.0, 6.0, 12.0, 19.0, 19.0, 32.0, 26.0, 42.0, 51.0, 61.0, 67.0, 69.0, 74.0, 76.0, 81.0, 66.0, 59.0, 54.0, 43.0, 34.0, 22.0, 16.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.289306640625, -8.89892578125, -8.508544921875, -8.1181640625, -7.727783203125, -7.33740234375, -6.947021484375, -6.556640625, -6.166259765625, -5.77587890625, -5.385498046875, -4.9951171875, -4.604736328125, -4.21435546875, -3.823974609375, -3.43359375, -3.043212890625, -2.65283203125, -2.262451171875, -1.8720703125, -1.481689453125, -1.09130859375, -0.700927734375, -0.310546875, 0.079833984375, 0.47021484375, 0.860595703125, 1.2509765625, 1.641357421875, 2.03173828125, 2.422119140625, 2.8125, 3.202880859375, 3.59326171875, 3.983642578125, 4.3740234375, 4.764404296875, 5.15478515625, 5.545166015625, 5.935546875, 6.325927734375, 6.71630859375, 7.106689453125, 7.4970703125, 7.887451171875, 8.27783203125, 8.668212890625, 9.05859375, 9.448974609375, 9.83935546875, 10.229736328125, 10.6201171875, 11.010498046875, 11.40087890625, 11.791259765625, 12.181640625, 12.572021484375, 12.96240234375, 13.352783203125, 13.7431640625, 14.133544921875, 14.52392578125, 14.914306640625, 15.3046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 13.0, 16.0, 24.0, 19.0, 41.0, 60.0, 122.0, 146.0, 244.0, 529.0, 1066.0, 2779.0, 8905.0, 35475.0, 191872.0, 684457.0, 93709.0, 19900.0, 5542.0, 1897.0, 771.0, 372.0, 195.0, 133.0, 84.0, 49.0, 31.0, 28.0, 16.0, 11.0, 8.0, 12.0, 3.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6322784423828125, -1.570220947265625, -1.5081634521484375, -1.44610595703125, -1.3840484619140625, -1.321990966796875, -1.2599334716796875, -1.1978759765625, -1.1358184814453125, -1.073760986328125, -1.0117034912109375, -0.94964599609375, -0.8875885009765625, -0.825531005859375, -0.7634735107421875, -0.701416015625, -0.6393585205078125, -0.577301025390625, -0.5152435302734375, -0.45318603515625, -0.3911285400390625, -0.329071044921875, -0.2670135498046875, -0.2049560546875, -0.1428985595703125, -0.080841064453125, -0.0187835693359375, 0.04327392578125, 0.1053314208984375, 0.167388916015625, 0.2294464111328125, 0.29150390625, 0.3535614013671875, 0.415618896484375, 0.4776763916015625, 0.53973388671875, 0.6017913818359375, 0.663848876953125, 0.7259063720703125, 0.7879638671875, 0.8500213623046875, 0.912078857421875, 0.9741363525390625, 1.03619384765625, 1.0982513427734375, 1.160308837890625, 1.2223663330078125, 1.284423828125, 1.3464813232421875, 1.408538818359375, 1.4705963134765625, 1.53265380859375, 1.5947113037109375, 1.656768798828125, 1.7188262939453125, 1.7808837890625, 1.8429412841796875, 1.904998779296875, 1.9670562744140625, 2.02911376953125, 2.0911712646484375, 2.153228759765625, 2.2152862548828125, 2.27734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 11.0, 13.0, 14.0, 22.0, 25.0, 22.0, 31.0, 45.0, 58.0, 67.0, 97.0, 100.0, 98.0, 78.0, 60.0, 51.0, 34.0, 42.0, 25.0, 25.0, 14.0, 13.0, 12.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004782676696777344, -0.0004617348313331604, -0.0004452019929885864, -0.00042866915464401245, -0.0004121363162994385, -0.0003956034779548645, -0.00037907063961029053, -0.00036253780126571655, -0.0003460049629211426, -0.0003294721245765686, -0.00031293928623199463, -0.00029640644788742065, -0.0002798736095428467, -0.0002633407711982727, -0.00024680793285369873, -0.00023027509450912476, -0.00021374225616455078, -0.0001972094178199768, -0.00018067657947540283, -0.00016414374113082886, -0.00014761090278625488, -0.0001310780644416809, -0.00011454522609710693, -9.801238775253296e-05, -8.147954940795898e-05, -6.494671106338501e-05, -4.8413872718811035e-05, -3.188103437423706e-05, -1.5348196029663086e-05, 1.1846423149108887e-06, 1.7717480659484863e-05, 3.425031900405884e-05, 5.078315734863281e-05, 6.731599569320679e-05, 8.384883403778076e-05, 0.00010038167238235474, 0.00011691451072692871, 0.00013344734907150269, 0.00014998018741607666, 0.00016651302576065063, 0.0001830458641052246, 0.00019957870244979858, 0.00021611154079437256, 0.00023264437913894653, 0.0002491772174835205, 0.0002657100558280945, 0.00028224289417266846, 0.00029877573251724243, 0.0003153085708618164, 0.0003318414092063904, 0.00034837424755096436, 0.00036490708589553833, 0.0003814399242401123, 0.0003979727625846863, 0.00041450560092926025, 0.00043103843927383423, 0.0004475712776184082, 0.0004641041159629822, 0.00048063695430755615, 0.0004971697926521301, 0.0005137026309967041, 0.0005302354693412781, 0.000546768307685852, 0.000563301146030426, 0.000579833984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 15.0, 19.0, 32.0, 48.0, 81.0, 188.0, 354.0, 949.0, 2969.0, 16741.0, 222503.0, 757207.0, 39847.0, 5224.0, 1358.0, 484.0, 252.0, 109.0, 73.0, 37.0, 19.0, 17.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.49835205078125, -2.4029541015625, -2.30755615234375, -2.212158203125, -2.11676025390625, -2.0213623046875, -1.92596435546875, -1.83056640625, -1.73516845703125, -1.6397705078125, -1.54437255859375, -1.448974609375, -1.35357666015625, -1.2581787109375, -1.16278076171875, -1.0673828125, -0.97198486328125, -0.8765869140625, -0.78118896484375, -0.685791015625, -0.59039306640625, -0.4949951171875, -0.39959716796875, -0.30419921875, -0.20880126953125, -0.1134033203125, -0.01800537109375, 0.077392578125, 0.17279052734375, 0.2681884765625, 0.36358642578125, 0.458984375, 0.55438232421875, 0.6497802734375, 0.74517822265625, 0.840576171875, 0.93597412109375, 1.0313720703125, 1.12677001953125, 1.22216796875, 1.31756591796875, 1.4129638671875, 1.50836181640625, 1.603759765625, 1.69915771484375, 1.7945556640625, 1.88995361328125, 1.9853515625, 2.08074951171875, 2.1761474609375, 2.27154541015625, 2.366943359375, 2.46234130859375, 2.5577392578125, 2.65313720703125, 2.74853515625, 2.84393310546875, 2.9393310546875, 3.03472900390625, 3.130126953125, 3.22552490234375, 3.3209228515625, 3.41632080078125, 3.51171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 12.0, 21.0, 12.0, 32.0, 33.0, 32.0, 49.0, 50.0, 53.0, 63.0, 80.0, 80.0, 71.0, 69.0, 58.0, 50.0, 42.0, 39.0, 22.0, 16.0, 25.0, 20.0, 9.0, 10.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.312896728515625, -1.25860595703125, -1.204315185546875, -1.1500244140625, -1.095733642578125, -1.04144287109375, -0.987152099609375, -0.932861328125, -0.878570556640625, -0.82427978515625, -0.769989013671875, -0.7156982421875, -0.661407470703125, -0.60711669921875, -0.552825927734375, -0.49853515625, -0.444244384765625, -0.38995361328125, -0.335662841796875, -0.2813720703125, -0.227081298828125, -0.17279052734375, -0.118499755859375, -0.064208984375, -0.009918212890625, 0.04437255859375, 0.098663330078125, 0.1529541015625, 0.207244873046875, 0.26153564453125, 0.315826416015625, 0.3701171875, 0.424407958984375, 0.47869873046875, 0.532989501953125, 0.5872802734375, 0.641571044921875, 0.69586181640625, 0.750152587890625, 0.804443359375, 0.858734130859375, 0.91302490234375, 0.967315673828125, 1.0216064453125, 1.075897216796875, 1.13018798828125, 1.184478759765625, 1.23876953125, 1.293060302734375, 1.34735107421875, 1.401641845703125, 1.4559326171875, 1.510223388671875, 1.56451416015625, 1.618804931640625, 1.673095703125, 1.727386474609375, 1.78167724609375, 1.835968017578125, 1.8902587890625, 1.944549560546875, 1.99884033203125, 2.053131103515625, 2.107421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 30.0, 56.0, 100.0, 335.0, 271.0, 105.0, 46.0, 22.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.48383331298828, -105.14241027832031, -102.80098724365234, -100.45956420898438, -98.11813354492188, -95.7767105102539, -93.43528747558594, -91.09386444091797, -88.75244140625, -86.41101837158203, -84.06959533691406, -81.7281723022461, -79.38674926757812, -77.04531860351562, -74.70389556884766, -72.36247253417969, -70.02104949951172, -67.67962646484375, -65.33820343017578, -62.99677658081055, -60.65535354614258, -58.31393051147461, -55.972503662109375, -53.631080627441406, -51.28965759277344, -48.94823455810547, -46.6068115234375, -44.265384674072266, -41.9239616394043, -39.58253860473633, -37.241111755371094, -34.899688720703125, -32.55826187133789, -30.216838836669922, -27.87541389465332, -25.53398895263672, -23.19256591796875, -20.85114288330078, -18.50971794128418, -16.168292999267578, -13.82686996459961, -11.485445976257324, -9.144021987915039, -6.802597999572754, -4.461174011230469, -2.1197500228881836, 0.22167396545410156, 2.563098907470703, 4.904521942138672, 7.245945930480957, 9.587369918823242, 11.928793907165527, 14.270217895507812, 16.61164093017578, 18.953065872192383, 21.294490814208984, 23.635913848876953, 25.977336883544922, 28.318761825561523, 30.660186767578125, 33.001609802246094, 35.34303283691406, 37.68445587158203, 40.025882720947266, 42.367305755615234]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 7.0, 8.0, 6.0, 13.0, 15.0, 16.0, 15.0, 14.0, 23.0, 15.0, 22.0, 29.0, 27.0, 24.0, 38.0, 44.0, 75.0, 105.0, 107.0, 71.0, 40.0, 38.0, 28.0, 27.0, 20.0, 32.0, 17.0, 16.0, 14.0, 12.0, 9.0, 12.0, 10.0, 11.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.56679153442383, -34.57630920410156, -33.5858268737793, -32.59534454345703, -31.6048641204834, -30.614381790161133, -29.623899459838867, -28.6334171295166, -27.64293670654297, -26.652454376220703, -25.661972045898438, -24.671489715576172, -23.68100929260254, -22.690526962280273, -21.700044631958008, -20.709562301635742, -19.719079971313477, -18.72859764099121, -17.738115310668945, -16.747634887695312, -15.757152557373047, -14.766670227050781, -13.776187896728516, -12.78570556640625, -11.7952241897583, -10.804741859436035, -9.814260482788086, -8.82377815246582, -7.833296298980713, -6.8428144454956055, -5.85233211517334, -4.861850261688232, -3.871370315551758, -2.8808884620666504, -1.8904063701629639, -0.8999242782592773, 0.09055757522583008, 1.0810394287109375, 2.071521759033203, 3.0620036125183105, 4.052485466003418, 5.042967319488525, 6.033449172973633, 7.023931503295898, 8.014413833618164, 9.004895210266113, 9.995377540588379, 10.985858917236328, 11.976341247558594, 12.96682357788086, 13.957304954528809, 14.947787284851074, 15.938268661499023, 16.92875099182129, 17.919233322143555, 18.90971565246582, 19.900196075439453, 20.89067840576172, 21.881160736083984, 22.87164306640625, 23.862123489379883, 24.85260581970215, 25.843088150024414, 26.83357048034668, 27.824052810668945]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 10.0, 14.0, 17.0, 40.0, 58.0, 66.0, 100.0, 145.0, 249.0, 355.0, 550.0, 961.0, 1494.0, 2749.0, 5144.0, 10267.0, 23960.0, 64243.0, 184456.0, 534736.0, 1335466.0, 1271856.0, 492662.0, 164750.0, 57465.0, 21669.0, 9465.0, 4701.0, 2539.0, 1511.0, 910.0, 522.0, 361.0, 247.0, 165.0, 113.0, 82.0, 60.0, 30.0, 22.0, 19.0, 13.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.9169921875, -1.862152099609375, -1.80731201171875, -1.752471923828125, -1.6976318359375, -1.642791748046875, -1.58795166015625, -1.533111572265625, -1.478271484375, -1.423431396484375, -1.36859130859375, -1.313751220703125, -1.2589111328125, -1.204071044921875, -1.14923095703125, -1.094390869140625, -1.03955078125, -0.984710693359375, -0.92987060546875, -0.875030517578125, -0.8201904296875, -0.765350341796875, -0.71051025390625, -0.655670166015625, -0.600830078125, -0.545989990234375, -0.49114990234375, -0.436309814453125, -0.3814697265625, -0.326629638671875, -0.27178955078125, -0.216949462890625, -0.162109375, -0.107269287109375, -0.05242919921875, 0.002410888671875, 0.0572509765625, 0.112091064453125, 0.16693115234375, 0.221771240234375, 0.276611328125, 0.331451416015625, 0.38629150390625, 0.441131591796875, 0.4959716796875, 0.550811767578125, 0.60565185546875, 0.660491943359375, 0.71533203125, 0.770172119140625, 0.82501220703125, 0.879852294921875, 0.9346923828125, 0.989532470703125, 1.04437255859375, 1.099212646484375, 1.154052734375, 1.208892822265625, 1.26373291015625, 1.318572998046875, 1.3734130859375, 1.428253173828125, 1.48309326171875, 1.537933349609375, 1.5927734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 12.0, 3.0, 9.0, 6.0, 5.0, 5.0, 12.0, 10.0, 11.0, 16.0, 22.0, 29.0, 32.0, 30.0, 30.0, 31.0, 34.0, 52.0, 27.0, 41.0, 38.0, 49.0, 52.0, 48.0, 39.0, 35.0, 38.0, 38.0, 32.0, 21.0, 24.0, 28.0, 17.0, 13.0, 26.0, 14.0, 10.0, 10.0, 6.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.90625, -1.8443603515625, -1.782470703125, -1.7205810546875, -1.65869140625, -1.5968017578125, -1.534912109375, -1.4730224609375, -1.4111328125, -1.3492431640625, -1.287353515625, -1.2254638671875, -1.16357421875, -1.1016845703125, -1.039794921875, -0.9779052734375, -0.916015625, -0.8541259765625, -0.792236328125, -0.7303466796875, -0.66845703125, -0.6065673828125, -0.544677734375, -0.4827880859375, -0.4208984375, -0.3590087890625, -0.297119140625, -0.2352294921875, -0.17333984375, -0.1114501953125, -0.049560546875, 0.0123291015625, 0.07421875, 0.1361083984375, 0.197998046875, 0.2598876953125, 0.32177734375, 0.3836669921875, 0.445556640625, 0.5074462890625, 0.5693359375, 0.6312255859375, 0.693115234375, 0.7550048828125, 0.81689453125, 0.8787841796875, 0.940673828125, 1.0025634765625, 1.064453125, 1.1263427734375, 1.188232421875, 1.2501220703125, 1.31201171875, 1.3739013671875, 1.435791015625, 1.4976806640625, 1.5595703125, 1.6214599609375, 1.683349609375, 1.7452392578125, 1.80712890625, 1.8690185546875, 1.930908203125, 1.9927978515625, 2.0546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 7.0, 5.0, 13.0, 6.0, 14.0, 16.0, 27.0, 28.0, 34.0, 53.0, 102.0, 177.0, 363.0, 780.0, 2226.0, 8068.0, 51037.0, 1637005.0, 2417760.0, 63835.0, 8916.0, 2174.0, 789.0, 335.0, 178.0, 87.0, 57.0, 45.0, 35.0, 27.0, 19.0, 14.0, 6.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.43359375, -6.22637939453125, -6.0191650390625, -5.81195068359375, -5.604736328125, -5.39752197265625, -5.1903076171875, -4.98309326171875, -4.77587890625, -4.56866455078125, -4.3614501953125, -4.15423583984375, -3.947021484375, -3.73980712890625, -3.5325927734375, -3.32537841796875, -3.1181640625, -2.91094970703125, -2.7037353515625, -2.49652099609375, -2.289306640625, -2.08209228515625, -1.8748779296875, -1.66766357421875, -1.46044921875, -1.25323486328125, -1.0460205078125, -0.83880615234375, -0.631591796875, -0.42437744140625, -0.2171630859375, -0.00994873046875, 0.197265625, 0.40447998046875, 0.6116943359375, 0.81890869140625, 1.026123046875, 1.23333740234375, 1.4405517578125, 1.64776611328125, 1.85498046875, 2.06219482421875, 2.2694091796875, 2.47662353515625, 2.683837890625, 2.89105224609375, 3.0982666015625, 3.30548095703125, 3.5126953125, 3.71990966796875, 3.9271240234375, 4.13433837890625, 4.341552734375, 4.54876708984375, 4.7559814453125, 4.96319580078125, 5.17041015625, 5.37762451171875, 5.5848388671875, 5.79205322265625, 5.999267578125, 6.20648193359375, 6.4136962890625, 6.62091064453125, 6.828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 5.0, 4.0, 9.0, 13.0, 11.0, 14.0, 31.0, 52.0, 45.0, 61.0, 103.0, 157.0, 258.0, 384.0, 606.0, 688.0, 559.0, 400.0, 217.0, 156.0, 84.0, 64.0, 38.0, 30.0, 21.0, 16.0, 11.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.07110595703125, -5.9039306640625, -5.73675537109375, -5.569580078125, -5.40240478515625, -5.2352294921875, -5.06805419921875, -4.90087890625, -4.73370361328125, -4.5665283203125, -4.39935302734375, -4.232177734375, -4.06500244140625, -3.8978271484375, -3.73065185546875, -3.5634765625, -3.39630126953125, -3.2291259765625, -3.06195068359375, -2.894775390625, -2.72760009765625, -2.5604248046875, -2.39324951171875, -2.22607421875, -2.05889892578125, -1.8917236328125, -1.72454833984375, -1.557373046875, -1.39019775390625, -1.2230224609375, -1.05584716796875, -0.888671875, -0.72149658203125, -0.5543212890625, -0.38714599609375, -0.219970703125, -0.05279541015625, 0.1143798828125, 0.28155517578125, 0.44873046875, 0.61590576171875, 0.7830810546875, 0.95025634765625, 1.117431640625, 1.28460693359375, 1.4517822265625, 1.61895751953125, 1.7861328125, 1.95330810546875, 2.1204833984375, 2.28765869140625, 2.454833984375, 2.62200927734375, 2.7891845703125, 2.95635986328125, 3.12353515625, 3.29071044921875, 3.4578857421875, 3.62506103515625, 3.792236328125, 3.95941162109375, 4.1265869140625, 4.29376220703125, 4.4609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 24.0, 61.0, 157.0, 298.0, 271.0, 111.0, 36.0, 15.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.35106658935547, -116.86079406738281, -114.37052917480469, -111.88025665283203, -109.3899917602539, -106.89971923828125, -104.40945434570312, -101.91918182373047, -99.42890930175781, -96.93863677978516, -94.44837188720703, -91.95809936523438, -89.46783447265625, -86.9775619506836, -84.48729705810547, -81.99702453613281, -79.50675964355469, -77.01648712158203, -74.5262222290039, -72.03594970703125, -69.54568481445312, -67.05541229248047, -64.56514739990234, -62.07487487792969, -59.5846061706543, -57.094337463378906, -54.604068756103516, -52.113800048828125, -49.62352752685547, -47.133262634277344, -44.64299011230469, -42.1527214050293, -39.662452697753906, -37.172183990478516, -34.681915283203125, -32.191646575927734, -29.70137596130371, -27.21110725402832, -24.720836639404297, -22.230567932128906, -19.740299224853516, -17.250030517578125, -14.759760856628418, -12.269491195678711, -9.77922248840332, -7.28895378112793, -4.798684120178223, -2.3084144592285156, 0.181854248046875, 2.672123432159424, 5.162392616271973, 7.6526618003845215, 10.14293098449707, 12.633199691772461, 15.123469352722168, 17.613739013671875, 20.104007720947266, 22.594276428222656, 25.084545135498047, 27.57481575012207, 30.06508445739746, 32.55535125732422, 35.045623779296875, 37.535892486572266, 40.026161193847656]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 5.0, 13.0, 19.0, 17.0, 24.0, 23.0, 32.0, 40.0, 42.0, 46.0, 60.0, 59.0, 71.0, 74.0, 66.0, 59.0, 51.0, 37.0, 35.0, 40.0, 26.0, 30.0, 23.0, 16.0, 15.0, 15.0, 9.0, 7.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.55684471130371, -25.677698135375977, -24.79854965209961, -23.919403076171875, -23.04025650024414, -22.161109924316406, -21.281963348388672, -20.402814865112305, -19.52366828918457, -18.644521713256836, -17.76537322998047, -16.886226654052734, -16.007080078125, -15.127933502197266, -14.248785972595215, -13.369638442993164, -12.49049186706543, -11.611345291137695, -10.732197761535645, -9.853050231933594, -8.97390365600586, -8.094757080078125, -7.215609550476074, -6.336462497711182, -5.457315444946289, -4.5781683921813965, -3.699021339416504, -2.8198742866516113, -1.9407272338867188, -1.0615801811218262, -0.1824331283569336, 0.696713924407959, 1.5758628845214844, 2.455009937286377, 3.3341569900512695, 4.213304042816162, 5.092451095581055, 5.971598148345947, 6.85074520111084, 7.729892253875732, 8.609039306640625, 9.48818588256836, 10.36733341217041, 11.246480941772461, 12.125627517700195, 13.00477409362793, 13.88392162322998, 14.763069152832031, 15.642215728759766, 16.5213623046875, 17.400508880615234, 18.2796573638916, 19.158803939819336, 20.03795051574707, 20.917098999023438, 21.796245574951172, 22.675392150878906, 23.55453872680664, 24.433685302734375, 25.312833786010742, 26.191980361938477, 27.07112693786621, 27.950275421142578, 28.829421997070312, 29.708568572998047]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 12.0, 18.0, 29.0, 36.0, 41.0, 80.0, 114.0, 159.0, 301.0, 467.0, 754.0, 1344.0, 2413.0, 4186.0, 7788.0, 14984.0, 29812.0, 63430.0, 139801.0, 285425.0, 261147.0, 123718.0, 56168.0, 26762.0, 13400.0, 6940.0, 3808.0, 2193.0, 1278.0, 764.0, 474.0, 249.0, 156.0, 102.0, 69.0, 49.0, 29.0, 16.0, 11.0, 10.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.224273681640625, -3.11651611328125, -3.008758544921875, -2.9010009765625, -2.793243408203125, -2.68548583984375, -2.577728271484375, -2.469970703125, -2.362213134765625, -2.25445556640625, -2.146697998046875, -2.0389404296875, -1.931182861328125, -1.82342529296875, -1.715667724609375, -1.60791015625, -1.500152587890625, -1.39239501953125, -1.284637451171875, -1.1768798828125, -1.069122314453125, -0.96136474609375, -0.853607177734375, -0.745849609375, -0.638092041015625, -0.53033447265625, -0.422576904296875, -0.3148193359375, -0.207061767578125, -0.09930419921875, 0.008453369140625, 0.1162109375, 0.223968505859375, 0.33172607421875, 0.439483642578125, 0.5472412109375, 0.654998779296875, 0.76275634765625, 0.870513916015625, 0.978271484375, 1.086029052734375, 1.19378662109375, 1.301544189453125, 1.4093017578125, 1.517059326171875, 1.62481689453125, 1.732574462890625, 1.84033203125, 1.948089599609375, 2.05584716796875, 2.163604736328125, 2.2713623046875, 2.379119873046875, 2.48687744140625, 2.594635009765625, 2.702392578125, 2.810150146484375, 2.91790771484375, 3.025665283203125, 3.1334228515625, 3.241180419921875, 3.34893798828125, 3.456695556640625, 3.564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 12.0, 16.0, 10.0, 18.0, 8.0, 21.0, 30.0, 42.0, 32.0, 35.0, 35.0, 44.0, 42.0, 48.0, 45.0, 44.0, 49.0, 46.0, 50.0, 35.0, 37.0, 30.0, 37.0, 34.0, 22.0, 28.0, 25.0, 18.0, 17.0, 11.0, 13.0, 6.0, 7.0, 7.0, 8.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.18341064453125, -2.1109619140625, -2.03851318359375, -1.966064453125, -1.89361572265625, -1.8211669921875, -1.74871826171875, -1.67626953125, -1.60382080078125, -1.5313720703125, -1.45892333984375, -1.386474609375, -1.31402587890625, -1.2415771484375, -1.16912841796875, -1.0966796875, -1.02423095703125, -0.9517822265625, -0.87933349609375, -0.806884765625, -0.73443603515625, -0.6619873046875, -0.58953857421875, -0.51708984375, -0.44464111328125, -0.3721923828125, -0.29974365234375, -0.227294921875, -0.15484619140625, -0.0823974609375, -0.00994873046875, 0.0625, 0.13494873046875, 0.2073974609375, 0.27984619140625, 0.352294921875, 0.42474365234375, 0.4971923828125, 0.56964111328125, 0.64208984375, 0.71453857421875, 0.7869873046875, 0.85943603515625, 0.931884765625, 1.00433349609375, 1.0767822265625, 1.14923095703125, 1.2216796875, 1.29412841796875, 1.3665771484375, 1.43902587890625, 1.511474609375, 1.58392333984375, 1.6563720703125, 1.72882080078125, 1.80126953125, 1.87371826171875, 1.9461669921875, 2.01861572265625, 2.091064453125, 2.16351318359375, 2.2359619140625, 2.30841064453125, 2.380859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 4.0, 23.0, 16.0, 23.0, 19.0, 57.0, 59.0, 82.0, 130.0, 184.0, 268.0, 387.0, 648.0, 1105.0, 2405.0, 7073.0, 33599.0, 281550.0, 659300.0, 46569.0, 8874.0, 2792.0, 1296.0, 711.0, 424.0, 291.0, 193.0, 134.0, 108.0, 61.0, 43.0, 36.0, 31.0, 10.0, 10.0, 11.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.69769287109375, -7.4500732421875, -7.20245361328125, -6.954833984375, -6.70721435546875, -6.4595947265625, -6.21197509765625, -5.96435546875, -5.71673583984375, -5.4691162109375, -5.22149658203125, -4.973876953125, -4.72625732421875, -4.4786376953125, -4.23101806640625, -3.9833984375, -3.73577880859375, -3.4881591796875, -3.24053955078125, -2.992919921875, -2.74530029296875, -2.4976806640625, -2.25006103515625, -2.00244140625, -1.75482177734375, -1.5072021484375, -1.25958251953125, -1.011962890625, -0.76434326171875, -0.5167236328125, -0.26910400390625, -0.021484375, 0.22613525390625, 0.4737548828125, 0.72137451171875, 0.968994140625, 1.21661376953125, 1.4642333984375, 1.71185302734375, 1.95947265625, 2.20709228515625, 2.4547119140625, 2.70233154296875, 2.949951171875, 3.19757080078125, 3.4451904296875, 3.69281005859375, 3.9404296875, 4.18804931640625, 4.4356689453125, 4.68328857421875, 4.930908203125, 5.17852783203125, 5.4261474609375, 5.67376708984375, 5.92138671875, 6.16900634765625, 6.4166259765625, 6.66424560546875, 6.911865234375, 7.15948486328125, 7.4071044921875, 7.65472412109375, 7.90234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 12.0, 17.0, 17.0, 26.0, 17.0, 16.0, 22.0, 26.0, 40.0, 42.0, 50.0, 44.0, 50.0, 58.0, 74.0, 64.0, 63.0, 40.0, 35.0, 45.0, 23.0, 32.0, 24.0, 20.0, 17.0, 14.0, 23.0, 17.0, 11.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1875, -8.9129638671875, -8.638427734375, -8.3638916015625, -8.08935546875, -7.8148193359375, -7.540283203125, -7.2657470703125, -6.9912109375, -6.7166748046875, -6.442138671875, -6.1676025390625, -5.89306640625, -5.6185302734375, -5.343994140625, -5.0694580078125, -4.794921875, -4.5203857421875, -4.245849609375, -3.9713134765625, -3.69677734375, -3.4222412109375, -3.147705078125, -2.8731689453125, -2.5986328125, -2.3240966796875, -2.049560546875, -1.7750244140625, -1.50048828125, -1.2259521484375, -0.951416015625, -0.6768798828125, -0.40234375, -0.1278076171875, 0.146728515625, 0.4212646484375, 0.69580078125, 0.9703369140625, 1.244873046875, 1.5194091796875, 1.7939453125, 2.0684814453125, 2.343017578125, 2.6175537109375, 2.89208984375, 3.1666259765625, 3.441162109375, 3.7156982421875, 3.990234375, 4.2647705078125, 4.539306640625, 4.8138427734375, 5.08837890625, 5.3629150390625, 5.637451171875, 5.9119873046875, 6.1865234375, 6.4610595703125, 6.735595703125, 7.0101318359375, 7.28466796875, 7.5592041015625, 7.833740234375, 8.1082763671875, 8.3828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 4.0, 8.0, 19.0, 19.0, 18.0, 49.0, 65.0, 126.0, 246.0, 490.0, 1295.0, 4703.0, 32141.0, 719145.0, 264397.0, 20420.0, 3458.0, 1000.0, 428.0, 215.0, 129.0, 49.0, 43.0, 15.0, 19.0, 14.0, 14.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.234375, -3.1552886962890625, -3.076202392578125, -2.9971160888671875, -2.91802978515625, -2.8389434814453125, -2.759857177734375, -2.6807708740234375, -2.6016845703125, -2.5225982666015625, -2.443511962890625, -2.3644256591796875, -2.28533935546875, -2.2062530517578125, -2.127166748046875, -2.0480804443359375, -1.968994140625, -1.8899078369140625, -1.810821533203125, -1.7317352294921875, -1.65264892578125, -1.5735626220703125, -1.494476318359375, -1.4153900146484375, -1.3363037109375, -1.2572174072265625, -1.178131103515625, -1.0990447998046875, -1.01995849609375, -0.9408721923828125, -0.861785888671875, -0.7826995849609375, -0.70361328125, -0.6245269775390625, -0.545440673828125, -0.4663543701171875, -0.38726806640625, -0.3081817626953125, -0.229095458984375, -0.1500091552734375, -0.0709228515625, 0.0081634521484375, 0.087249755859375, 0.1663360595703125, 0.24542236328125, 0.3245086669921875, 0.403594970703125, 0.4826812744140625, 0.561767578125, 0.6408538818359375, 0.719940185546875, 0.7990264892578125, 0.87811279296875, 0.9571990966796875, 1.036285400390625, 1.1153717041015625, 1.1944580078125, 1.2735443115234375, 1.352630615234375, 1.4317169189453125, 1.51080322265625, 1.5898895263671875, 1.668975830078125, 1.7480621337890625, 1.8271484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 9.0, 6.0, 14.0, 20.0, 28.0, 23.0, 42.0, 46.0, 58.0, 84.0, 120.0, 104.0, 99.0, 76.0, 62.0, 49.0, 36.0, 36.0, 14.0, 12.0, 10.0, 13.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006017684936523438, -0.0005847364664077759, -0.000567704439163208, -0.0005506724119186401, -0.0005336403846740723, -0.0005166083574295044, -0.0004995763301849365, -0.00048254430294036865, -0.0004655122756958008, -0.0004484802484512329, -0.00043144822120666504, -0.00041441619396209717, -0.0003973841667175293, -0.0003803521394729614, -0.00036332011222839355, -0.0003462880849838257, -0.0003292560577392578, -0.00031222403049468994, -0.00029519200325012207, -0.0002781599760055542, -0.00026112794876098633, -0.00024409592151641846, -0.00022706389427185059, -0.00021003186702728271, -0.00019299983978271484, -0.00017596781253814697, -0.0001589357852935791, -0.00014190375804901123, -0.00012487173080444336, -0.00010783970355987549, -9.080767631530762e-05, -7.377564907073975e-05, -5.6743621826171875e-05, -3.9711594581604004e-05, -2.2679567337036133e-05, -5.647540092468262e-06, 1.138448715209961e-05, 2.841651439666748e-05, 4.544854164123535e-05, 6.248056888580322e-05, 7.95125961303711e-05, 9.654462337493896e-05, 0.00011357665061950684, 0.0001306086778640747, 0.00014764070510864258, 0.00016467273235321045, 0.00018170475959777832, 0.0001987367868423462, 0.00021576881408691406, 0.00023280084133148193, 0.0002498328685760498, 0.0002668648958206177, 0.00028389692306518555, 0.0003009289503097534, 0.0003179609775543213, 0.00033499300479888916, 0.00035202503204345703, 0.0003690570592880249, 0.0003860890865325928, 0.00040312111377716064, 0.0004201531410217285, 0.0004371851682662964, 0.00045421719551086426, 0.00047124922275543213, 0.00048828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 6.0, 11.0, 16.0, 24.0, 26.0, 57.0, 58.0, 128.0, 179.0, 308.0, 475.0, 947.0, 2043.0, 5947.0, 25838.0, 215241.0, 724100.0, 57107.0, 10093.0, 2991.0, 1268.0, 636.0, 348.0, 236.0, 140.0, 81.0, 79.0, 41.0, 28.0, 23.0, 11.0, 13.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8427734375, -1.785552978515625, -1.72833251953125, -1.671112060546875, -1.6138916015625, -1.556671142578125, -1.49945068359375, -1.442230224609375, -1.385009765625, -1.327789306640625, -1.27056884765625, -1.213348388671875, -1.1561279296875, -1.098907470703125, -1.04168701171875, -0.984466552734375, -0.92724609375, -0.870025634765625, -0.81280517578125, -0.755584716796875, -0.6983642578125, -0.641143798828125, -0.58392333984375, -0.526702880859375, -0.469482421875, -0.412261962890625, -0.35504150390625, -0.297821044921875, -0.2406005859375, -0.183380126953125, -0.12615966796875, -0.068939208984375, -0.01171875, 0.045501708984375, 0.10272216796875, 0.159942626953125, 0.2171630859375, 0.274383544921875, 0.33160400390625, 0.388824462890625, 0.446044921875, 0.503265380859375, 0.56048583984375, 0.617706298828125, 0.6749267578125, 0.732147216796875, 0.78936767578125, 0.846588134765625, 0.90380859375, 0.961029052734375, 1.01824951171875, 1.075469970703125, 1.1326904296875, 1.189910888671875, 1.24713134765625, 1.304351806640625, 1.361572265625, 1.418792724609375, 1.47601318359375, 1.533233642578125, 1.5904541015625, 1.647674560546875, 1.70489501953125, 1.762115478515625, 1.8193359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 4.0, 4.0, 9.0, 9.0, 12.0, 16.0, 22.0, 26.0, 44.0, 42.0, 42.0, 57.0, 73.0, 74.0, 83.0, 89.0, 74.0, 51.0, 47.0, 37.0, 27.0, 27.0, 17.0, 14.0, 15.0, 15.0, 13.0, 11.0, 2.0, 4.0, 11.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.73046875, -1.6787261962890625, -1.626983642578125, -1.5752410888671875, -1.52349853515625, -1.4717559814453125, -1.420013427734375, -1.3682708740234375, -1.3165283203125, -1.2647857666015625, -1.213043212890625, -1.1613006591796875, -1.10955810546875, -1.0578155517578125, -1.006072998046875, -0.9543304443359375, -0.902587890625, -0.8508453369140625, -0.799102783203125, -0.7473602294921875, -0.69561767578125, -0.6438751220703125, -0.592132568359375, -0.5403900146484375, -0.4886474609375, -0.4369049072265625, -0.385162353515625, -0.3334197998046875, -0.28167724609375, -0.2299346923828125, -0.178192138671875, -0.1264495849609375, -0.07470703125, -0.0229644775390625, 0.028778076171875, 0.0805206298828125, 0.13226318359375, 0.1840057373046875, 0.235748291015625, 0.2874908447265625, 0.3392333984375, 0.3909759521484375, 0.442718505859375, 0.4944610595703125, 0.54620361328125, 0.5979461669921875, 0.649688720703125, 0.7014312744140625, 0.753173828125, 0.8049163818359375, 0.856658935546875, 0.9084014892578125, 0.96014404296875, 1.0118865966796875, 1.063629150390625, 1.1153717041015625, 1.1671142578125, 1.2188568115234375, 1.270599365234375, 1.3223419189453125, 1.37408447265625, 1.4258270263671875, 1.477569580078125, 1.5293121337890625, 1.5810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 17.0, 29.0, 39.0, 66.0, 136.0, 325.0, 136.0, 107.0, 53.0, 30.0, 23.0, 14.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.87493133544922, -44.46272277832031, -43.05051040649414, -41.638301849365234, -40.22609329223633, -38.813880920410156, -37.40167236328125, -35.989463806152344, -34.57725524902344, -33.16504669189453, -31.752836227416992, -30.340625762939453, -28.928417205810547, -27.516206741333008, -26.10399627685547, -24.691787719726562, -23.27957534790039, -21.86736488342285, -20.455156326293945, -19.042945861816406, -17.6307373046875, -16.21852684020996, -14.806316375732422, -13.3941068649292, -11.981897354125977, -10.569687843322754, -9.157478332519531, -7.745267868041992, -6.3330583572387695, -4.920848846435547, -3.508638381958008, -2.096428871154785, -0.6842231750488281, 0.7279865741729736, 2.1401963233947754, 3.5524063110351562, 4.964615821838379, 6.376825332641602, 7.789035797119141, 9.201245307922363, 10.613454818725586, 12.025664329528809, 13.437873840332031, 14.85008430480957, 16.26229476928711, 17.674503326416016, 19.086713790893555, 20.498924255371094, 21.9111328125, 23.32334327697754, 24.735551834106445, 26.147762298583984, 27.55997085571289, 28.97218132019043, 30.38439178466797, 31.796600341796875, 33.20880889892578, 34.62101745605469, 36.03322982788086, 37.445438385009766, 38.85764694213867, 40.269859313964844, 41.68206787109375, 43.094276428222656, 44.50648880004883]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 3.0, 8.0, 6.0, 10.0, 10.0, 15.0, 24.0, 21.0, 15.0, 27.0, 23.0, 23.0, 29.0, 32.0, 48.0, 55.0, 133.0, 135.0, 66.0, 28.0, 35.0, 36.0, 21.0, 36.0, 25.0, 19.0, 12.0, 21.0, 13.0, 15.0, 11.0, 9.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.195968627929688, -30.15711212158203, -29.118255615234375, -28.07939910888672, -27.04054069519043, -26.001684188842773, -24.962827682495117, -23.92397117614746, -22.885112762451172, -21.846256256103516, -20.80739974975586, -19.768543243408203, -18.729684829711914, -17.690828323364258, -16.6519718170166, -15.613115310668945, -14.574258804321289, -13.535402297973633, -12.49654483795166, -11.457688331604004, -10.418830871582031, -9.379974365234375, -8.341117858886719, -7.302260875701904, -6.26340389251709, -5.224546909332275, -4.185689926147461, -3.1468334197998047, -2.1079764366149902, -1.0691194534301758, -0.03026294708251953, 1.008594036102295, 2.0474510192871094, 3.086308002471924, 4.125164985656738, 5.1640214920043945, 6.202878475189209, 7.241735458374023, 8.28059196472168, 9.319448471069336, 10.358305931091309, 11.397162437438965, 12.436019897460938, 13.474876403808594, 14.51373291015625, 15.552590370178223, 16.591445922851562, 17.63030433654785, 18.669160842895508, 19.708017349243164, 20.74687385559082, 21.78573226928711, 22.824588775634766, 23.863445281982422, 24.902301788330078, 25.941158294677734, 26.98001480102539, 28.018871307373047, 29.057727813720703, 30.09658432006836, 31.13544273376465, 32.17430114746094, 33.213157653808594, 34.25201416015625, 35.290870666503906]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 3.0, 21.0, 26.0, 29.0, 55.0, 78.0, 101.0, 174.0, 277.0, 481.0, 812.0, 1299.0, 2380.0, 4850.0, 10510.0, 27754.0, 95142.0, 383526.0, 1332801.0, 1614825.0, 529736.0, 127925.0, 35782.0, 13186.0, 5728.0, 2894.0, 1571.0, 883.0, 507.0, 308.0, 196.0, 131.0, 89.0, 61.0, 38.0, 28.0, 16.0, 16.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9140625, -2.820404052734375, -2.72674560546875, -2.633087158203125, -2.5394287109375, -2.445770263671875, -2.35211181640625, -2.258453369140625, -2.164794921875, -2.071136474609375, -1.97747802734375, -1.883819580078125, -1.7901611328125, -1.696502685546875, -1.60284423828125, -1.509185791015625, -1.41552734375, -1.321868896484375, -1.22821044921875, -1.134552001953125, -1.0408935546875, -0.947235107421875, -0.85357666015625, -0.759918212890625, -0.666259765625, -0.572601318359375, -0.47894287109375, -0.385284423828125, -0.2916259765625, -0.197967529296875, -0.10430908203125, -0.010650634765625, 0.0830078125, 0.176666259765625, 0.27032470703125, 0.363983154296875, 0.4576416015625, 0.551300048828125, 0.64495849609375, 0.738616943359375, 0.832275390625, 0.925933837890625, 1.01959228515625, 1.113250732421875, 1.2069091796875, 1.300567626953125, 1.39422607421875, 1.487884521484375, 1.58154296875, 1.675201416015625, 1.76885986328125, 1.862518310546875, 1.9561767578125, 2.049835205078125, 2.14349365234375, 2.237152099609375, 2.330810546875, 2.424468994140625, 2.51812744140625, 2.611785888671875, 2.7054443359375, 2.799102783203125, 2.89276123046875, 2.986419677734375, 3.080078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 13.0, 7.0, 9.0, 9.0, 12.0, 7.0, 13.0, 17.0, 16.0, 32.0, 22.0, 25.0, 31.0, 25.0, 37.0, 35.0, 47.0, 38.0, 38.0, 48.0, 40.0, 44.0, 43.0, 39.0, 37.0, 39.0, 31.0, 33.0, 24.0, 24.0, 28.0, 22.0, 24.0, 16.0, 13.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.943359375, -1.88494873046875, -1.8265380859375, -1.76812744140625, -1.709716796875, -1.65130615234375, -1.5928955078125, -1.53448486328125, -1.47607421875, -1.41766357421875, -1.3592529296875, -1.30084228515625, -1.242431640625, -1.18402099609375, -1.1256103515625, -1.06719970703125, -1.0087890625, -0.95037841796875, -0.8919677734375, -0.83355712890625, -0.775146484375, -0.71673583984375, -0.6583251953125, -0.59991455078125, -0.54150390625, -0.48309326171875, -0.4246826171875, -0.36627197265625, -0.307861328125, -0.24945068359375, -0.1910400390625, -0.13262939453125, -0.07421875, -0.01580810546875, 0.0426025390625, 0.10101318359375, 0.159423828125, 0.21783447265625, 0.2762451171875, 0.33465576171875, 0.39306640625, 0.45147705078125, 0.5098876953125, 0.56829833984375, 0.626708984375, 0.68511962890625, 0.7435302734375, 0.80194091796875, 0.8603515625, 0.91876220703125, 0.9771728515625, 1.03558349609375, 1.093994140625, 1.15240478515625, 1.2108154296875, 1.26922607421875, 1.32763671875, 1.38604736328125, 1.4444580078125, 1.50286865234375, 1.561279296875, 1.61968994140625, 1.6781005859375, 1.73651123046875, 1.794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 22.0, 45.0, 58.0, 114.0, 208.0, 454.0, 936.0, 2825.0, 25174.0, 3959434.0, 196293.0, 5979.0, 1499.0, 559.0, 296.0, 165.0, 97.0, 34.0, 35.0, 15.0, 12.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.783935546875, -13.28662109375, -12.789306640625, -12.2919921875, -11.794677734375, -11.29736328125, -10.800048828125, -10.302734375, -9.805419921875, -9.30810546875, -8.810791015625, -8.3134765625, -7.816162109375, -7.31884765625, -6.821533203125, -6.32421875, -5.826904296875, -5.32958984375, -4.832275390625, -4.3349609375, -3.837646484375, -3.34033203125, -2.843017578125, -2.345703125, -1.848388671875, -1.35107421875, -0.853759765625, -0.3564453125, 0.140869140625, 0.63818359375, 1.135498046875, 1.6328125, 2.130126953125, 2.62744140625, 3.124755859375, 3.6220703125, 4.119384765625, 4.61669921875, 5.114013671875, 5.611328125, 6.108642578125, 6.60595703125, 7.103271484375, 7.6005859375, 8.097900390625, 8.59521484375, 9.092529296875, 9.58984375, 10.087158203125, 10.58447265625, 11.081787109375, 11.5791015625, 12.076416015625, 12.57373046875, 13.071044921875, 13.568359375, 14.065673828125, 14.56298828125, 15.060302734375, 15.5576171875, 16.054931640625, 16.55224609375, 17.049560546875, 17.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 20.0, 24.0, 37.0, 64.0, 90.0, 105.0, 152.0, 237.0, 340.0, 506.0, 637.0, 580.0, 378.0, 282.0, 186.0, 126.0, 95.0, 69.0, 47.0, 23.0, 17.0, 22.0, 10.0, 5.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-10.453125, -10.2135009765625, -9.973876953125, -9.7342529296875, -9.49462890625, -9.2550048828125, -9.015380859375, -8.7757568359375, -8.5361328125, -8.2965087890625, -8.056884765625, -7.8172607421875, -7.57763671875, -7.3380126953125, -7.098388671875, -6.8587646484375, -6.619140625, -6.3795166015625, -6.139892578125, -5.9002685546875, -5.66064453125, -5.4210205078125, -5.181396484375, -4.9417724609375, -4.7021484375, -4.4625244140625, -4.222900390625, -3.9832763671875, -3.74365234375, -3.5040283203125, -3.264404296875, -3.0247802734375, -2.78515625, -2.5455322265625, -2.305908203125, -2.0662841796875, -1.82666015625, -1.5870361328125, -1.347412109375, -1.1077880859375, -0.8681640625, -0.6285400390625, -0.388916015625, -0.1492919921875, 0.09033203125, 0.3299560546875, 0.569580078125, 0.8092041015625, 1.048828125, 1.2884521484375, 1.528076171875, 1.7677001953125, 2.00732421875, 2.2469482421875, 2.486572265625, 2.7261962890625, 2.9658203125, 3.2054443359375, 3.445068359375, 3.6846923828125, 3.92431640625, 4.1639404296875, 4.403564453125, 4.6431884765625, 4.8828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 13.0, 20.0, 21.0, 53.0, 88.0, 122.0, 175.0, 156.0, 108.0, 73.0, 43.0, 18.0, 24.0, 15.0, 6.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-67.07365417480469, -65.02252960205078, -62.97140884399414, -60.9202880859375, -58.869163513183594, -56.81804275512695, -54.76692199707031, -52.715797424316406, -50.6646728515625, -48.61355209350586, -46.56242752075195, -44.51130676269531, -42.460182189941406, -40.409061431884766, -38.357940673828125, -36.30681610107422, -34.25569534301758, -32.20457458496094, -30.15345001220703, -28.10232925415039, -26.051204681396484, -24.000083923339844, -21.94896125793457, -19.897838592529297, -17.846715927124023, -15.79559326171875, -13.744470596313477, -11.69334888458252, -9.642226219177246, -7.591103553771973, -5.539981842041016, -3.488859176635742, -1.4377365112304688, 0.6133859157562256, 2.66450834274292, 4.715630531311035, 6.766753196716309, 8.817875862121582, 10.868997573852539, 12.920120239257812, 14.971242904663086, 17.02236557006836, 19.073488235473633, 21.124610900878906, 23.175731658935547, 25.226856231689453, 27.277976989746094, 29.329099655151367, 31.38022232055664, 33.43134307861328, 35.48246765136719, 37.53358840942383, 39.584712982177734, 41.635833740234375, 43.68695831298828, 45.73807907104492, 47.78919982910156, 49.8403205871582, 51.89144515991211, 53.94256591796875, 55.993690490722656, 58.0448112487793, 60.09593200683594, 62.147056579589844, 64.19818115234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 12.0, 10.0, 11.0, 19.0, 19.0, 15.0, 18.0, 28.0, 25.0, 25.0, 39.0, 55.0, 58.0, 42.0, 53.0, 54.0, 64.0, 56.0, 63.0, 41.0, 40.0, 47.0, 31.0, 23.0, 26.0, 32.0, 13.0, 11.0, 15.0, 10.0, 6.0, 4.0, 7.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.854557037353516, -43.54741668701172, -42.24028015136719, -40.93313980102539, -39.625999450683594, -38.31886291503906, -37.011722564697266, -35.70458221435547, -34.39744567871094, -33.09030532836914, -31.783166885375977, -30.476028442382812, -29.168888092041016, -27.86174964904785, -26.554611206054688, -25.24747085571289, -23.940330505371094, -22.63319206237793, -21.326051712036133, -20.01891326904297, -18.711772918701172, -17.404634475708008, -16.097496032714844, -14.790356636047363, -13.483217239379883, -12.176077842712402, -10.868938446044922, -9.561800003051758, -8.254660606384277, -6.947521209716797, -5.640382289886475, -4.333243370056152, -3.0261001586914062, -1.7189610004425049, -0.4118218421936035, 0.8953173160552979, 2.202456474304199, 3.5095958709716797, 4.816734790802002, 6.123873710632324, 7.431013107299805, 8.738152503967285, 10.045291900634766, 11.35243034362793, 12.65956974029541, 13.96670913696289, 15.273847579956055, 16.58098602294922, 17.888126373291016, 19.19526481628418, 20.502405166625977, 21.80954360961914, 23.116683959960938, 24.4238224029541, 25.730960845947266, 27.038101196289062, 28.345239639282227, 29.65237808227539, 30.959518432617188, 32.266658782958984, 33.573795318603516, 34.88093566894531, 36.18807601928711, 37.49521255493164, 38.80235290527344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 8.0, 11.0, 12.0, 14.0, 23.0, 43.0, 79.0, 113.0, 212.0, 314.0, 591.0, 1104.0, 2322.0, 5043.0, 12389.0, 34646.0, 120766.0, 569686.0, 215846.0, 54258.0, 17849.0, 6874.0, 3090.0, 1458.0, 780.0, 415.0, 241.0, 146.0, 82.0, 54.0, 29.0, 22.0, 14.0, 12.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18133544921875, -5.0228271484375, -4.86431884765625, -4.705810546875, -4.54730224609375, -4.3887939453125, -4.23028564453125, -4.07177734375, -3.91326904296875, -3.7547607421875, -3.59625244140625, -3.437744140625, -3.27923583984375, -3.1207275390625, -2.96221923828125, -2.8037109375, -2.64520263671875, -2.4866943359375, -2.32818603515625, -2.169677734375, -2.01116943359375, -1.8526611328125, -1.69415283203125, -1.53564453125, -1.37713623046875, -1.2186279296875, -1.06011962890625, -0.901611328125, -0.74310302734375, -0.5845947265625, -0.42608642578125, -0.267578125, -0.10906982421875, 0.0494384765625, 0.20794677734375, 0.366455078125, 0.52496337890625, 0.6834716796875, 0.84197998046875, 1.00048828125, 1.15899658203125, 1.3175048828125, 1.47601318359375, 1.634521484375, 1.79302978515625, 1.9515380859375, 2.11004638671875, 2.2685546875, 2.42706298828125, 2.5855712890625, 2.74407958984375, 2.902587890625, 3.06109619140625, 3.2196044921875, 3.37811279296875, 3.53662109375, 3.69512939453125, 3.8536376953125, 4.01214599609375, 4.170654296875, 4.32916259765625, 4.4876708984375, 4.64617919921875, 4.8046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 7.0, 17.0, 14.0, 8.0, 12.0, 16.0, 23.0, 16.0, 22.0, 24.0, 23.0, 41.0, 44.0, 35.0, 37.0, 43.0, 53.0, 36.0, 45.0, 46.0, 49.0, 41.0, 39.0, 42.0, 43.0, 26.0, 23.0, 26.0, 30.0, 9.0, 24.0, 17.0, 15.0, 12.0, 11.0, 6.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.086273193359375, -2.01239013671875, -1.938507080078125, -1.8646240234375, -1.790740966796875, -1.71685791015625, -1.642974853515625, -1.569091796875, -1.495208740234375, -1.42132568359375, -1.347442626953125, -1.2735595703125, -1.199676513671875, -1.12579345703125, -1.051910400390625, -0.97802734375, -0.904144287109375, -0.83026123046875, -0.756378173828125, -0.6824951171875, -0.608612060546875, -0.53472900390625, -0.460845947265625, -0.386962890625, -0.313079833984375, -0.23919677734375, -0.165313720703125, -0.0914306640625, -0.017547607421875, 0.05633544921875, 0.130218505859375, 0.2041015625, 0.277984619140625, 0.35186767578125, 0.425750732421875, 0.4996337890625, 0.573516845703125, 0.64739990234375, 0.721282958984375, 0.795166015625, 0.869049072265625, 0.94293212890625, 1.016815185546875, 1.0906982421875, 1.164581298828125, 1.23846435546875, 1.312347412109375, 1.38623046875, 1.460113525390625, 1.53399658203125, 1.607879638671875, 1.6817626953125, 1.755645751953125, 1.82952880859375, 1.903411865234375, 1.977294921875, 2.051177978515625, 2.12506103515625, 2.198944091796875, 2.2728271484375, 2.346710205078125, 2.42059326171875, 2.494476318359375, 2.568359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 11.0, 7.0, 11.0, 26.0, 20.0, 25.0, 64.0, 72.0, 120.0, 195.0, 292.0, 561.0, 1099.0, 2767.0, 11548.0, 84094.0, 885827.0, 49238.0, 8111.0, 2257.0, 948.0, 479.0, 278.0, 149.0, 108.0, 84.0, 49.0, 31.0, 30.0, 14.0, 19.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.35516357421875, -7.1048583984375, -6.85455322265625, -6.604248046875, -6.35394287109375, -6.1036376953125, -5.85333251953125, -5.60302734375, -5.35272216796875, -5.1024169921875, -4.85211181640625, -4.601806640625, -4.35150146484375, -4.1011962890625, -3.85089111328125, -3.6005859375, -3.35028076171875, -3.0999755859375, -2.84967041015625, -2.599365234375, -2.34906005859375, -2.0987548828125, -1.84844970703125, -1.59814453125, -1.34783935546875, -1.0975341796875, -0.84722900390625, -0.596923828125, -0.34661865234375, -0.0963134765625, 0.15399169921875, 0.404296875, 0.65460205078125, 0.9049072265625, 1.15521240234375, 1.405517578125, 1.65582275390625, 1.9061279296875, 2.15643310546875, 2.40673828125, 2.65704345703125, 2.9073486328125, 3.15765380859375, 3.407958984375, 3.65826416015625, 3.9085693359375, 4.15887451171875, 4.4091796875, 4.65948486328125, 4.9097900390625, 5.16009521484375, 5.410400390625, 5.66070556640625, 5.9110107421875, 6.16131591796875, 6.41162109375, 6.66192626953125, 6.9122314453125, 7.16253662109375, 7.412841796875, 7.66314697265625, 7.9134521484375, 8.16375732421875, 8.4140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 9.0, 9.0, 12.0, 18.0, 10.0, 23.0, 17.0, 26.0, 22.0, 26.0, 32.0, 43.0, 48.0, 66.0, 76.0, 74.0, 60.0, 61.0, 42.0, 51.0, 40.0, 31.0, 29.0, 17.0, 14.0, 21.0, 11.0, 15.0, 7.0, 11.0, 13.0, 11.0, 5.0, 8.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0234375, -9.7225341796875, -9.421630859375, -9.1207275390625, -8.81982421875, -8.5189208984375, -8.218017578125, -7.9171142578125, -7.6162109375, -7.3153076171875, -7.014404296875, -6.7135009765625, -6.41259765625, -6.1116943359375, -5.810791015625, -5.5098876953125, -5.208984375, -4.9080810546875, -4.607177734375, -4.3062744140625, -4.00537109375, -3.7044677734375, -3.403564453125, -3.1026611328125, -2.8017578125, -2.5008544921875, -2.199951171875, -1.8990478515625, -1.59814453125, -1.2972412109375, -0.996337890625, -0.6954345703125, -0.39453125, -0.0936279296875, 0.207275390625, 0.5081787109375, 0.80908203125, 1.1099853515625, 1.410888671875, 1.7117919921875, 2.0126953125, 2.3135986328125, 2.614501953125, 2.9154052734375, 3.21630859375, 3.5172119140625, 3.818115234375, 4.1190185546875, 4.419921875, 4.7208251953125, 5.021728515625, 5.3226318359375, 5.62353515625, 5.9244384765625, 6.225341796875, 6.5262451171875, 6.8271484375, 7.1280517578125, 7.428955078125, 7.7298583984375, 8.03076171875, 8.3316650390625, 8.632568359375, 8.9334716796875, 9.234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 7.0, 4.0, 6.0, 14.0, 21.0, 20.0, 31.0, 47.0, 62.0, 100.0, 149.0, 296.0, 593.0, 1495.0, 4643.0, 20921.0, 764538.0, 231114.0, 17682.0, 4120.0, 1402.0, 589.0, 261.0, 149.0, 79.0, 55.0, 39.0, 30.0, 23.0, 25.0, 9.0, 11.0, 4.0, 5.0, 6.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.644378662109375, -1.58758544921875, -1.530792236328125, -1.4739990234375, -1.417205810546875, -1.36041259765625, -1.303619384765625, -1.246826171875, -1.190032958984375, -1.13323974609375, -1.076446533203125, -1.0196533203125, -0.962860107421875, -0.90606689453125, -0.849273681640625, -0.79248046875, -0.735687255859375, -0.67889404296875, -0.622100830078125, -0.5653076171875, -0.508514404296875, -0.45172119140625, -0.394927978515625, -0.338134765625, -0.281341552734375, -0.22454833984375, -0.167755126953125, -0.1109619140625, -0.054168701171875, 0.00262451171875, 0.059417724609375, 0.1162109375, 0.173004150390625, 0.22979736328125, 0.286590576171875, 0.3433837890625, 0.400177001953125, 0.45697021484375, 0.513763427734375, 0.570556640625, 0.627349853515625, 0.68414306640625, 0.740936279296875, 0.7977294921875, 0.854522705078125, 0.91131591796875, 0.968109130859375, 1.02490234375, 1.081695556640625, 1.13848876953125, 1.195281982421875, 1.2520751953125, 1.308868408203125, 1.36566162109375, 1.422454833984375, 1.479248046875, 1.536041259765625, 1.59283447265625, 1.649627685546875, 1.7064208984375, 1.763214111328125, 1.82000732421875, 1.876800537109375, 1.93359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 9.0, 14.0, 12.0, 13.0, 28.0, 22.0, 45.0, 68.0, 82.0, 114.0, 135.0, 107.0, 76.0, 60.0, 43.0, 25.0, 23.0, 17.0, 13.0, 12.0, 4.0, 6.0, 5.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.000461578369140625, -0.00044780224561691284, -0.0004340261220932007, -0.0004202499985694885, -0.00040647387504577637, -0.0003926977515220642, -0.00037892162799835205, -0.0003651455044746399, -0.00035136938095092773, -0.0003375932574272156, -0.0003238171339035034, -0.00031004101037979126, -0.0002962648868560791, -0.00028248876333236694, -0.0002687126398086548, -0.0002549365162849426, -0.00024116039276123047, -0.0002273842692375183, -0.00021360814571380615, -0.000199832022190094, -0.00018605589866638184, -0.00017227977514266968, -0.00015850365161895752, -0.00014472752809524536, -0.0001309514045715332, -0.00011717528104782104, -0.00010339915752410889, -8.962303400039673e-05, -7.584691047668457e-05, -6.207078695297241e-05, -4.8294663429260254e-05, -3.4518539905548096e-05, -2.0742416381835938e-05, -6.966292858123779e-06, 6.809830665588379e-06, 2.0585954189300537e-05, 3.4362077713012695e-05, 4.8138201236724854e-05, 6.191432476043701e-05, 7.569044828414917e-05, 8.946657180786133e-05, 0.00010324269533157349, 0.00011701881885528564, 0.0001307949423789978, 0.00014457106590270996, 0.00015834718942642212, 0.00017212331295013428, 0.00018589943647384644, 0.0001996755599975586, 0.00021345168352127075, 0.0002272278070449829, 0.00024100393056869507, 0.0002547800540924072, 0.0002685561776161194, 0.00028233230113983154, 0.0002961084246635437, 0.00030988454818725586, 0.000323660671710968, 0.0003374367952346802, 0.00035121291875839233, 0.0003649890422821045, 0.00037876516580581665, 0.0003925412893295288, 0.00040631741285324097, 0.0004200935363769531]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 11.0, 11.0, 10.0, 26.0, 24.0, 39.0, 57.0, 84.0, 100.0, 142.0, 248.0, 404.0, 692.0, 1487.0, 3199.0, 8551.0, 32971.0, 743219.0, 217853.0, 26394.0, 7138.0, 2792.0, 1268.0, 695.0, 383.0, 248.0, 143.0, 103.0, 75.0, 42.0, 28.0, 31.0, 23.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.2255859375, -1.1914749145507812, -1.1573638916015625, -1.1232528686523438, -1.089141845703125, -1.0550308227539062, -1.0209197998046875, -0.9868087768554688, -0.95269775390625, -0.9185867309570312, -0.8844757080078125, -0.8503646850585938, -0.816253662109375, -0.7821426391601562, -0.7480316162109375, -0.7139205932617188, -0.6798095703125, -0.6456985473632812, -0.6115875244140625, -0.5774765014648438, -0.543365478515625, -0.5092544555664062, -0.4751434326171875, -0.44103240966796875, -0.40692138671875, -0.37281036376953125, -0.3386993408203125, -0.30458831787109375, -0.270477294921875, -0.23636627197265625, -0.2022552490234375, -0.16814422607421875, -0.134033203125, -0.09992218017578125, -0.0658111572265625, -0.03170013427734375, 0.002410888671875, 0.03652191162109375, 0.0706329345703125, 0.10474395751953125, 0.13885498046875, 0.17296600341796875, 0.2070770263671875, 0.24118804931640625, 0.275299072265625, 0.30941009521484375, 0.3435211181640625, 0.37763214111328125, 0.4117431640625, 0.44585418701171875, 0.4799652099609375, 0.5140762329101562, 0.548187255859375, 0.5822982788085938, 0.6164093017578125, 0.6505203247070312, 0.68463134765625, 0.7187423706054688, 0.7528533935546875, 0.7869644165039062, 0.821075439453125, 0.8551864624023438, 0.8892974853515625, 0.9234085083007812, 0.95751953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 8.0, 4.0, 9.0, 8.0, 12.0, 18.0, 21.0, 36.0, 30.0, 43.0, 45.0, 66.0, 104.0, 101.0, 90.0, 90.0, 53.0, 53.0, 33.0, 25.0, 22.0, 20.0, 13.0, 11.0, 10.0, 7.0, 10.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0810546875, -1.0492324829101562, -1.0174102783203125, -0.9855880737304688, -0.953765869140625, -0.9219436645507812, -0.8901214599609375, -0.8582992553710938, -0.82647705078125, -0.7946548461914062, -0.7628326416015625, -0.7310104370117188, -0.699188232421875, -0.6673660278320312, -0.6355438232421875, -0.6037216186523438, -0.5718994140625, -0.5400772094726562, -0.5082550048828125, -0.47643280029296875, -0.444610595703125, -0.41278839111328125, -0.3809661865234375, -0.34914398193359375, -0.31732177734375, -0.28549957275390625, -0.2536773681640625, -0.22185516357421875, -0.190032958984375, -0.15821075439453125, -0.1263885498046875, -0.09456634521484375, -0.062744140625, -0.03092193603515625, 0.0009002685546875, 0.03272247314453125, 0.064544677734375, 0.09636688232421875, 0.1281890869140625, 0.16001129150390625, 0.19183349609375, 0.22365570068359375, 0.2554779052734375, 0.28730010986328125, 0.319122314453125, 0.35094451904296875, 0.3827667236328125, 0.41458892822265625, 0.4464111328125, 0.47823333740234375, 0.5100555419921875, 0.5418777465820312, 0.573699951171875, 0.6055221557617188, 0.6373443603515625, 0.6691665649414062, 0.70098876953125, 0.7328109741210938, 0.7646331787109375, 0.7964553833007812, 0.828277587890625, 0.8600997924804688, 0.8919219970703125, 0.9237442016601562, 0.95556640625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 4.0, 25.0, 36.0, 73.0, 130.0, 519.0, 94.0, 49.0, 37.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.2357177734375, -78.34186553955078, -76.44800567626953, -74.55415344238281, -72.66029357910156, -70.76644134521484, -68.87258911132812, -66.97872924804688, -65.08487701416016, -63.19102096557617, -61.29716491699219, -59.40331268310547, -57.509456634521484, -55.6156005859375, -53.72174835205078, -51.8278923034668, -49.93403625488281, -48.04018020629883, -46.146324157714844, -44.252471923828125, -42.35861587524414, -40.464759826660156, -38.57090759277344, -36.67705154418945, -34.78319549560547, -32.889339447021484, -30.995485305786133, -29.10163116455078, -27.207775115966797, -25.313919067382812, -23.42006492614746, -21.52621078491211, -19.632354736328125, -17.73849868774414, -15.844644546508789, -13.950789451599121, -12.056934356689453, -10.163079261779785, -8.269224166870117, -6.375369071960449, -4.481513977050781, -2.5876588821411133, -0.6938037872314453, 1.2000513076782227, 3.0939064025878906, 4.987761497497559, 6.881616592407227, 8.775471687316895, 10.669326782226562, 12.56318187713623, 14.457036972045898, 16.35089111328125, 18.244747161865234, 20.13860321044922, 22.03245735168457, 23.926311492919922, 25.820167541503906, 27.71402359008789, 29.607877731323242, 31.501731872558594, 33.39558792114258, 35.28944396972656, 37.18329620361328, 39.077152252197266, 40.97100830078125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 7.0, 11.0, 8.0, 15.0, 11.0, 24.0, 29.0, 28.0, 43.0, 34.0, 110.0, 374.0, 62.0, 32.0, 29.0, 30.0, 32.0, 29.0, 14.0, 12.0, 14.0, 15.0, 13.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.86162185668945, -51.583953857421875, -50.30628204345703, -49.02861404418945, -47.75094223022461, -46.47327423095703, -45.19560241699219, -43.91793441772461, -42.64026641845703, -41.36259841918945, -40.08492660522461, -38.80725860595703, -37.52958679199219, -36.25191879272461, -34.974246978759766, -33.69657897949219, -32.418907165527344, -31.141237258911133, -29.863567352294922, -28.58589744567871, -27.3082275390625, -26.030559539794922, -24.75288963317871, -23.4752197265625, -22.19754981994629, -20.919879913330078, -19.642210006713867, -18.364540100097656, -17.086872100830078, -15.80920124053955, -14.531532287597656, -13.253862380981445, -11.976188659667969, -10.698518753051758, -9.420848846435547, -8.143179893493652, -6.865509986877441, -5.5878400802612305, -4.310170650482178, -3.032501220703125, -1.754831314086914, -0.4771616458892822, 0.8005080223083496, 2.0781776905059814, 3.3558473587036133, 4.633517265319824, 5.911186695098877, 7.18885612487793, 8.46652603149414, 9.744195938110352, 11.021865844726562, 12.299534797668457, 13.577204704284668, 14.854874610900879, 16.132543563842773, 17.410213470458984, 18.687883377075195, 19.965553283691406, 21.243223190307617, 22.520893096923828, 23.798561096191406, 25.07623291015625, 26.353900909423828, 27.63157081604004, 28.90924072265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 12.0, 12.0, 14.0, 16.0, 13.0, 26.0, 17.0, 25.0, 35.0, 31.0, 64.0, 123.0, 210.0, 85.0, 45.0, 38.0, 35.0, 23.0, 27.0, 14.0, 18.0, 14.0, 15.0, 13.0, 12.0, 12.0, 9.0, 3.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.350067138671875, -2.27239990234375, -2.194732666015625, -2.1170654296875, -2.039398193359375, -1.96173095703125, -1.884063720703125, -1.806396484375, -1.728729248046875, -1.65106201171875, -1.573394775390625, -1.4957275390625, -1.418060302734375, -1.34039306640625, -1.262725830078125, -1.18505859375, -1.107391357421875, -1.02972412109375, -0.952056884765625, -0.8743896484375, -0.796722412109375, -0.71905517578125, -0.641387939453125, -0.563720703125, -0.486053466796875, -0.40838623046875, -0.330718994140625, -0.2530517578125, -0.175384521484375, -0.09771728515625, -0.020050048828125, 0.0576171875, 0.135284423828125, 0.21295166015625, 0.290618896484375, 0.3682861328125, 0.445953369140625, 0.52362060546875, 0.601287841796875, 0.678955078125, 0.756622314453125, 0.83428955078125, 0.911956787109375, 0.9896240234375, 1.067291259765625, 1.14495849609375, 1.222625732421875, 1.30029296875, 1.377960205078125, 1.45562744140625, 1.533294677734375, 1.6109619140625, 1.688629150390625, 1.76629638671875, 1.843963623046875, 1.921630859375, 1.999298095703125, 2.07696533203125, 2.154632568359375, 2.2322998046875, 2.309967041015625, 2.38763427734375, 2.465301513671875, 2.54296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 7.0, 10.0, 17.0, 20.0, 22.0, 33.0, 53.0, 62.0, 115.0, 209.0, 456.0, 953.0, 2562.0, 9164.0, 8181894.0, 181542.0, 7312.0, 2254.0, 856.0, 410.0, 202.0, 139.0, 62.0, 48.0, 38.0, 26.0, 18.0, 10.0, 14.0, 8.0, 10.0, 11.0, 4.0, 7.0, 7.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-17.026226043701172, -16.416513442993164, -15.80679988861084, -15.197086334228516, -14.587372779846191, -13.977659225463867, -13.36794662475586, -12.758233070373535, -12.148519515991211, -11.538805961608887, -10.929093360900879, -10.319379806518555, -9.70966625213623, -9.099952697753906, -8.490240097045898, -7.880526542663574, -7.270813941955566, -6.6611008644104, -6.051387310028076, -5.44167423248291, -4.831960678100586, -4.22224760055542, -3.612534523010254, -3.0028209686279297, -2.3931078910827637, -1.7833945751190186, -1.173681378364563, -0.5639681816101074, 0.045745134353637695, 0.6554584503173828, 1.2651715278625488, 1.874885082244873, 2.484598159790039, 3.094311475753784, 3.7040247917175293, 4.313737869262695, 4.9234514236450195, 5.5331645011901855, 6.142877578735352, 6.752591133117676, 7.362304210662842, 7.972017288208008, 8.581730842590332, 9.191444396972656, 9.801156997680664, 10.410870552062988, 11.020584106445312, 11.63029670715332, 12.240010261535645, 12.849723815917969, 13.459436416625977, 14.0691499710083, 14.678863525390625, 15.288576126098633, 15.898289680480957, 16.50800323486328, 17.11771583557129, 17.727428436279297, 18.337142944335938, 18.946855545043945, 19.556568145751953, 20.166282653808594, 20.7759952545166, 21.38570785522461, 21.99542236328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.60777473449707, -11.981675148010254, -11.355575561523438, -10.729476928710938, -10.103377342224121, -9.477277755737305, -8.851179122924805, -8.225079536437988, -7.598979949951172, -6.9728803634643555, -6.346781253814697, -5.720682144165039, -5.094582557678223, -4.468482971191406, -3.842383861541748, -3.21628475189209, -2.5901851654052734, -1.9640858173370361, -1.3379864692687988, -0.7118871212005615, -0.08578777313232422, 0.5403115749359131, 1.1664109230041504, 1.7925100326538086, 2.418609619140625, 3.0447089672088623, 3.6708083152770996, 4.296907424926758, 4.923007011413574, 5.549106597900391, 6.175205707550049, 6.801304817199707, 7.427406311035156, 8.053505897521973, 8.679605484008789, 9.305704116821289, 9.931803703308105, 10.557903289794922, 11.184001922607422, 11.810101509094238, 12.436201095581055, 13.062300682067871, 13.688400268554688, 14.314498901367188, 14.940598487854004, 15.56669807434082, 16.19279670715332, 16.818897247314453, 17.444995880126953, 18.071094512939453, 18.697195053100586, 19.323293685913086, 19.94939422607422, 20.57549285888672, 21.20159149169922, 21.82769012451172, 22.45379066467285, 23.07988929748535, 23.705989837646484, 24.332088470458984, 24.958187103271484, 25.584287643432617, 26.210386276245117, 26.83648681640625, 27.46258544921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 5.0, 14.0, 15.0, 23.0, 21.0, 36.0, 34.0, 51.0, 77.0, 111.0, 179.0, 331.0, 476.0, 933.0, 1743.0, 3626.0, 7828.0, 18582.0, 47421.0, 125364.0, 182082.0, 82217.0, 30337.0, 12185.0, 5318.0, 2431.0, 1193.0, 649.0, 350.0, 211.0, 131.0, 84.0, 53.0, 40.0, 36.0, 17.0, 18.0, 13.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.6865234375, -17.138671875, -16.5908203125, -16.04296875, -15.4951171875, -14.947265625, -14.3994140625, -13.8515625, -13.3037109375, -12.755859375, -12.2080078125, -11.66015625, -11.1123046875, -10.564453125, -10.0166015625, -9.46875, -8.9208984375, -8.373046875, -7.8251953125, -7.27734375, -6.7294921875, -6.181640625, -5.6337890625, -5.0859375, -4.5380859375, -3.990234375, -3.4423828125, -2.89453125, -2.3466796875, -1.798828125, -1.2509765625, -0.703125, -0.1552734375, 0.392578125, 0.9404296875, 1.48828125, 2.0361328125, 2.583984375, 3.1318359375, 3.6796875, 4.2275390625, 4.775390625, 5.3232421875, 5.87109375, 6.4189453125, 6.966796875, 7.5146484375, 8.0625, 8.6103515625, 9.158203125, 9.7060546875, 10.25390625, 10.8017578125, 11.349609375, 11.8974609375, 12.4453125, 12.9931640625, 13.541015625, 14.0888671875, 14.63671875, 15.1845703125, 15.732421875, 16.2802734375, 16.828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 3.0, 3.0, 5.0, 13.0, 9.0, 14.0, 15.0, 12.0, 20.0, 19.0, 32.0, 34.0, 45.0, 57.0, 67.0, 63.0, 59.0, 76.0, 57.0, 66.0, 49.0, 54.0, 41.0, 36.0, 33.0, 16.0, 22.0, 14.0, 16.0, 12.0, 10.0, 7.0, 5.0, 1.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.61669921875, -2.5263671875, -2.43603515625, -2.345703125, -2.25537109375, -2.1650390625, -2.07470703125, -1.984375, -1.89404296875, -1.8037109375, -1.71337890625, -1.623046875, -1.53271484375, -1.4423828125, -1.35205078125, -1.26171875, -1.17138671875, -1.0810546875, -0.99072265625, -0.900390625, -0.81005859375, -0.7197265625, -0.62939453125, -0.5390625, -0.44873046875, -0.3583984375, -0.26806640625, -0.177734375, -0.08740234375, 0.0029296875, 0.09326171875, 0.18359375, 0.27392578125, 0.3642578125, 0.45458984375, 0.544921875, 0.63525390625, 0.7255859375, 0.81591796875, 0.90625, 0.99658203125, 1.0869140625, 1.17724609375, 1.267578125, 1.35791015625, 1.4482421875, 1.53857421875, 1.62890625, 1.71923828125, 1.8095703125, 1.89990234375, 1.990234375, 2.08056640625, 2.1708984375, 2.26123046875, 2.3515625, 2.44189453125, 2.5322265625, 2.62255859375, 2.712890625, 2.80322265625, 2.8935546875, 2.98388671875, 3.07421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 14.0, 21.0, 34.0, 87.0, 191.0, 106.0, 25.0, 9.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65459632873535, -25.014572143554688, -23.374549865722656, -21.734527587890625, -20.09450340270996, -18.454479217529297, -16.814456939697266, -15.174433708190918, -13.53441047668457, -11.894387245178223, -10.254364013671875, -8.614340782165527, -6.97431755065918, -5.334294319152832, -3.6942710876464844, -2.0542478561401367, -0.41422462463378906, 1.2257986068725586, 2.8658218383789062, 4.505845069885254, 6.145868301391602, 7.785891532897949, 9.425914764404297, 11.065937995910645, 12.705961227416992, 14.34598445892334, 15.986007690429688, 17.62602996826172, 19.266054153442383, 20.906078338623047, 22.546100616455078, 24.18612289428711, 25.826148986816406, 27.466171264648438, 29.1061954498291, 30.746219635009766, 32.3862419128418, 34.02626419067383, 35.666290283203125, 37.306312561035156, 38.94633483886719, 40.58635711669922, 42.22637939453125, 43.86640548706055, 45.50642776489258, 47.14645004272461, 48.786476135253906, 50.42649841308594, 52.06652069091797, 53.70654296875, 55.34656524658203, 56.98659133911133, 58.62661361694336, 60.26663589477539, 61.90666198730469, 63.54668426513672, 65.18670654296875, 66.82672882080078, 68.46675109863281, 70.10677337646484, 71.74679565429688, 73.38682556152344, 75.02684783935547, 76.6668701171875, 78.30689239501953]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 4.0, 8.0, 1.0, 4.0, 7.0, 4.0, 6.0, 15.0, 34.0, 73.0, 104.0, 92.0, 59.0, 22.0, 7.0, 9.0, 7.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.888593673706055, -20.272724151611328, -19.6568546295166, -19.040985107421875, -18.42511558532715, -17.809246063232422, -17.193376541137695, -16.57750701904297, -15.961638450622559, -15.345768928527832, -14.729899406433105, -14.114029884338379, -13.498161315917969, -12.882291793823242, -12.266422271728516, -11.650552749633789, -11.034683227539062, -10.418813705444336, -9.80294418334961, -9.187074661254883, -8.571205139160156, -7.955336093902588, -7.3394670486450195, -6.723597526550293, -6.107728004455566, -5.49185848236084, -4.875988960266113, -4.260119915008545, -3.6442503929138184, -3.028380870819092, -2.4125115871429443, -1.7966423034667969, -1.1807708740234375, -0.5649014711380005, 0.05096793174743652, 0.6668373346328735, 1.2827067375183105, 1.898576259613037, 2.5144455432891846, 3.130314826965332, 3.7461843490600586, 4.362053871154785, 4.977923393249512, 5.59379243850708, 6.209661960601807, 6.825531482696533, 7.441400527954102, 8.057270050048828, 8.673139572143555, 9.289009094238281, 9.904878616333008, 10.520748138427734, 11.136617660522461, 11.752487182617188, 12.368355751037598, 12.984225273132324, 13.60009479522705, 14.215964317321777, 14.831833839416504, 15.44770336151123, 16.06357192993164, 16.679441452026367, 17.295310974121094, 17.91118049621582, 18.527050018310547]}, "eval/loss": 4.170833587646484, "eval/wer": 1.9509520031733438, "eval/runtime": 786.0537, "eval/samples_per_second": 3.361, "eval/steps_per_second": 0.281} \ No newline at end of file +{"train/loss": 4.3369, "train/learning_rate": 9.574468085106382e-07, "train/epoch": 1.0, "train/global_step": 594, "_runtime": 5680, "_timestamp": 1646136607, "_step": 595, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 67.0, 918.0, 32.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.59164047241211, -13.245392799377441, -7.899145126342773, -2.552898406982422, 2.7933502197265625, 8.139598846435547, 13.485843658447266, 18.83209228515625, 24.178340911865234, 29.52458953857422, 34.87083435058594, 40.21708297729492, 45.563331604003906, 50.90958023071289, 56.25582504272461, 61.602073669433594, 66.94831848144531, 72.29456329345703, 77.64081573486328, 82.987060546875, 88.33331298828125, 93.67955780029297, 99.02580261230469, 104.37205505371094, 109.71830749511719, 115.0645523071289, 120.41080474853516, 125.75704956054688, 131.10330200195312, 136.44955444335938, 141.79579162597656, 147.1420440673828, 152.48828125, 157.83453369140625, 163.18077087402344, 168.5270233154297, 173.87327575683594, 179.21951293945312, 184.56576538085938, 189.91201782226562, 195.25827026367188, 200.60452270507812, 205.9507598876953, 211.29701232910156, 216.6432647705078, 221.989501953125, 227.33575439453125, 232.6820068359375, 238.0282440185547, 243.37449645996094, 248.72073364257812, 254.06698608398438, 259.4132385253906, 264.7594909667969, 270.105712890625, 275.45196533203125, 280.7982177734375, 286.14447021484375, 291.49072265625, 296.83697509765625, 302.1831970214844, 307.5294494628906, 312.8757019042969, 318.2219543457031, 323.5682067871094]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 5.0, 5.0, 10.0, 13.0, 15.0, 20.0, 21.0, 21.0, 34.0, 28.0, 40.0, 38.0, 47.0, 43.0, 55.0, 39.0, 62.0, 57.0, 49.0, 51.0, 52.0, 53.0, 40.0, 29.0, 31.0, 24.0, 25.0, 24.0, 19.0, 10.0, 10.0, 9.0, 5.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.58059310913086, -23.754621505737305, -22.92864990234375, -22.102678298950195, -21.27670669555664, -20.450735092163086, -19.62476348876953, -18.798791885375977, -17.972820281982422, -17.146848678588867, -16.320877075195312, -15.494905471801758, -14.668933868408203, -13.842962265014648, -13.016990661621094, -12.191019058227539, -11.3650484085083, -10.539076805114746, -9.713105201721191, -8.887133598327637, -8.061161994934082, -7.2351908683776855, -6.409219264984131, -5.583247661590576, -4.7572760581970215, -3.931304454803467, -3.105332851409912, -2.2793614864349365, -1.4533898830413818, -0.6274185180664062, 0.19855308532714844, 1.0245246887207031, 1.8504962921142578, 2.6764678955078125, 3.502439498901367, 4.328411102294922, 5.154382705688477, 5.980353832244873, 6.806325435638428, 7.632297039031982, 8.458269119262695, 9.28424072265625, 10.110212326049805, 10.93618392944336, 11.762155532836914, 12.588127136230469, 13.414098739624023, 14.240070343017578, 15.066040992736816, 15.892012596130371, 16.71798324584961, 17.543954849243164, 18.36992645263672, 19.195898056030273, 20.021869659423828, 20.847841262817383, 21.673812866210938, 22.499784469604492, 23.325756072998047, 24.1517276763916, 24.977699279785156, 25.80367088317871, 26.629642486572266, 27.45561408996582, 28.281585693359375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 3.0, 6.0, 12.0, 16.0, 12.0, 18.0, 16.0, 26.0, 23.0, 22.0, 32.0, 33.0, 36.0, 32.0, 35.0, 44.0, 39.0, 48.0, 44.0, 33.0, 48.0, 42.0, 41.0, 36.0, 33.0, 34.0, 33.0, 37.0, 25.0, 25.0, 21.0, 26.0, 8.0, 10.0, 11.0, 12.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0830078125, -1.0488433837890625, -1.014678955078125, -0.9805145263671875, -0.94635009765625, -0.9121856689453125, -0.878021240234375, -0.8438568115234375, -0.8096923828125, -0.7755279541015625, -0.741363525390625, -0.7071990966796875, -0.67303466796875, -0.6388702392578125, -0.604705810546875, -0.5705413818359375, -0.536376953125, -0.5022125244140625, -0.468048095703125, -0.4338836669921875, -0.39971923828125, -0.3655548095703125, -0.331390380859375, -0.2972259521484375, -0.2630615234375, -0.2288970947265625, -0.194732666015625, -0.1605682373046875, -0.12640380859375, -0.0922393798828125, -0.058074951171875, -0.0239105224609375, 0.01025390625, 0.0444183349609375, 0.078582763671875, 0.1127471923828125, 0.14691162109375, 0.1810760498046875, 0.215240478515625, 0.2494049072265625, 0.2835693359375, 0.3177337646484375, 0.351898193359375, 0.3860626220703125, 0.42022705078125, 0.4543914794921875, 0.488555908203125, 0.5227203369140625, 0.556884765625, 0.5910491943359375, 0.625213623046875, 0.6593780517578125, 0.69354248046875, 0.7277069091796875, 0.761871337890625, 0.7960357666015625, 0.8302001953125, 0.8643646240234375, 0.898529052734375, 0.9326934814453125, 0.96685791015625, 1.0010223388671875, 1.035186767578125, 1.0693511962890625, 1.103515625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 3.0, 9.0, 13.0, 19.0, 24.0, 30.0, 39.0, 58.0, 73.0, 108.0, 176.0, 240.0, 336.0, 519.0, 853.0, 1507.0, 2550.0, 5584.0, 14655.0, 54536.0, 337513.0, 2318331.0, 1256090.0, 151546.0, 30755.0, 9536.0, 4005.0, 2002.0, 1127.0, 651.0, 439.0, 283.0, 214.0, 145.0, 87.0, 61.0, 36.0, 31.0, 21.0, 21.0, 11.0, 9.0, 8.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.21484375, -3.106964111328125, -2.99908447265625, -2.891204833984375, -2.7833251953125, -2.675445556640625, -2.56756591796875, -2.459686279296875, -2.351806640625, -2.243927001953125, -2.13604736328125, -2.028167724609375, -1.9202880859375, -1.812408447265625, -1.70452880859375, -1.596649169921875, -1.48876953125, -1.380889892578125, -1.27301025390625, -1.165130615234375, -1.0572509765625, -0.949371337890625, -0.84149169921875, -0.733612060546875, -0.625732421875, -0.517852783203125, -0.40997314453125, -0.302093505859375, -0.1942138671875, -0.086334228515625, 0.02154541015625, 0.129425048828125, 0.2373046875, 0.345184326171875, 0.45306396484375, 0.560943603515625, 0.6688232421875, 0.776702880859375, 0.88458251953125, 0.992462158203125, 1.100341796875, 1.208221435546875, 1.31610107421875, 1.423980712890625, 1.5318603515625, 1.639739990234375, 1.74761962890625, 1.855499267578125, 1.96337890625, 2.071258544921875, 2.17913818359375, 2.287017822265625, 2.3948974609375, 2.502777099609375, 2.61065673828125, 2.718536376953125, 2.826416015625, 2.934295654296875, 3.04217529296875, 3.150054931640625, 3.2579345703125, 3.365814208984375, 3.47369384765625, 3.581573486328125, 3.689453125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 20.0, 27.0, 62.0, 105.0, 171.0, 293.0, 511.0, 856.0, 824.0, 513.0, 281.0, 163.0, 77.0, 71.0, 25.0, 24.0, 17.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.56292724609375, -8.3367919921875, -8.11065673828125, -7.884521484375, -7.65838623046875, -7.4322509765625, -7.20611572265625, -6.97998046875, -6.75384521484375, -6.5277099609375, -6.30157470703125, -6.075439453125, -5.84930419921875, -5.6231689453125, -5.39703369140625, -5.1708984375, -4.94476318359375, -4.7186279296875, -4.49249267578125, -4.266357421875, -4.04022216796875, -3.8140869140625, -3.58795166015625, -3.36181640625, -3.13568115234375, -2.9095458984375, -2.68341064453125, -2.457275390625, -2.23114013671875, -2.0050048828125, -1.77886962890625, -1.552734375, -1.32659912109375, -1.1004638671875, -0.87432861328125, -0.648193359375, -0.42205810546875, -0.1959228515625, 0.03021240234375, 0.25634765625, 0.48248291015625, 0.7086181640625, 0.93475341796875, 1.160888671875, 1.38702392578125, 1.6131591796875, 1.83929443359375, 2.0654296875, 2.29156494140625, 2.5177001953125, 2.74383544921875, 2.969970703125, 3.19610595703125, 3.4222412109375, 3.64837646484375, 3.87451171875, 4.10064697265625, 4.3267822265625, 4.55291748046875, 4.779052734375, 5.00518798828125, 5.2313232421875, 5.45745849609375, 5.68359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 19.0, 26.0, 54.0, 92.0, 232.0, 469.0, 1130.0, 4021.0, 263401.0, 3910513.0, 11003.0, 1959.0, 660.0, 330.0, 155.0, 86.0, 37.0, 40.0, 10.0, 6.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.8125, -26.029052734375, -25.24560546875, -24.462158203125, -23.6787109375, -22.895263671875, -22.11181640625, -21.328369140625, -20.544921875, -19.761474609375, -18.97802734375, -18.194580078125, -17.4111328125, -16.627685546875, -15.84423828125, -15.060791015625, -14.27734375, -13.493896484375, -12.71044921875, -11.927001953125, -11.1435546875, -10.360107421875, -9.57666015625, -8.793212890625, -8.009765625, -7.226318359375, -6.44287109375, -5.659423828125, -4.8759765625, -4.092529296875, -3.30908203125, -2.525634765625, -1.7421875, -0.958740234375, -0.17529296875, 0.608154296875, 1.3916015625, 2.175048828125, 2.95849609375, 3.741943359375, 4.525390625, 5.308837890625, 6.09228515625, 6.875732421875, 7.6591796875, 8.442626953125, 9.22607421875, 10.009521484375, 10.79296875, 11.576416015625, 12.35986328125, 13.143310546875, 13.9267578125, 14.710205078125, 15.49365234375, 16.277099609375, 17.060546875, 17.843994140625, 18.62744140625, 19.410888671875, 20.1943359375, 20.977783203125, 21.76123046875, 22.544677734375, 23.328125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 389.0, 615.0, 9.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-239.70358276367188, -235.50018310546875, -231.2967987060547, -227.09339904785156, -222.8900146484375, -218.68661499023438, -214.4832305908203, -210.2798309326172, -206.07644653320312, -201.873046875, -197.66966247558594, -193.4662628173828, -189.26287841796875, -185.05947875976562, -180.85609436035156, -176.65269470214844, -172.4492950439453, -168.2458953857422, -164.04251098632812, -159.839111328125, -155.63572692871094, -151.4323272705078, -147.22894287109375, -143.02554321289062, -138.8221435546875, -134.61874389648438, -130.4153594970703, -126.21196746826172, -122.00857543945312, -117.80517578125, -113.6017837524414, -109.39839172363281, -105.19499969482422, -100.99160766601562, -96.78821563720703, -92.58482360839844, -88.38142395019531, -84.17803955078125, -79.97463989257812, -75.77124786376953, -71.56785583496094, -67.36446380615234, -63.16107177734375, -58.95767593383789, -54.7542839050293, -50.5508918762207, -46.347496032714844, -42.14410400390625, -37.940711975097656, -33.73731994628906, -29.533926010131836, -25.33053207397461, -21.127140045166016, -16.923748016357422, -12.720354080200195, -8.516960144042969, -4.313568115234375, -0.11017513275146484, 4.093217849731445, 8.296610832214355, 12.500003814697266, 16.70339584350586, 20.906789779663086, 25.110183715820312, 29.313575744628906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 6.0, 4.0, 5.0, 15.0, 17.0, 21.0, 25.0, 15.0, 27.0, 37.0, 45.0, 28.0, 52.0, 43.0, 49.0, 41.0, 52.0, 51.0, 62.0, 49.0, 46.0, 48.0, 36.0, 46.0, 18.0, 28.0, 27.0, 30.0, 16.0, 14.0, 12.0, 7.0, 8.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.197795867919922, -20.582115173339844, -19.966432571411133, -19.350751876831055, -18.735069274902344, -18.119388580322266, -17.503707885742188, -16.888025283813477, -16.2723445892334, -15.656662940979004, -15.04098129272461, -14.425300598144531, -13.809618949890137, -13.193937301635742, -12.578255653381348, -11.962574005126953, -11.346892356872559, -10.731210708618164, -10.11552906036377, -9.499847412109375, -8.884166717529297, -8.268485069274902, -7.652803421020508, -7.0371222496032715, -6.421440601348877, -5.805758953094482, -5.190077781677246, -4.574396133422852, -3.958714723587036, -3.3430333137512207, -2.727351665496826, -2.11167049407959, -1.4959888458251953, -0.8803073763847351, -0.2646259069442749, 0.3510556221008301, 0.9667370319366455, 1.582418441772461, 2.1981000900268555, 2.813781261444092, 3.4294629096984863, 4.045144557952881, 4.660825729370117, 5.276507377624512, 5.892189025878906, 6.507870197296143, 7.123551845550537, 7.739233016967773, 8.354914665222168, 8.970596313476562, 9.586277961730957, 10.201959609985352, 10.81764030456543, 11.433321952819824, 12.049003601074219, 12.664684295654297, 13.280366897583008, 13.896048545837402, 14.511730194091797, 15.127410888671875, 15.74309253692627, 16.358774185180664, 16.974456787109375, 17.590137481689453, 18.20581817626953]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 18.0, 11.0, 21.0, 19.0, 25.0, 19.0, 20.0, 26.0, 22.0, 34.0, 35.0, 29.0, 43.0, 34.0, 54.0, 41.0, 48.0, 46.0, 39.0, 41.0, 38.0, 43.0, 31.0, 29.0, 30.0, 23.0, 24.0, 16.0, 30.0, 18.0, 18.0, 9.0, 5.0, 7.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.9550628662109375, -0.919891357421875, -0.8847198486328125, -0.84954833984375, -0.8143768310546875, -0.779205322265625, -0.7440338134765625, -0.7088623046875, -0.6736907958984375, -0.638519287109375, -0.6033477783203125, -0.56817626953125, -0.5330047607421875, -0.497833251953125, -0.4626617431640625, -0.427490234375, -0.3923187255859375, -0.357147216796875, -0.3219757080078125, -0.28680419921875, -0.2516326904296875, -0.216461181640625, -0.1812896728515625, -0.1461181640625, -0.1109466552734375, -0.075775146484375, -0.0406036376953125, -0.00543212890625, 0.0297393798828125, 0.064910888671875, 0.1000823974609375, 0.13525390625, 0.1704254150390625, 0.205596923828125, 0.2407684326171875, 0.27593994140625, 0.3111114501953125, 0.346282958984375, 0.3814544677734375, 0.4166259765625, 0.4517974853515625, 0.486968994140625, 0.5221405029296875, 0.55731201171875, 0.5924835205078125, 0.627655029296875, 0.6628265380859375, 0.697998046875, 0.7331695556640625, 0.768341064453125, 0.8035125732421875, 0.83868408203125, 0.8738555908203125, 0.909027099609375, 0.9441986083984375, 0.9793701171875, 1.0145416259765625, 1.049713134765625, 1.0848846435546875, 1.12005615234375, 1.1552276611328125, 1.190399169921875, 1.2255706787109375, 1.2607421875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 5.0, 4.0, 11.0, 25.0, 23.0, 32.0, 66.0, 73.0, 119.0, 187.0, 279.0, 361.0, 549.0, 815.0, 1171.0, 1817.0, 2620.0, 3770.0, 5787.0, 8687.0, 13711.0, 21180.0, 34597.0, 55046.0, 89843.0, 151260.0, 224994.0, 166624.0, 99576.0, 60592.0, 37402.0, 23540.0, 15026.0, 9661.0, 6371.0, 4206.0, 2705.0, 1905.0, 1306.0, 876.0, 557.0, 402.0, 268.0, 153.0, 121.0, 84.0, 41.0, 41.0, 22.0, 15.0, 15.0, 6.0, 2.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11016845703125, -0.1064462661743164, -0.10272407531738281, -0.09900188446044922, -0.09527969360351562, -0.09155750274658203, -0.08783531188964844, -0.08411312103271484, -0.08039093017578125, -0.07666873931884766, -0.07294654846191406, -0.06922435760498047, -0.06550216674804688, -0.06177997589111328, -0.05805778503417969, -0.054335594177246094, -0.0506134033203125, -0.046891212463378906, -0.04316902160644531, -0.03944683074951172, -0.035724639892578125, -0.03200244903564453, -0.028280258178710938, -0.024558067321777344, -0.02083587646484375, -0.017113685607910156, -0.013391494750976562, -0.009669303894042969, -0.005947113037109375, -0.0022249221801757812, 0.0014972686767578125, 0.005219459533691406, 0.008941650390625, 0.012663841247558594, 0.016386032104492188, 0.02010822296142578, 0.023830413818359375, 0.02755260467529297, 0.03127479553222656, 0.034996986389160156, 0.03871917724609375, 0.042441368103027344, 0.04616355895996094, 0.04988574981689453, 0.053607940673828125, 0.05733013153076172, 0.06105232238769531, 0.0647745132446289, 0.0684967041015625, 0.0722188949584961, 0.07594108581542969, 0.07966327667236328, 0.08338546752929688, 0.08710765838623047, 0.09082984924316406, 0.09455204010009766, 0.09827423095703125, 0.10199642181396484, 0.10571861267089844, 0.10944080352783203, 0.11316299438476562, 0.11688518524169922, 0.12060737609863281, 0.1243295669555664, 0.1280517578125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 10.0, 8.0, 13.0, 18.0, 15.0, 10.0, 25.0, 20.0, 29.0, 24.0, 20.0, 38.0, 43.0, 34.0, 40.0, 42.0, 52.0, 1060.0, 53.0, 37.0, 44.0, 32.0, 41.0, 39.0, 35.0, 33.0, 29.0, 28.0, 31.0, 22.0, 12.0, 18.0, 12.0, 13.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6590194702148438, -0.6359100341796875, -0.6128005981445312, -0.589691162109375, -0.5665817260742188, -0.5434722900390625, -0.5203628540039062, -0.49725341796875, -0.47414398193359375, -0.4510345458984375, -0.42792510986328125, -0.404815673828125, -0.38170623779296875, -0.3585968017578125, -0.33548736572265625, -0.3123779296875, -0.28926849365234375, -0.2661590576171875, -0.24304962158203125, -0.219940185546875, -0.19683074951171875, -0.1737213134765625, -0.15061187744140625, -0.12750244140625, -0.10439300537109375, -0.0812835693359375, -0.05817413330078125, -0.035064697265625, -0.01195526123046875, 0.0111541748046875, 0.03426361083984375, 0.057373046875, 0.08048248291015625, 0.1035919189453125, 0.12670135498046875, 0.149810791015625, 0.17292022705078125, 0.1960296630859375, 0.21913909912109375, 0.24224853515625, 0.26535797119140625, 0.2884674072265625, 0.31157684326171875, 0.334686279296875, 0.35779571533203125, 0.3809051513671875, 0.40401458740234375, 0.4271240234375, 0.45023345947265625, 0.4733428955078125, 0.49645233154296875, 0.519561767578125, 0.5426712036132812, 0.5657806396484375, 0.5888900756835938, 0.61199951171875, 0.6351089477539062, 0.6582183837890625, 0.6813278198242188, 0.704437255859375, 0.7275466918945312, 0.7506561279296875, 0.7737655639648438, 0.796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 17.0, 12.0, 22.0, 36.0, 45.0, 73.0, 115.0, 163.0, 255.0, 349.0, 528.0, 807.0, 1231.0, 1787.0, 2796.0, 4221.0, 6372.0, 10405.0, 16721.0, 27761.0, 46524.0, 80060.0, 140423.0, 1261154.0, 205011.0, 117839.0, 67991.0, 40187.0, 23975.0, 14617.0, 9283.0, 5714.0, 3692.0, 2301.0, 1507.0, 1019.0, 671.0, 433.0, 314.0, 205.0, 129.0, 104.0, 58.0, 53.0, 38.0, 32.0, 17.0, 16.0, 8.0, 5.0, 8.0, 6.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.10205078125, -0.098846435546875, -0.09564208984375, -0.092437744140625, -0.0892333984375, -0.086029052734375, -0.08282470703125, -0.079620361328125, -0.076416015625, -0.073211669921875, -0.07000732421875, -0.066802978515625, -0.0635986328125, -0.060394287109375, -0.05718994140625, -0.053985595703125, -0.05078125, -0.047576904296875, -0.04437255859375, -0.041168212890625, -0.0379638671875, -0.034759521484375, -0.03155517578125, -0.028350830078125, -0.025146484375, -0.021942138671875, -0.01873779296875, -0.015533447265625, -0.0123291015625, -0.009124755859375, -0.00592041015625, -0.002716064453125, 0.00048828125, 0.003692626953125, 0.00689697265625, 0.010101318359375, 0.0133056640625, 0.016510009765625, 0.01971435546875, 0.022918701171875, 0.026123046875, 0.029327392578125, 0.03253173828125, 0.035736083984375, 0.0389404296875, 0.042144775390625, 0.04534912109375, 0.048553466796875, 0.0517578125, 0.054962158203125, 0.05816650390625, 0.061370849609375, 0.0645751953125, 0.067779541015625, 0.07098388671875, 0.074188232421875, 0.077392578125, 0.080596923828125, 0.08380126953125, 0.087005615234375, 0.0902099609375, 0.093414306640625, 0.09661865234375, 0.099822998046875, 0.10302734375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 6.0, 2.0, 7.0, 10.0, 18.0, 16.0, 19.0, 12.0, 25.0, 34.0, 37.0, 35.0, 60.0, 68.0, 62.0, 66.0, 77.0, 57.0, 54.0, 51.0, 53.0, 38.0, 21.0, 20.0, 24.0, 14.0, 15.0, 17.0, 18.0, 9.0, 11.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005459785461425781, -0.0005276501178741455, -0.0005093216896057129, -0.0004909932613372803, -0.00047266483306884766, -0.00045433640480041504, -0.0004360079765319824, -0.0004176795482635498, -0.0003993511199951172, -0.00038102269172668457, -0.00036269426345825195, -0.00034436583518981934, -0.0003260374069213867, -0.0003077089786529541, -0.0002893805503845215, -0.00027105212211608887, -0.00025272369384765625, -0.00023439526557922363, -0.00021606683731079102, -0.0001977384090423584, -0.00017940998077392578, -0.00016108155250549316, -0.00014275312423706055, -0.00012442469596862793, -0.00010609626770019531, -8.77678394317627e-05, -6.943941116333008e-05, -5.111098289489746e-05, -3.2782554626464844e-05, -1.4454126358032227e-05, 3.874301910400391e-06, 2.2202730178833008e-05, 4.0531158447265625e-05, 5.885958671569824e-05, 7.718801498413086e-05, 9.551644325256348e-05, 0.0001138448715209961, 0.0001321732997894287, 0.00015050172805786133, 0.00016883015632629395, 0.00018715858459472656, 0.00020548701286315918, 0.0002238154411315918, 0.00024214386940002441, 0.00026047229766845703, 0.00027880072593688965, 0.00029712915420532227, 0.0003154575824737549, 0.0003337860107421875, 0.0003521144390106201, 0.00037044286727905273, 0.00038877129554748535, 0.00040709972381591797, 0.0004254281520843506, 0.0004437565803527832, 0.0004620850086212158, 0.00048041343688964844, 0.0004987418651580811, 0.0005170702934265137, 0.0005353987216949463, 0.0005537271499633789, 0.0005720555782318115, 0.0005903840065002441, 0.0006087124347686768, 0.0006270408630371094]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 15.0, 11.0, 15.0, 20.0, 26.0, 23.0, 36.0, 40.0, 63.0, 96.0, 82.0, 123.0, 162.0, 262.0, 389.0, 724.0, 155899.0, 888204.0, 841.0, 387.0, 310.0, 190.0, 133.0, 112.0, 75.0, 65.0, 64.0, 47.0, 33.0, 20.0, 11.0, 11.0, 10.0, 8.0, 6.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.012969970703125, -0.012589335441589355, -0.012208700180053711, -0.011828064918518066, -0.011447429656982422, -0.011066794395446777, -0.010686159133911133, -0.010305523872375488, -0.009924888610839844, -0.0095442533493042, -0.009163618087768555, -0.00878298282623291, -0.008402347564697266, -0.008021712303161621, -0.0076410770416259766, -0.007260441780090332, -0.0068798065185546875, -0.006499171257019043, -0.0061185359954833984, -0.005737900733947754, -0.005357265472412109, -0.004976630210876465, -0.00459599494934082, -0.004215359687805176, -0.0038347244262695312, -0.0034540891647338867, -0.003073453903198242, -0.0026928186416625977, -0.002312183380126953, -0.0019315481185913086, -0.001550912857055664, -0.0011702775955200195, -0.000789642333984375, -0.00040900707244873047, -2.8371810913085938e-05, 0.0003522634506225586, 0.0007328987121582031, 0.0011135339736938477, 0.0014941692352294922, 0.0018748044967651367, 0.0022554397583007812, 0.0026360750198364258, 0.0030167102813720703, 0.003397345542907715, 0.0037779808044433594, 0.004158616065979004, 0.0045392513275146484, 0.004919886589050293, 0.0053005218505859375, 0.005681157112121582, 0.0060617923736572266, 0.006442427635192871, 0.006823062896728516, 0.00720369815826416, 0.007584333419799805, 0.00796496868133545, 0.008345603942871094, 0.008726239204406738, 0.009106874465942383, 0.009487509727478027, 0.009868144989013672, 0.010248780250549316, 0.010629415512084961, 0.011010050773620605, 0.01139068603515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 24.0, 906.0, 85.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010611843317747116, -0.0009833176154643297, -0.0009054508409462869, -0.000827584124635905, -0.0007497173501178622, -0.0006718506338074803, -0.0005939839174970984, -0.0005161171429790556, -0.00043825042666867375, -0.0003603836812544614, -0.00028251693584024906, -0.00020465021952986717, -0.00012678347411565483, -4.891672870144248e-05, 2.894998760893941e-05, 0.00010681676212698221, 0.0001846834784373641, 0.00026255022385157645, 0.0003404169692657888, 0.0004182836855761707, 0.0004961504600942135, 0.0005740171764045954, 0.0006518838927149773, 0.0007297506672330201, 0.000807617383543402, 0.0008854840998537838, 0.0009633508743718266, 0.0010412175906822085, 0.0011190843069925904, 0.0011969511397182941, 0.001274817856028676, 0.001352684572339058, 0.0014305512886494398, 0.0015084180049598217, 0.0015862847212702036, 0.0016641514375805855, 0.0017420182703062892, 0.001819884986616671, 0.001897751702927053, 0.0019756185356527567, 0.0020534852519631386, 0.0021313519682735205, 0.0022092186845839024, 0.0022870854008942842, 0.002364952117204666, 0.0024428190663456917, 0.00252068554982543, 0.0025985524989664555, 0.0026764189824461937, 0.0027542856987565756, 0.0028321524150669575, 0.0029100191313773394, 0.0029878858476877213, 0.003065752796828747, 0.003143619280308485, 0.0032214862294495106, 0.0032993529457598925, 0.0033772196620702744, 0.0034550863783806562, 0.003532953094691038, 0.00361081981100142, 0.003688686527311802, 0.0037665534764528275, 0.0038444201927632093, 0.003922286909073591]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 3.0, 7.0, 9.0, 14.0, 15.0, 16.0, 18.0, 22.0, 24.0, 20.0, 24.0, 32.0, 29.0, 36.0, 30.0, 31.0, 44.0, 46.0, 46.0, 44.0, 36.0, 38.0, 50.0, 42.0, 42.0, 36.0, 28.0, 32.0, 32.0, 25.0, 12.0, 21.0, 16.0, 12.0, 16.0, 5.0, 9.0, 14.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0003165006637573242, -0.0003069555386900902, -0.00029741041362285614, -0.0002878652885556221, -0.00027832016348838806, -0.000268775038421154, -0.00025922991335392, -0.00024968478828668594, -0.0002401396632194519, -0.00023059453815221786, -0.00022104941308498383, -0.00021150428801774979, -0.00020195916295051575, -0.0001924140378832817, -0.00018286891281604767, -0.00017332378774881363, -0.0001637786626815796, -0.00015423353761434555, -0.0001446884125471115, -0.00013514328747987747, -0.00012559816241264343, -0.0001160530373454094, -0.00010650791227817535, -9.696278721094131e-05, -8.741766214370728e-05, -7.787253707647324e-05, -6.83274120092392e-05, -5.878228694200516e-05, -4.923716187477112e-05, -3.969203680753708e-05, -3.014691174030304e-05, -2.0601786673069e-05, -1.1056661605834961e-05, -1.5115365386009216e-06, 8.033588528633118e-06, 1.7578713595867157e-05, 2.7123838663101196e-05, 3.6668963730335236e-05, 4.6214088797569275e-05, 5.5759213864803314e-05, 6.530433893203735e-05, 7.484946399927139e-05, 8.439458906650543e-05, 9.393971413373947e-05, 0.00010348483920097351, 0.00011302996426820755, 0.0001225750893354416, 0.00013212021440267563, 0.00014166533946990967, 0.0001512104645371437, 0.00016075558960437775, 0.00017030071467161179, 0.00017984583973884583, 0.00018939096480607986, 0.0001989360898733139, 0.00020848121494054794, 0.00021802634000778198, 0.00022757146507501602, 0.00023711659014225006, 0.0002466617152094841, 0.00025620684027671814, 0.0002657519653439522, 0.0002752970904111862, 0.00028484221547842026, 0.0002943873405456543]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 18.0, 11.0, 21.0, 19.0, 25.0, 19.0, 20.0, 26.0, 22.0, 34.0, 35.0, 29.0, 43.0, 34.0, 54.0, 41.0, 48.0, 46.0, 39.0, 41.0, 38.0, 42.0, 32.0, 29.0, 30.0, 23.0, 24.0, 16.0, 30.0, 18.0, 18.0, 9.0, 5.0, 7.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.9550628662109375, -0.919891357421875, -0.8847198486328125, -0.84954833984375, -0.8143768310546875, -0.779205322265625, -0.7440338134765625, -0.7088623046875, -0.6736907958984375, -0.638519287109375, -0.6033477783203125, -0.56817626953125, -0.5330047607421875, -0.497833251953125, -0.4626617431640625, -0.427490234375, -0.3923187255859375, -0.357147216796875, -0.3219757080078125, -0.28680419921875, -0.2516326904296875, -0.216461181640625, -0.1812896728515625, -0.1461181640625, -0.1109466552734375, -0.075775146484375, -0.0406036376953125, -0.00543212890625, 0.0297393798828125, 0.064910888671875, 0.1000823974609375, 0.13525390625, 0.1704254150390625, 0.205596923828125, 0.2407684326171875, 0.27593994140625, 0.3111114501953125, 0.346282958984375, 0.3814544677734375, 0.4166259765625, 0.4517974853515625, 0.486968994140625, 0.5221405029296875, 0.55731201171875, 0.5924835205078125, 0.627655029296875, 0.6628265380859375, 0.697998046875, 0.7331695556640625, 0.768341064453125, 0.8035125732421875, 0.83868408203125, 0.8738555908203125, 0.909027099609375, 0.9441986083984375, 0.9793701171875, 1.0145416259765625, 1.049713134765625, 1.0848846435546875, 1.12005615234375, 1.1552276611328125, 1.190399169921875, 1.2255706787109375, 1.2607421875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 10.0, 19.0, 14.0, 31.0, 51.0, 70.0, 83.0, 116.0, 180.0, 277.0, 426.0, 566.0, 881.0, 1334.0, 2011.0, 3078.0, 4811.0, 8300.0, 16312.0, 41142.0, 161867.0, 479381.0, 228686.0, 54414.0, 19284.0, 9637.0, 5511.0, 3408.0, 2148.0, 1486.0, 938.0, 643.0, 432.0, 286.0, 211.0, 169.0, 91.0, 78.0, 37.0, 39.0, 23.0, 15.0, 14.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.259765625, -3.153289794921875, -3.04681396484375, -2.940338134765625, -2.8338623046875, -2.727386474609375, -2.62091064453125, -2.514434814453125, -2.407958984375, -2.301483154296875, -2.19500732421875, -2.088531494140625, -1.9820556640625, -1.875579833984375, -1.76910400390625, -1.662628173828125, -1.55615234375, -1.449676513671875, -1.34320068359375, -1.236724853515625, -1.1302490234375, -1.023773193359375, -0.91729736328125, -0.810821533203125, -0.704345703125, -0.597869873046875, -0.49139404296875, -0.384918212890625, -0.2784423828125, -0.171966552734375, -0.06549072265625, 0.040985107421875, 0.1474609375, 0.253936767578125, 0.36041259765625, 0.466888427734375, 0.5733642578125, 0.679840087890625, 0.78631591796875, 0.892791748046875, 0.999267578125, 1.105743408203125, 1.21221923828125, 1.318695068359375, 1.4251708984375, 1.531646728515625, 1.63812255859375, 1.744598388671875, 1.85107421875, 1.957550048828125, 2.06402587890625, 2.170501708984375, 2.2769775390625, 2.383453369140625, 2.48992919921875, 2.596405029296875, 2.702880859375, 2.809356689453125, 2.91583251953125, 3.022308349609375, 3.1287841796875, 3.235260009765625, 3.34173583984375, 3.448211669921875, 3.5546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 5.0, 3.0, 1.0, 5.0, 6.0, 7.0, 11.0, 9.0, 15.0, 12.0, 20.0, 21.0, 28.0, 19.0, 26.0, 34.0, 52.0, 49.0, 41.0, 71.0, 132.0, 253.0, 1348.0, 266.0, 128.0, 71.0, 61.0, 47.0, 49.0, 37.0, 36.0, 38.0, 32.0, 14.0, 20.0, 13.0, 20.0, 9.0, 12.0, 8.0, 7.0, 5.0, 2.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.765625, -3.655975341796875, -3.54632568359375, -3.436676025390625, -3.3270263671875, -3.217376708984375, -3.10772705078125, -2.998077392578125, -2.888427734375, -2.778778076171875, -2.66912841796875, -2.559478759765625, -2.4498291015625, -2.340179443359375, -2.23052978515625, -2.120880126953125, -2.01123046875, -1.901580810546875, -1.79193115234375, -1.682281494140625, -1.5726318359375, -1.462982177734375, -1.35333251953125, -1.243682861328125, -1.134033203125, -1.024383544921875, -0.91473388671875, -0.805084228515625, -0.6954345703125, -0.585784912109375, -0.47613525390625, -0.366485595703125, -0.2568359375, -0.147186279296875, -0.03753662109375, 0.072113037109375, 0.1817626953125, 0.291412353515625, 0.40106201171875, 0.510711669921875, 0.620361328125, 0.730010986328125, 0.83966064453125, 0.949310302734375, 1.0589599609375, 1.168609619140625, 1.27825927734375, 1.387908935546875, 1.49755859375, 1.607208251953125, 1.71685791015625, 1.826507568359375, 1.9361572265625, 2.045806884765625, 2.15545654296875, 2.265106201171875, 2.374755859375, 2.484405517578125, 2.59405517578125, 2.703704833984375, 2.8133544921875, 2.923004150390625, 3.03265380859375, 3.142303466796875, 3.251953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 7.0, 5.0, 7.0, 14.0, 10.0, 11.0, 13.0, 22.0, 24.0, 29.0, 31.0, 54.0, 57.0, 91.0, 155.0, 297.0, 903.0, 8688.0, 3022259.0, 110387.0, 1630.0, 424.0, 207.0, 110.0, 62.0, 41.0, 31.0, 26.0, 22.0, 17.0, 13.0, 15.0, 8.0, 10.0, 3.0, 3.0, 6.0, 7.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.68310546875, -12.2255859375, -11.76806640625, -11.310546875, -10.85302734375, -10.3955078125, -9.93798828125, -9.48046875, -9.02294921875, -8.5654296875, -8.10791015625, -7.650390625, -7.19287109375, -6.7353515625, -6.27783203125, -5.8203125, -5.36279296875, -4.9052734375, -4.44775390625, -3.990234375, -3.53271484375, -3.0751953125, -2.61767578125, -2.16015625, -1.70263671875, -1.2451171875, -0.78759765625, -0.330078125, 0.12744140625, 0.5849609375, 1.04248046875, 1.5, 1.95751953125, 2.4150390625, 2.87255859375, 3.330078125, 3.78759765625, 4.2451171875, 4.70263671875, 5.16015625, 5.61767578125, 6.0751953125, 6.53271484375, 6.990234375, 7.44775390625, 7.9052734375, 8.36279296875, 8.8203125, 9.27783203125, 9.7353515625, 10.19287109375, 10.650390625, 11.10791015625, 11.5654296875, 12.02294921875, 12.48046875, 12.93798828125, 13.3955078125, 13.85302734375, 14.310546875, 14.76806640625, 15.2255859375, 15.68310546875, 16.140625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1005.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.59013366699219, -43.11700439453125, -38.64387512207031, -34.17074203491211, -29.697612762451172, -25.224483489990234, -20.751352310180664, -16.278221130371094, -11.805091857910156, -7.331961631774902, -2.8588314056396484, 1.6142988204956055, 6.087429046630859, 10.560558319091797, 15.033689498901367, 19.506820678710938, 23.979949951171875, 28.453079223632812, 32.92620849609375, 37.39934158325195, 41.87247085571289, 46.34560012817383, 50.81873321533203, 55.29186248779297, 59.764991760253906, 64.23812103271484, 68.71125030517578, 73.18437957763672, 77.65751647949219, 82.13064575195312, 86.60377502441406, 91.076904296875, 95.550048828125, 100.02317810058594, 104.49630737304688, 108.96943664550781, 113.44256591796875, 117.91569519042969, 122.38883209228516, 126.8619613647461, 131.3350830078125, 135.80821228027344, 140.28134155273438, 144.7544708251953, 149.22760009765625, 153.7007293701172, 158.17385864257812, 162.64700317382812, 167.12013244628906, 171.59326171875, 176.06639099121094, 180.53952026367188, 185.0126495361328, 189.48577880859375, 193.9589080810547, 198.43203735351562, 202.90518188476562, 207.37831115722656, 211.8514404296875, 216.32456970214844, 220.79769897460938, 225.2708282470703, 229.74395751953125, 234.21710205078125, 238.69021606445312]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 7.0, 8.0, 13.0, 8.0, 21.0, 7.0, 13.0, 10.0, 12.0, 20.0, 34.0, 26.0, 35.0, 38.0, 41.0, 37.0, 44.0, 41.0, 44.0, 38.0, 41.0, 34.0, 52.0, 29.0, 30.0, 43.0, 37.0, 23.0, 31.0, 19.0, 19.0, 18.0, 22.0, 13.0, 12.0, 17.0, 7.0, 9.0, 6.0, 7.0, 7.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.096226692199707, -9.73198127746582, -9.367735862731934, -9.003490447998047, -8.63924503326416, -8.274999618530273, -7.910754203796387, -7.5465087890625, -7.182263374328613, -6.818017959594727, -6.45377254486084, -6.089527130126953, -5.725281715393066, -5.36103630065918, -4.996790885925293, -4.632545471191406, -4.2683000564575195, -3.904054641723633, -3.539809226989746, -3.1755638122558594, -2.8113183975219727, -2.447072982788086, -2.082827568054199, -1.7185821533203125, -1.3543367385864258, -0.9900913238525391, -0.6258459091186523, -0.2616004943847656, 0.1026449203491211, 0.4668903350830078, 0.8311357498168945, 1.1953811645507812, 1.5596275329589844, 1.923872947692871, 2.288118362426758, 2.6523637771606445, 3.0166091918945312, 3.380854606628418, 3.7451000213623047, 4.109345436096191, 4.473590850830078, 4.837836265563965, 5.202081680297852, 5.566327095031738, 5.930572509765625, 6.294817924499512, 6.659063339233398, 7.023308753967285, 7.387554168701172, 7.751799583435059, 8.116044998168945, 8.480290412902832, 8.844535827636719, 9.208781242370605, 9.573026657104492, 9.937272071838379, 10.301517486572266, 10.665762901306152, 11.030008316040039, 11.394253730773926, 11.758499145507812, 12.1227445602417, 12.486989974975586, 12.851235389709473, 13.21548080444336]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 2.0, 17.0, 13.0, 8.0, 11.0, 24.0, 17.0, 25.0, 15.0, 16.0, 34.0, 26.0, 30.0, 42.0, 36.0, 34.0, 38.0, 49.0, 57.0, 41.0, 44.0, 40.0, 46.0, 23.0, 42.0, 36.0, 45.0, 28.0, 19.0, 24.0, 20.0, 21.0, 19.0, 11.0, 8.0, 16.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1640625, -1.1253204345703125, -1.086578369140625, -1.0478363037109375, -1.00909423828125, -0.9703521728515625, -0.931610107421875, -0.8928680419921875, -0.8541259765625, -0.8153839111328125, -0.776641845703125, -0.7378997802734375, -0.69915771484375, -0.6604156494140625, -0.621673583984375, -0.5829315185546875, -0.544189453125, -0.5054473876953125, -0.466705322265625, -0.4279632568359375, -0.38922119140625, -0.3504791259765625, -0.311737060546875, -0.2729949951171875, -0.2342529296875, -0.1955108642578125, -0.156768798828125, -0.1180267333984375, -0.07928466796875, -0.0405426025390625, -0.001800537109375, 0.0369415283203125, 0.07568359375, 0.1144256591796875, 0.153167724609375, 0.1919097900390625, 0.23065185546875, 0.2693939208984375, 0.308135986328125, 0.3468780517578125, 0.3856201171875, 0.4243621826171875, 0.463104248046875, 0.5018463134765625, 0.54058837890625, 0.5793304443359375, 0.618072509765625, 0.6568145751953125, 0.695556640625, 0.7342987060546875, 0.773040771484375, 0.8117828369140625, 0.85052490234375, 0.8892669677734375, 0.928009033203125, 0.9667510986328125, 1.0054931640625, 1.0442352294921875, 1.082977294921875, 1.1217193603515625, 1.16046142578125, 1.1992034912109375, 1.237945556640625, 1.2766876220703125, 1.3154296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 22.0, 22.0, 19.0, 35.0, 56.0, 82.0, 117.0, 138.0, 212.0, 324.0, 521.0, 1008.0, 2043.0, 5840.0, 23026.0, 139137.0, 1701901.0, 2105413.0, 175187.0, 27508.0, 6718.0, 2284.0, 1018.0, 529.0, 338.0, 204.0, 154.0, 104.0, 98.0, 51.0, 37.0, 39.0, 19.0, 14.0, 8.0, 6.0, 5.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71484375, -4.5677490234375, -4.420654296875, -4.2735595703125, -4.12646484375, -3.9793701171875, -3.832275390625, -3.6851806640625, -3.5380859375, -3.3909912109375, -3.243896484375, -3.0968017578125, -2.94970703125, -2.8026123046875, -2.655517578125, -2.5084228515625, -2.361328125, -2.2142333984375, -2.067138671875, -1.9200439453125, -1.77294921875, -1.6258544921875, -1.478759765625, -1.3316650390625, -1.1845703125, -1.0374755859375, -0.890380859375, -0.7432861328125, -0.59619140625, -0.4490966796875, -0.302001953125, -0.1549072265625, -0.0078125, 0.1392822265625, 0.286376953125, 0.4334716796875, 0.58056640625, 0.7276611328125, 0.874755859375, 1.0218505859375, 1.1689453125, 1.3160400390625, 1.463134765625, 1.6102294921875, 1.75732421875, 1.9044189453125, 2.051513671875, 2.1986083984375, 2.345703125, 2.4927978515625, 2.639892578125, 2.7869873046875, 2.93408203125, 3.0811767578125, 3.228271484375, 3.3753662109375, 3.5224609375, 3.6695556640625, 3.816650390625, 3.9637451171875, 4.11083984375, 4.2579345703125, 4.405029296875, 4.5521240234375, 4.69921875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 9.0, 15.0, 19.0, 41.0, 63.0, 98.0, 130.0, 231.0, 321.0, 479.0, 573.0, 606.0, 473.0, 313.0, 236.0, 159.0, 124.0, 60.0, 38.0, 34.0, 19.0, 10.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.26763916015625, -6.0977783203125, -5.92791748046875, -5.758056640625, -5.58819580078125, -5.4183349609375, -5.24847412109375, -5.07861328125, -4.90875244140625, -4.7388916015625, -4.56903076171875, -4.399169921875, -4.22930908203125, -4.0594482421875, -3.88958740234375, -3.7197265625, -3.54986572265625, -3.3800048828125, -3.21014404296875, -3.040283203125, -2.87042236328125, -2.7005615234375, -2.53070068359375, -2.36083984375, -2.19097900390625, -2.0211181640625, -1.85125732421875, -1.681396484375, -1.51153564453125, -1.3416748046875, -1.17181396484375, -1.001953125, -0.83209228515625, -0.6622314453125, -0.49237060546875, -0.322509765625, -0.15264892578125, 0.0172119140625, 0.18707275390625, 0.35693359375, 0.52679443359375, 0.6966552734375, 0.86651611328125, 1.036376953125, 1.20623779296875, 1.3760986328125, 1.54595947265625, 1.7158203125, 1.88568115234375, 2.0555419921875, 2.22540283203125, 2.395263671875, 2.56512451171875, 2.7349853515625, 2.90484619140625, 3.07470703125, 3.24456787109375, 3.4144287109375, 3.58428955078125, 3.754150390625, 3.92401123046875, 4.0938720703125, 4.26373291015625, 4.43359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 15.0, 18.0, 31.0, 67.0, 136.0, 301.0, 946.0, 5874.0, 1240925.0, 2935294.0, 9157.0, 1042.0, 279.0, 114.0, 46.0, 19.0, 11.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.88916015625, -12.2470703125, -11.60498046875, -10.962890625, -10.32080078125, -9.6787109375, -9.03662109375, -8.39453125, -7.75244140625, -7.1103515625, -6.46826171875, -5.826171875, -5.18408203125, -4.5419921875, -3.89990234375, -3.2578125, -2.61572265625, -1.9736328125, -1.33154296875, -0.689453125, -0.04736328125, 0.5947265625, 1.23681640625, 1.87890625, 2.52099609375, 3.1630859375, 3.80517578125, 4.447265625, 5.08935546875, 5.7314453125, 6.37353515625, 7.015625, 7.65771484375, 8.2998046875, 8.94189453125, 9.583984375, 10.22607421875, 10.8681640625, 11.51025390625, 12.15234375, 12.79443359375, 13.4365234375, 14.07861328125, 14.720703125, 15.36279296875, 16.0048828125, 16.64697265625, 17.2890625, 17.93115234375, 18.5732421875, 19.21533203125, 19.857421875, 20.49951171875, 21.1416015625, 21.78369140625, 22.42578125, 23.06787109375, 23.7099609375, 24.35205078125, 24.994140625, 25.63623046875, 26.2783203125, 26.92041015625, 27.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 180.0, 771.0, 63.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.1727180480957, -56.4937744140625, -52.81482696533203, -49.13588333129883, -45.456939697265625, -41.777992248535156, -38.09904861450195, -34.42010498046875, -30.741159439086914, -27.062213897705078, -23.383270263671875, -19.70432472229004, -16.025379180908203, -12.346435546875, -8.667490005493164, -4.988546371459961, -1.309600830078125, 2.3693439960479736, 6.048288822174072, 9.72723388671875, 13.40617847442627, 17.08512306213379, 20.764068603515625, 24.443012237548828, 28.121957778930664, 31.8009033203125, 35.4798469543457, 39.158790588378906, 42.837738037109375, 46.51668167114258, 50.19562530517578, 53.87457275390625, 57.55352020263672, 61.23246383666992, 64.91140747070312, 68.5903549194336, 72.26930236816406, 75.9482421875, 79.62718963623047, 83.30613708496094, 86.98507690429688, 90.66402435302734, 94.34296417236328, 98.02191162109375, 101.70085906982422, 105.37979888916016, 109.05874633789062, 112.73768615722656, 116.41664123535156, 120.09558868408203, 123.77452850341797, 127.45347595214844, 131.13241577148438, 134.81137084960938, 138.4903106689453, 142.16925048828125, 145.8481903076172, 149.52713012695312, 153.20608520507812, 156.88502502441406, 160.56396484375, 164.242919921875, 167.92185974121094, 171.60079956054688, 175.27975463867188]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 15.0, 9.0, 17.0, 22.0, 21.0, 16.0, 27.0, 25.0, 22.0, 38.0, 23.0, 29.0, 44.0, 47.0, 33.0, 34.0, 41.0, 51.0, 54.0, 53.0, 42.0, 35.0, 36.0, 34.0, 29.0, 20.0, 33.0, 23.0, 20.0, 15.0, 20.0, 11.0, 13.0, 7.0, 8.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.660313606262207, -15.168632507324219, -14.67695140838623, -14.185270309448242, -13.69359016418457, -13.201908111572266, -12.710227966308594, -12.218546867370605, -11.726865768432617, -11.235184669494629, -10.74350357055664, -10.251822471618652, -9.760141372680664, -9.268461227416992, -8.776780128479004, -8.285099029541016, -7.793417930603027, -7.301736831665039, -6.810055732727051, -6.318375110626221, -5.826694011688232, -5.335012912750244, -4.843332290649414, -4.351651191711426, -3.8599700927734375, -3.368288993835449, -2.87660813331604, -2.384927272796631, -1.8932461738586426, -1.4015650749206543, -0.9098842144012451, -0.41820335388183594, 0.07347679138183594, 0.5651577711105347, 1.0568387508392334, 1.5485197305679321, 2.040200710296631, 2.531881809234619, 3.0235626697540283, 3.5152435302734375, 4.006924629211426, 4.498605728149414, 4.990286827087402, 5.481967449188232, 5.973648548126221, 6.465329647064209, 6.957010269165039, 7.448691368103027, 7.940372467041016, 8.432053565979004, 8.923734664916992, 9.41541576385498, 9.907096862792969, 10.39877700805664, 10.890458106994629, 11.382139205932617, 11.873820304870605, 12.365501403808594, 12.857182502746582, 13.34886360168457, 13.840543746948242, 14.332225799560547, 14.823905944824219, 15.315587043762207, 15.807268142700195]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 12.0, 21.0, 32.0, 24.0, 27.0, 30.0, 30.0, 40.0, 46.0, 49.0, 51.0, 45.0, 42.0, 45.0, 39.0, 53.0, 45.0, 41.0, 36.0, 30.0, 37.0, 26.0, 36.0, 25.0, 21.0, 15.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374420166015625, -1.194610595703125, -1.1517791748046875, -1.10894775390625, -1.0661163330078125, -1.023284912109375, -0.9804534912109375, -0.9376220703125, -0.8947906494140625, -0.851959228515625, -0.8091278076171875, -0.76629638671875, -0.7234649658203125, -0.680633544921875, -0.6378021240234375, -0.594970703125, -0.5521392822265625, -0.509307861328125, -0.4664764404296875, -0.42364501953125, -0.3808135986328125, -0.337982177734375, -0.2951507568359375, -0.2523193359375, -0.2094879150390625, -0.166656494140625, -0.1238250732421875, -0.08099365234375, -0.0381622314453125, 0.004669189453125, 0.0475006103515625, 0.09033203125, 0.1331634521484375, 0.175994873046875, 0.2188262939453125, 0.26165771484375, 0.3044891357421875, 0.347320556640625, 0.3901519775390625, 0.4329833984375, 0.4758148193359375, 0.518646240234375, 0.5614776611328125, 0.60430908203125, 0.6471405029296875, 0.689971923828125, 0.7328033447265625, 0.775634765625, 0.8184661865234375, 0.861297607421875, 0.9041290283203125, 0.94696044921875, 0.9897918701171875, 1.032623291015625, 1.0754547119140625, 1.1182861328125, 1.1611175537109375, 1.203948974609375, 1.2467803955078125, 1.28961181640625, 1.3324432373046875, 1.375274658203125, 1.4181060791015625, 1.4609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 18.0, 28.0, 34.0, 62.0, 89.0, 140.0, 238.0, 313.0, 527.0, 838.0, 1315.0, 2079.0, 3288.0, 5386.0, 8524.0, 14280.0, 24163.0, 40672.0, 71941.0, 128851.0, 228163.0, 222296.0, 125603.0, 70078.0, 39775.0, 23256.0, 13817.0, 8576.0, 5358.0, 3241.0, 2067.0, 1247.0, 807.0, 531.0, 297.0, 228.0, 134.0, 87.0, 54.0, 50.0, 28.0, 18.0, 13.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.169921875, -0.16492080688476562, -0.15991973876953125, -0.15491867065429688, -0.1499176025390625, -0.14491653442382812, -0.13991546630859375, -0.13491439819335938, -0.129913330078125, -0.12491226196289062, -0.11991119384765625, -0.11491012573242188, -0.1099090576171875, -0.10490798950195312, -0.09990692138671875, -0.09490585327148438, -0.08990478515625, -0.08490371704101562, -0.07990264892578125, -0.07490158081054688, -0.0699005126953125, -0.06489944458007812, -0.05989837646484375, -0.054897308349609375, -0.049896240234375, -0.044895172119140625, -0.03989410400390625, -0.034893035888671875, -0.0298919677734375, -0.024890899658203125, -0.01988983154296875, -0.014888763427734375, -0.0098876953125, -0.004886627197265625, 0.00011444091796875, 0.005115509033203125, 0.0101165771484375, 0.015117645263671875, 0.02011871337890625, 0.025119781494140625, 0.030120849609375, 0.035121917724609375, 0.04012298583984375, 0.045124053955078125, 0.0501251220703125, 0.055126190185546875, 0.06012725830078125, 0.06512832641601562, 0.07012939453125, 0.07513046264648438, 0.08013153076171875, 0.08513259887695312, 0.0901336669921875, 0.09513473510742188, 0.10013580322265625, 0.10513687133789062, 0.110137939453125, 0.11513900756835938, 0.12014007568359375, 0.12514114379882812, 0.1301422119140625, 0.13514328002929688, 0.14014434814453125, 0.14514541625976562, 0.150146484375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 10.0, 5.0, 4.0, 14.0, 7.0, 13.0, 12.0, 15.0, 14.0, 19.0, 20.0, 20.0, 23.0, 33.0, 27.0, 31.0, 29.0, 36.0, 34.0, 31.0, 37.0, 36.0, 1059.0, 33.0, 31.0, 41.0, 41.0, 49.0, 33.0, 39.0, 37.0, 24.0, 19.0, 17.0, 23.0, 13.0, 16.0, 12.0, 12.0, 6.0, 6.0, 11.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0], "bins": [-0.72412109375, -0.702301025390625, -0.68048095703125, -0.658660888671875, -0.6368408203125, -0.615020751953125, -0.59320068359375, -0.571380615234375, -0.549560546875, -0.527740478515625, -0.50592041015625, -0.484100341796875, -0.4622802734375, -0.440460205078125, -0.41864013671875, -0.396820068359375, -0.375, -0.353179931640625, -0.33135986328125, -0.309539794921875, -0.2877197265625, -0.265899658203125, -0.24407958984375, -0.222259521484375, -0.200439453125, -0.178619384765625, -0.15679931640625, -0.134979248046875, -0.1131591796875, -0.091339111328125, -0.06951904296875, -0.047698974609375, -0.02587890625, -0.004058837890625, 0.01776123046875, 0.039581298828125, 0.0614013671875, 0.083221435546875, 0.10504150390625, 0.126861572265625, 0.148681640625, 0.170501708984375, 0.19232177734375, 0.214141845703125, 0.2359619140625, 0.257781982421875, 0.27960205078125, 0.301422119140625, 0.3232421875, 0.345062255859375, 0.36688232421875, 0.388702392578125, 0.4105224609375, 0.432342529296875, 0.45416259765625, 0.475982666015625, 0.497802734375, 0.519622802734375, 0.54144287109375, 0.563262939453125, 0.5850830078125, 0.606903076171875, 0.62872314453125, 0.650543212890625, 0.67236328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 10.0, 29.0, 33.0, 52.0, 67.0, 92.0, 144.0, 206.0, 269.0, 399.0, 568.0, 754.0, 1131.0, 1726.0, 2407.0, 3613.0, 5323.0, 8177.0, 12404.0, 19155.0, 30545.0, 48243.0, 79312.0, 133233.0, 1246298.0, 195477.0, 116978.0, 70407.0, 42587.0, 26645.0, 17198.0, 10899.0, 7248.0, 4936.0, 3352.0, 2243.0, 1508.0, 1030.0, 737.0, 490.0, 380.0, 256.0, 155.0, 122.0, 93.0, 62.0, 43.0, 27.0, 19.0, 16.0, 11.0, 8.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09942626953125, -0.0962057113647461, -0.09298515319824219, -0.08976459503173828, -0.08654403686523438, -0.08332347869873047, -0.08010292053222656, -0.07688236236572266, -0.07366180419921875, -0.07044124603271484, -0.06722068786621094, -0.06400012969970703, -0.060779571533203125, -0.05755901336669922, -0.05433845520019531, -0.051117897033691406, -0.0478973388671875, -0.044676780700683594, -0.04145622253417969, -0.03823566436767578, -0.035015106201171875, -0.03179454803466797, -0.028573989868164062, -0.025353431701660156, -0.02213287353515625, -0.018912315368652344, -0.015691757202148438, -0.012471199035644531, -0.009250640869140625, -0.006030082702636719, -0.0028095245361328125, 0.00041103363037109375, 0.003631591796875, 0.006852149963378906, 0.010072708129882812, 0.013293266296386719, 0.016513824462890625, 0.01973438262939453, 0.022954940795898438, 0.026175498962402344, 0.02939605712890625, 0.032616615295410156, 0.03583717346191406, 0.03905773162841797, 0.042278289794921875, 0.04549884796142578, 0.04871940612792969, 0.051939964294433594, 0.0551605224609375, 0.058381080627441406, 0.06160163879394531, 0.06482219696044922, 0.06804275512695312, 0.07126331329345703, 0.07448387145996094, 0.07770442962646484, 0.08092498779296875, 0.08414554595947266, 0.08736610412597656, 0.09058666229248047, 0.09380722045898438, 0.09702777862548828, 0.10024833679199219, 0.1034688949584961, 0.106689453125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 4.0, 6.0, 7.0, 9.0, 6.0, 13.0, 8.0, 5.0, 19.0, 21.0, 27.0, 40.0, 46.0, 48.0, 55.0, 57.0, 79.0, 77.0, 55.0, 63.0, 60.0, 57.0, 33.0, 35.0, 21.0, 34.0, 26.0, 19.0, 12.0, 10.0, 6.0, 15.0, 5.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0004394054412841797, -0.00042537227272987366, -0.0004113391041755676, -0.0003973059356212616, -0.00038327276706695557, -0.00036923959851264954, -0.0003552064299583435, -0.0003411732614040375, -0.00032714009284973145, -0.0003131069242954254, -0.0002990737557411194, -0.00028504058718681335, -0.0002710074186325073, -0.0002569742500782013, -0.00024294108152389526, -0.00022890791296958923, -0.0002148747444152832, -0.00020084157586097717, -0.00018680840730667114, -0.0001727752387523651, -0.00015874207019805908, -0.00014470890164375305, -0.00013067573308944702, -0.00011664256453514099, -0.00010260939598083496, -8.857622742652893e-05, -7.45430588722229e-05, -6.050989031791687e-05, -4.647672176361084e-05, -3.244355320930481e-05, -1.841038465499878e-05, -4.377216100692749e-06, 9.655952453613281e-06, 2.368912100791931e-05, 3.772228956222534e-05, 5.175545811653137e-05, 6.57886266708374e-05, 7.982179522514343e-05, 9.385496377944946e-05, 0.00010788813233375549, 0.00012192130088806152, 0.00013595446944236755, 0.00014998763799667358, 0.00016402080655097961, 0.00017805397510528564, 0.00019208714365959167, 0.0002061203122138977, 0.00022015348076820374, 0.00023418664932250977, 0.0002482198178768158, 0.0002622529864311218, 0.00027628615498542786, 0.0002903193235397339, 0.0003043524920940399, 0.00031838566064834595, 0.000332418829202652, 0.000346451997756958, 0.00036048516631126404, 0.00037451833486557007, 0.0003885515034198761, 0.00040258467197418213, 0.00041661784052848816, 0.0004306510090827942, 0.0004446841776371002, 0.00045871734619140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 2.0, 10.0, 6.0, 12.0, 16.0, 18.0, 16.0, 17.0, 32.0, 27.0, 57.0, 58.0, 56.0, 87.0, 152.0, 230.0, 328.0, 652.0, 2894.0, 1023302.0, 18590.0, 799.0, 369.0, 206.0, 136.0, 118.0, 87.0, 63.0, 34.0, 33.0, 23.0, 22.0, 16.0, 16.0, 12.0, 12.0, 11.0, 12.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0113372802734375, -0.011010169982910156, -0.010683059692382812, -0.010355949401855469, -0.010028839111328125, -0.009701728820800781, -0.009374618530273438, -0.009047508239746094, -0.00872039794921875, -0.008393287658691406, -0.008066177368164062, -0.007739067077636719, -0.007411956787109375, -0.007084846496582031, -0.0067577362060546875, -0.006430625915527344, -0.006103515625, -0.005776405334472656, -0.0054492950439453125, -0.005122184753417969, -0.004795074462890625, -0.004467964172363281, -0.0041408538818359375, -0.0038137435913085938, -0.00348663330078125, -0.0031595230102539062, -0.0028324127197265625, -0.0025053024291992188, -0.002178192138671875, -0.0018510818481445312, -0.0015239715576171875, -0.0011968612670898438, -0.0008697509765625, -0.0005426406860351562, -0.0002155303955078125, 0.00011157989501953125, 0.000438690185546875, 0.0007658004760742188, 0.0010929107666015625, 0.0014200210571289062, 0.00174713134765625, 0.0020742416381835938, 0.0024013519287109375, 0.0027284622192382812, 0.003055572509765625, 0.0033826828002929688, 0.0037097930908203125, 0.004036903381347656, 0.004364013671875, 0.004691123962402344, 0.0050182342529296875, 0.005345344543457031, 0.005672454833984375, 0.005999565124511719, 0.0063266754150390625, 0.006653785705566406, 0.00698089599609375, 0.007308006286621094, 0.0076351165771484375, 0.007962226867675781, 0.008289337158203125, 0.008616447448730469, 0.008943557739257812, 0.009270668029785156, 0.0095977783203125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 218.0, 790.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006028346251696348, -0.005922951735556126, -0.00581755768507719, -0.005712163168936968, -0.005606768652796745, -0.005501374136656523, -0.0053959800861775875, -0.005290585570037365, -0.005185191053897142, -0.00507979653775692, -0.004974402487277985, -0.004869007971137762, -0.0047636134549975395, -0.004658218938857317, -0.004552824888378382, -0.004447430372238159, -0.004342035856097937, -0.004236641339957714, -0.004131247289478779, -0.004025852773338556, -0.003920458257198334, -0.003815063973888755, -0.0037096694577485323, -0.0036042751744389534, -0.0034988808911293745, -0.0033934866078197956, -0.003288092091679573, -0.003182697808369994, -0.0030773032922297716, -0.0029719090089201927, -0.00286651449277997, -0.0027611202094703913, -0.002655725460499525, -0.002550331177189946, -0.0024449366610497236, -0.0023395423777401447, -0.002234147861599922, -0.0021287535782903433, -0.0020233590621501207, -0.0019179647788405418, -0.001812570495530963, -0.0017071760958060622, -0.0016017816960811615, -0.0014963872963562608, -0.00139099289663136, -0.0012855986133217812, -0.0011802040971815586, -0.0010748098138719797, -0.0009694152977317572, -0.0008640208980068564, -0.0007586264982819557, -0.000653232098557055, -0.0005478376988321543, -0.00044244335731491446, -0.00033704895759001374, -0.00023165455786511302, -0.0001262601581402123, -2.086576569126919e-05, 8.452862675767392e-05, 0.0001899230119306594, 0.00029531741165556014, 0.0004007117822766304, 0.0005061061820015311, 0.0006115005817264318, 0.0007168949814513326]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 7.0, 8.0, 10.0, 12.0, 17.0, 17.0, 21.0, 16.0, 28.0, 21.0, 20.0, 35.0, 33.0, 34.0, 34.0, 38.0, 45.0, 34.0, 39.0, 39.0, 43.0, 33.0, 30.0, 38.0, 33.0, 42.0, 32.0, 29.0, 30.0, 27.0, 24.0, 16.0, 18.0, 13.0, 11.0, 13.0, 11.0, 8.0, 10.0, 7.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 5.0], "bins": [-0.00024271011352539062, -0.0002358676865696907, -0.00022902525961399078, -0.00022218283265829086, -0.00021534040570259094, -0.00020849797874689102, -0.0002016555517911911, -0.00019481312483549118, -0.00018797069787979126, -0.00018112827092409134, -0.00017428584396839142, -0.0001674434170126915, -0.00016060099005699158, -0.00015375856310129166, -0.00014691613614559174, -0.00014007370918989182, -0.0001332312822341919, -0.00012638885527849197, -0.00011954642832279205, -0.00011270400136709213, -0.00010586157441139221, -9.901914745569229e-05, -9.217672049999237e-05, -8.533429354429245e-05, -7.849186658859253e-05, -7.164943963289261e-05, -6.480701267719269e-05, -5.796458572149277e-05, -5.112215876579285e-05, -4.4279731810092926e-05, -3.7437304854393005e-05, -3.0594877898693085e-05, -2.3752450942993164e-05, -1.6910023987293243e-05, -1.0067597031593323e-05, -3.225170075893402e-06, 3.6172568798065186e-06, 1.045968383550644e-05, 1.730211079120636e-05, 2.414453774690628e-05, 3.09869647026062e-05, 3.782939165830612e-05, 4.467181861400604e-05, 5.151424556970596e-05, 5.8356672525405884e-05, 6.51990994811058e-05, 7.204152643680573e-05, 7.888395339250565e-05, 8.572638034820557e-05, 9.256880730390549e-05, 9.941123425960541e-05, 0.00010625366121530533, 0.00011309608817100525, 0.00011993851512670517, 0.0001267809420824051, 0.000133623369038105, 0.00014046579599380493, 0.00014730822294950485, 0.00015415064990520477, 0.0001609930768609047, 0.00016783550381660461, 0.00017467793077230453, 0.00018152035772800446, 0.00018836278468370438, 0.0001952052116394043]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 7.0, 17.0, 15.0, 12.0, 21.0, 32.0, 24.0, 27.0, 30.0, 30.0, 40.0, 46.0, 49.0, 51.0, 45.0, 42.0, 45.0, 39.0, 53.0, 45.0, 41.0, 36.0, 30.0, 37.0, 26.0, 36.0, 25.0, 21.0, 15.0, 10.0, 9.0, 9.0, 8.0, 6.0, 4.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2374420166015625, -1.194610595703125, -1.1517791748046875, -1.10894775390625, -1.0661163330078125, -1.023284912109375, -0.9804534912109375, -0.9376220703125, -0.8947906494140625, -0.851959228515625, -0.8091278076171875, -0.76629638671875, -0.7234649658203125, -0.680633544921875, -0.6378021240234375, -0.594970703125, -0.5521392822265625, -0.509307861328125, -0.4664764404296875, -0.42364501953125, -0.3808135986328125, -0.337982177734375, -0.2951507568359375, -0.2523193359375, -0.2094879150390625, -0.166656494140625, -0.1238250732421875, -0.08099365234375, -0.0381622314453125, 0.004669189453125, 0.0475006103515625, 0.09033203125, 0.1331634521484375, 0.175994873046875, 0.2188262939453125, 0.26165771484375, 0.3044891357421875, 0.347320556640625, 0.3901519775390625, 0.4329833984375, 0.4758148193359375, 0.518646240234375, 0.5614776611328125, 0.60430908203125, 0.6471405029296875, 0.689971923828125, 0.7328033447265625, 0.775634765625, 0.8184661865234375, 0.861297607421875, 0.9041290283203125, 0.94696044921875, 0.9897918701171875, 1.032623291015625, 1.0754547119140625, 1.1182861328125, 1.1611175537109375, 1.203948974609375, 1.2467803955078125, 1.28961181640625, 1.3324432373046875, 1.375274658203125, 1.4181060791015625, 1.4609375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 10.0, 12.0, 16.0, 21.0, 46.0, 42.0, 77.0, 100.0, 153.0, 300.0, 443.0, 751.0, 1418.0, 3032.0, 7683.0, 22073.0, 66514.0, 193782.0, 362484.0, 248662.0, 92745.0, 30138.0, 10160.0, 3894.0, 1759.0, 898.0, 499.0, 316.0, 183.0, 101.0, 80.0, 58.0, 36.0, 24.0, 17.0, 15.0, 6.0, 7.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.5004119873046875, -1.446136474609375, -1.3918609619140625, -1.33758544921875, -1.2833099365234375, -1.229034423828125, -1.1747589111328125, -1.1204833984375, -1.0662078857421875, -1.011932373046875, -0.9576568603515625, -0.90338134765625, -0.8491058349609375, -0.794830322265625, -0.7405548095703125, -0.686279296875, -0.6320037841796875, -0.577728271484375, -0.5234527587890625, -0.46917724609375, -0.4149017333984375, -0.360626220703125, -0.3063507080078125, -0.2520751953125, -0.1977996826171875, -0.143524169921875, -0.0892486572265625, -0.03497314453125, 0.0193023681640625, 0.073577880859375, 0.1278533935546875, 0.18212890625, 0.2364044189453125, 0.290679931640625, 0.3449554443359375, 0.39923095703125, 0.4535064697265625, 0.507781982421875, 0.5620574951171875, 0.6163330078125, 0.6706085205078125, 0.724884033203125, 0.7791595458984375, 0.83343505859375, 0.8877105712890625, 0.941986083984375, 0.9962615966796875, 1.050537109375, 1.1048126220703125, 1.159088134765625, 1.2133636474609375, 1.26763916015625, 1.3219146728515625, 1.376190185546875, 1.4304656982421875, 1.4847412109375, 1.5390167236328125, 1.593292236328125, 1.6475677490234375, 1.70184326171875, 1.7561187744140625, 1.810394287109375, 1.8646697998046875, 1.9189453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 7.0, 5.0, 5.0, 5.0, 6.0, 19.0, 7.0, 16.0, 20.0, 31.0, 32.0, 30.0, 35.0, 46.0, 43.0, 54.0, 64.0, 104.0, 179.0, 1342.0, 310.0, 175.0, 103.0, 65.0, 40.0, 41.0, 39.0, 42.0, 26.0, 29.0, 23.0, 17.0, 18.0, 12.0, 8.0, 12.0, 7.0, 7.0, 6.0, 10.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.30999755859375, -4.1707763671875, -4.03155517578125, -3.892333984375, -3.75311279296875, -3.6138916015625, -3.47467041015625, -3.33544921875, -3.19622802734375, -3.0570068359375, -2.91778564453125, -2.778564453125, -2.63934326171875, -2.5001220703125, -2.36090087890625, -2.2216796875, -2.08245849609375, -1.9432373046875, -1.80401611328125, -1.664794921875, -1.52557373046875, -1.3863525390625, -1.24713134765625, -1.10791015625, -0.96868896484375, -0.8294677734375, -0.69024658203125, -0.551025390625, -0.41180419921875, -0.2725830078125, -0.13336181640625, 0.005859375, 0.14508056640625, 0.2843017578125, 0.42352294921875, 0.562744140625, 0.70196533203125, 0.8411865234375, 0.98040771484375, 1.11962890625, 1.25885009765625, 1.3980712890625, 1.53729248046875, 1.676513671875, 1.81573486328125, 1.9549560546875, 2.09417724609375, 2.2333984375, 2.37261962890625, 2.5118408203125, 2.65106201171875, 2.790283203125, 2.92950439453125, 3.0687255859375, 3.20794677734375, 3.34716796875, 3.48638916015625, 3.6256103515625, 3.76483154296875, 3.904052734375, 4.04327392578125, 4.1824951171875, 4.32171630859375, 4.4609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 9.0, 12.0, 4.0, 8.0, 10.0, 13.0, 15.0, 22.0, 29.0, 36.0, 38.0, 71.0, 90.0, 137.0, 247.0, 480.0, 1223.0, 8411.0, 1323228.0, 1798725.0, 10412.0, 1294.0, 442.0, 215.0, 141.0, 101.0, 71.0, 40.0, 47.0, 31.0, 25.0, 16.0, 16.0, 10.0, 3.0, 7.0, 3.0, 12.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0501708984375, -8.748779296875, -8.4473876953125, -8.14599609375, -7.8446044921875, -7.543212890625, -7.2418212890625, -6.9404296875, -6.6390380859375, -6.337646484375, -6.0362548828125, -5.73486328125, -5.4334716796875, -5.132080078125, -4.8306884765625, -4.529296875, -4.2279052734375, -3.926513671875, -3.6251220703125, -3.32373046875, -3.0223388671875, -2.720947265625, -2.4195556640625, -2.1181640625, -1.8167724609375, -1.515380859375, -1.2139892578125, -0.91259765625, -0.6112060546875, -0.309814453125, -0.0084228515625, 0.29296875, 0.5943603515625, 0.895751953125, 1.1971435546875, 1.49853515625, 1.7999267578125, 2.101318359375, 2.4027099609375, 2.7041015625, 3.0054931640625, 3.306884765625, 3.6082763671875, 3.90966796875, 4.2110595703125, 4.512451171875, 4.8138427734375, 5.115234375, 5.4166259765625, 5.718017578125, 6.0194091796875, 6.32080078125, 6.6221923828125, 6.923583984375, 7.2249755859375, 7.5263671875, 7.8277587890625, 8.129150390625, 8.4305419921875, 8.73193359375, 9.0333251953125, 9.334716796875, 9.6361083984375, 9.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 47.0, 280.0, 493.0, 166.0, 19.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.51102066040039, -24.72133445739746, -23.93164825439453, -23.141963958740234, -22.352277755737305, -21.562591552734375, -20.772905349731445, -19.983219146728516, -19.19353485107422, -18.40384864807129, -17.61416244506836, -16.824478149414062, -16.034791946411133, -15.245105743408203, -14.455419540405273, -13.66573429107666, -12.87604808807373, -12.0863618850708, -11.296676635742188, -10.506990432739258, -9.717305183410645, -8.927618980407715, -8.137933731079102, -7.348247528076172, -6.5585618019104, -5.768876075744629, -4.979190349578857, -4.189504623413086, -3.3998186588287354, -2.610132932662964, -1.8204469680786133, -1.0307612419128418, -0.2410755157470703, 0.548610270023346, 1.3382960557937622, 2.1279819011688232, 2.9176676273345947, 3.707353353500366, 4.497039318084717, 5.286725044250488, 6.07641077041626, 6.866096496582031, 7.655782222747803, 8.445467948913574, 9.235154151916504, 10.024839401245117, 10.814525604248047, 11.604211807250977, 12.39389705657959, 13.18358325958252, 13.973268508911133, 14.762954711914062, 15.552639961242676, 16.34232521057129, 17.13201141357422, 17.92169761657715, 18.711383819580078, 19.501070022583008, 20.290756225585938, 21.080440521240234, 21.870126724243164, 22.659812927246094, 23.449499130249023, 24.239185333251953, 25.02886962890625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 6.0, 10.0, 12.0, 9.0, 12.0, 20.0, 10.0, 27.0, 32.0, 17.0, 16.0, 35.0, 28.0, 24.0, 24.0, 43.0, 33.0, 40.0, 51.0, 49.0, 29.0, 20.0, 31.0, 46.0, 29.0, 26.0, 40.0, 34.0, 23.0, 22.0, 31.0, 17.0, 20.0, 10.0, 18.0, 18.0, 10.0, 14.0, 10.0, 6.0, 11.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-12.911194801330566, -12.52262020111084, -12.134044647216797, -11.74547004699707, -11.356895446777344, -10.9683198928833, -10.579745292663574, -10.191169738769531, -9.802595138549805, -9.414020538330078, -9.025444984436035, -8.636870384216309, -8.248294830322266, -7.859720230102539, -7.4711456298828125, -7.082570552825928, -6.693995475769043, -6.305420398712158, -5.916845321655273, -5.528270721435547, -5.139695644378662, -4.751120567321777, -4.362545967102051, -3.973970890045166, -3.5853958129882812, -3.1968207359313965, -2.808245897293091, -2.419671058654785, -2.0310959815979004, -1.6425210237503052, -1.25394606590271, -0.8653712272644043, -0.4767951965332031, -0.08822023868560791, 0.3003547191619873, 0.6889296770095825, 1.0775046348571777, 1.466079592704773, 1.8546545505523682, 2.243229389190674, 2.6318044662475586, 3.0203795433044434, 3.408954381942749, 3.7975292205810547, 4.1861042976379395, 4.574679374694824, 4.963253974914551, 5.3518290519714355, 5.74040412902832, 6.128979206085205, 6.51755428314209, 6.906128883361816, 7.294703960418701, 7.683279037475586, 8.071853637695312, 8.460428237915039, 8.849003791809082, 9.237578392028809, 9.626153945922852, 10.014728546142578, 10.403303146362305, 10.791878700256348, 11.180453300476074, 11.569028854370117, 11.957603454589844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 5.0, 12.0, 7.0, 17.0, 24.0, 14.0, 23.0, 30.0, 34.0, 29.0, 37.0, 31.0, 56.0, 48.0, 43.0, 45.0, 50.0, 42.0, 41.0, 55.0, 36.0, 42.0, 37.0, 42.0, 36.0, 21.0, 22.0, 22.0, 20.0, 19.0, 13.0, 12.0, 13.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3544921875, -1.3092193603515625, -1.263946533203125, -1.2186737060546875, -1.17340087890625, -1.1281280517578125, -1.082855224609375, -1.0375823974609375, -0.9923095703125, -0.9470367431640625, -0.901763916015625, -0.8564910888671875, -0.81121826171875, -0.7659454345703125, -0.720672607421875, -0.6753997802734375, -0.630126953125, -0.5848541259765625, -0.539581298828125, -0.4943084716796875, -0.44903564453125, -0.4037628173828125, -0.358489990234375, -0.3132171630859375, -0.2679443359375, -0.2226715087890625, -0.177398681640625, -0.1321258544921875, -0.08685302734375, -0.0415802001953125, 0.003692626953125, 0.0489654541015625, 0.09423828125, 0.1395111083984375, 0.184783935546875, 0.2300567626953125, 0.27532958984375, 0.3206024169921875, 0.365875244140625, 0.4111480712890625, 0.4564208984375, 0.5016937255859375, 0.546966552734375, 0.5922393798828125, 0.63751220703125, 0.6827850341796875, 0.728057861328125, 0.7733306884765625, 0.818603515625, 0.8638763427734375, 0.909149169921875, 0.9544219970703125, 0.99969482421875, 1.0449676513671875, 1.090240478515625, 1.1355133056640625, 1.1807861328125, 1.2260589599609375, 1.271331787109375, 1.3166046142578125, 1.36187744140625, 1.4071502685546875, 1.452423095703125, 1.4976959228515625, 1.54296875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 8.0, 14.0, 11.0, 21.0, 30.0, 38.0, 34.0, 55.0, 86.0, 122.0, 197.0, 449.0, 1221.0, 4672.0, 30195.0, 358525.0, 3049782.0, 690835.0, 48172.0, 6919.0, 1616.0, 489.0, 258.0, 150.0, 89.0, 67.0, 50.0, 40.0, 27.0, 20.0, 15.0, 17.0, 13.0, 6.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.32537841796875, -4.1741943359375, -4.02301025390625, -3.871826171875, -3.72064208984375, -3.5694580078125, -3.41827392578125, -3.26708984375, -3.11590576171875, -2.9647216796875, -2.81353759765625, -2.662353515625, -2.51116943359375, -2.3599853515625, -2.20880126953125, -2.0576171875, -1.90643310546875, -1.7552490234375, -1.60406494140625, -1.452880859375, -1.30169677734375, -1.1505126953125, -0.99932861328125, -0.84814453125, -0.69696044921875, -0.5457763671875, -0.39459228515625, -0.243408203125, -0.09222412109375, 0.0589599609375, 0.21014404296875, 0.361328125, 0.51251220703125, 0.6636962890625, 0.81488037109375, 0.966064453125, 1.11724853515625, 1.2684326171875, 1.41961669921875, 1.57080078125, 1.72198486328125, 1.8731689453125, 2.02435302734375, 2.175537109375, 2.32672119140625, 2.4779052734375, 2.62908935546875, 2.7802734375, 2.93145751953125, 3.0826416015625, 3.23382568359375, 3.385009765625, 3.53619384765625, 3.6873779296875, 3.83856201171875, 3.98974609375, 4.14093017578125, 4.2921142578125, 4.44329833984375, 4.594482421875, 4.74566650390625, 4.8968505859375, 5.04803466796875, 5.19921875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 13.0, 14.0, 19.0, 25.0, 34.0, 56.0, 76.0, 97.0, 155.0, 234.0, 327.0, 391.0, 432.0, 515.0, 419.0, 355.0, 243.0, 205.0, 132.0, 93.0, 63.0, 56.0, 41.0, 26.0, 9.0, 10.0, 10.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.222808837890625, -5.08624267578125, -4.949676513671875, -4.8131103515625, -4.676544189453125, -4.53997802734375, -4.403411865234375, -4.266845703125, -4.130279541015625, -3.99371337890625, -3.857147216796875, -3.7205810546875, -3.584014892578125, -3.44744873046875, -3.310882568359375, -3.17431640625, -3.037750244140625, -2.90118408203125, -2.764617919921875, -2.6280517578125, -2.491485595703125, -2.35491943359375, -2.218353271484375, -2.081787109375, -1.945220947265625, -1.80865478515625, -1.672088623046875, -1.5355224609375, -1.398956298828125, -1.26239013671875, -1.125823974609375, -0.9892578125, -0.852691650390625, -0.71612548828125, -0.579559326171875, -0.4429931640625, -0.306427001953125, -0.16986083984375, -0.033294677734375, 0.103271484375, 0.239837646484375, 0.37640380859375, 0.512969970703125, 0.6495361328125, 0.786102294921875, 0.92266845703125, 1.059234619140625, 1.19580078125, 1.332366943359375, 1.46893310546875, 1.605499267578125, 1.7420654296875, 1.878631591796875, 2.01519775390625, 2.151763916015625, 2.288330078125, 2.424896240234375, 2.56146240234375, 2.698028564453125, 2.8345947265625, 2.971160888671875, 3.10772705078125, 3.244293212890625, 3.380859375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 16.0, 29.0, 40.0, 79.0, 143.0, 278.0, 586.0, 1598.0, 8209.0, 123993.0, 2873267.0, 1137180.0, 42722.0, 4276.0, 1012.0, 401.0, 188.0, 97.0, 61.0, 32.0, 19.0, 15.0, 12.0, 11.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.828125, -8.5218505859375, -8.215576171875, -7.9093017578125, -7.60302734375, -7.2967529296875, -6.990478515625, -6.6842041015625, -6.3779296875, -6.0716552734375, -5.765380859375, -5.4591064453125, -5.15283203125, -4.8465576171875, -4.540283203125, -4.2340087890625, -3.927734375, -3.6214599609375, -3.315185546875, -3.0089111328125, -2.70263671875, -2.3963623046875, -2.090087890625, -1.7838134765625, -1.4775390625, -1.1712646484375, -0.864990234375, -0.5587158203125, -0.25244140625, 0.0538330078125, 0.360107421875, 0.6663818359375, 0.97265625, 1.2789306640625, 1.585205078125, 1.8914794921875, 2.19775390625, 2.5040283203125, 2.810302734375, 3.1165771484375, 3.4228515625, 3.7291259765625, 4.035400390625, 4.3416748046875, 4.64794921875, 4.9542236328125, 5.260498046875, 5.5667724609375, 5.873046875, 6.1793212890625, 6.485595703125, 6.7918701171875, 7.09814453125, 7.4044189453125, 7.710693359375, 8.0169677734375, 8.3232421875, 8.6295166015625, 8.935791015625, 9.2420654296875, 9.54833984375, 9.8546142578125, 10.160888671875, 10.4671630859375, 10.7734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 25.0, 62.0, 109.0, 213.0, 224.0, 189.0, 110.0, 57.0, 18.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.527366638183594, -36.52328872680664, -35.51920700073242, -34.51512908935547, -33.511051177978516, -32.5069694519043, -31.502891540527344, -30.498811721801758, -29.494731903076172, -28.490652084350586, -27.486574172973633, -26.482494354248047, -25.47841453552246, -24.474334716796875, -23.470256805419922, -22.466176986694336, -21.462099075317383, -20.458019256591797, -19.453941345214844, -18.449861526489258, -17.445781707763672, -16.44170379638672, -15.437623977661133, -14.433544158935547, -13.429465293884277, -12.425386428833008, -11.421306610107422, -10.417227745056152, -9.413148880004883, -8.409069061279297, -7.404990196228027, -6.4009108543396, -5.396829605102539, -4.392750263214111, -3.3886711597442627, -2.384592056274414, -1.3805127143859863, -0.3764333724975586, 0.6276454925537109, 1.6317248344421387, 2.6358041763305664, 3.639883518218994, 4.643962860107422, 5.648041725158691, 6.652121067047119, 7.656200408935547, 8.660279273986816, 9.664358139038086, 10.668437957763672, 11.672516822814941, 12.676596641540527, 13.680675506591797, 14.684755325317383, 15.688834190368652, 16.692913055419922, 17.696992874145508, 18.701072692871094, 19.70515251159668, 20.709230422973633, 21.71331024169922, 22.717390060424805, 23.72146987915039, 24.725547790527344, 25.72962760925293, 26.733705520629883]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 15.0, 12.0, 15.0, 12.0, 26.0, 20.0, 27.0, 29.0, 35.0, 37.0, 31.0, 31.0, 47.0, 35.0, 39.0, 46.0, 43.0, 38.0, 41.0, 46.0, 44.0, 42.0, 33.0, 24.0, 38.0, 35.0, 33.0, 14.0, 17.0, 12.0, 18.0, 7.0, 9.0, 7.0, 8.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.223062515258789, -11.807843208312988, -11.392623901367188, -10.97740364074707, -10.56218433380127, -10.146965026855469, -9.731745719909668, -9.316526412963867, -8.901307106018066, -8.486087799072266, -8.070868492126465, -7.655648708343506, -7.240429401397705, -6.825209617614746, -6.409990310668945, -5.9947710037231445, -5.5795512199401855, -5.164331912994385, -4.749112129211426, -4.333892822265625, -3.918673515319824, -3.5034539699554443, -3.0882344245910645, -2.6730151176452637, -2.257795572280884, -1.8425761461257935, -1.4273567199707031, -1.0121371746063232, -0.5969177484512329, -0.18169832229614258, 0.2335212230682373, 0.6487405300140381, 1.063960075378418, 1.4791795015335083, 1.8943989276885986, 2.3096184730529785, 2.7248377799987793, 3.140057325363159, 3.555276870727539, 3.97049617767334, 4.385715484619141, 4.800934791564941, 5.2161545753479, 5.631373882293701, 6.046593189239502, 6.461812973022461, 6.877032279968262, 7.2922515869140625, 7.7074713706970215, 8.12269115447998, 8.537910461425781, 8.953129768371582, 9.368349075317383, 9.783568382263184, 10.198787689208984, 10.614007949829102, 11.029227256774902, 11.444446563720703, 11.859665870666504, 12.274885177612305, 12.690105438232422, 13.105324745178223, 13.520544052124023, 13.935763359069824, 14.350982666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 5.0, 13.0, 18.0, 19.0, 17.0, 22.0, 18.0, 33.0, 30.0, 28.0, 39.0, 43.0, 35.0, 38.0, 37.0, 53.0, 51.0, 39.0, 56.0, 41.0, 37.0, 47.0, 36.0, 27.0, 25.0, 34.0, 20.0, 22.0, 20.0, 18.0, 8.0, 7.0, 12.0, 14.0, 8.0, 9.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2894134521484375, -1.245819091796875, -1.2022247314453125, -1.15863037109375, -1.1150360107421875, -1.071441650390625, -1.0278472900390625, -0.9842529296875, -0.9406585693359375, -0.897064208984375, -0.8534698486328125, -0.80987548828125, -0.7662811279296875, -0.722686767578125, -0.6790924072265625, -0.635498046875, -0.5919036865234375, -0.548309326171875, -0.5047149658203125, -0.46112060546875, -0.4175262451171875, -0.373931884765625, -0.3303375244140625, -0.2867431640625, -0.2431488037109375, -0.199554443359375, -0.1559600830078125, -0.11236572265625, -0.0687713623046875, -0.025177001953125, 0.0184173583984375, 0.06201171875, 0.1056060791015625, 0.149200439453125, 0.1927947998046875, 0.23638916015625, 0.2799835205078125, 0.323577880859375, 0.3671722412109375, 0.4107666015625, 0.4543609619140625, 0.497955322265625, 0.5415496826171875, 0.58514404296875, 0.6287384033203125, 0.672332763671875, 0.7159271240234375, 0.759521484375, 0.8031158447265625, 0.846710205078125, 0.8903045654296875, 0.93389892578125, 0.9774932861328125, 1.021087646484375, 1.0646820068359375, 1.1082763671875, 1.1518707275390625, 1.195465087890625, 1.2390594482421875, 1.28265380859375, 1.3262481689453125, 1.369842529296875, 1.4134368896484375, 1.45703125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 6.0, 14.0, 13.0, 23.0, 41.0, 56.0, 85.0, 141.0, 193.0, 366.0, 502.0, 950.0, 1415.0, 2287.0, 3907.0, 6326.0, 10934.0, 19152.0, 35089.0, 65272.0, 129089.0, 248485.0, 248533.0, 128879.0, 65203.0, 34969.0, 19155.0, 11118.0, 6515.0, 3814.0, 2215.0, 1393.0, 877.0, 514.0, 383.0, 221.0, 138.0, 99.0, 59.0, 36.0, 29.0, 24.0, 10.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.182373046875, -0.17667388916015625, -0.1709747314453125, -0.16527557373046875, -0.159576416015625, -0.15387725830078125, -0.1481781005859375, -0.14247894287109375, -0.13677978515625, -0.13108062744140625, -0.1253814697265625, -0.11968231201171875, -0.113983154296875, -0.10828399658203125, -0.1025848388671875, -0.09688568115234375, -0.0911865234375, -0.08548736572265625, -0.0797882080078125, -0.07408905029296875, -0.068389892578125, -0.06269073486328125, -0.0569915771484375, -0.05129241943359375, -0.04559326171875, -0.03989410400390625, -0.0341949462890625, -0.02849578857421875, -0.022796630859375, -0.01709747314453125, -0.0113983154296875, -0.00569915771484375, 0.0, 0.00569915771484375, 0.0113983154296875, 0.01709747314453125, 0.022796630859375, 0.02849578857421875, 0.0341949462890625, 0.03989410400390625, 0.04559326171875, 0.05129241943359375, 0.0569915771484375, 0.06269073486328125, 0.068389892578125, 0.07408905029296875, 0.0797882080078125, 0.08548736572265625, 0.0911865234375, 0.09688568115234375, 0.1025848388671875, 0.10828399658203125, 0.113983154296875, 0.11968231201171875, 0.1253814697265625, 0.13108062744140625, 0.13677978515625, 0.14247894287109375, 0.1481781005859375, 0.15387725830078125, 0.159576416015625, 0.16527557373046875, 0.1709747314453125, 0.17667388916015625, 0.182373046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 4.0, 7.0, 6.0, 9.0, 12.0, 11.0, 21.0, 15.0, 15.0, 20.0, 20.0, 24.0, 24.0, 33.0, 36.0, 20.0, 45.0, 25.0, 32.0, 34.0, 33.0, 38.0, 1067.0, 32.0, 33.0, 33.0, 37.0, 30.0, 26.0, 22.0, 29.0, 25.0, 22.0, 20.0, 20.0, 28.0, 16.0, 11.0, 15.0, 14.0, 8.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6699142456054688, -0.6469573974609375, -0.6240005493164062, -0.601043701171875, -0.5780868530273438, -0.5551300048828125, -0.5321731567382812, -0.50921630859375, -0.48625946044921875, -0.4633026123046875, -0.44034576416015625, -0.417388916015625, -0.39443206787109375, -0.3714752197265625, -0.34851837158203125, -0.3255615234375, -0.30260467529296875, -0.2796478271484375, -0.25669097900390625, -0.233734130859375, -0.21077728271484375, -0.1878204345703125, -0.16486358642578125, -0.14190673828125, -0.11894989013671875, -0.0959930419921875, -0.07303619384765625, -0.050079345703125, -0.02712249755859375, -0.0041656494140625, 0.01879119873046875, 0.041748046875, 0.06470489501953125, 0.0876617431640625, 0.11061859130859375, 0.133575439453125, 0.15653228759765625, 0.1794891357421875, 0.20244598388671875, 0.22540283203125, 0.24835968017578125, 0.2713165283203125, 0.29427337646484375, 0.317230224609375, 0.34018707275390625, 0.3631439208984375, 0.38610076904296875, 0.4090576171875, 0.43201446533203125, 0.4549713134765625, 0.47792816162109375, 0.500885009765625, 0.5238418579101562, 0.5467987060546875, 0.5697555541992188, 0.59271240234375, 0.6156692504882812, 0.6386260986328125, 0.6615829467773438, 0.684539794921875, 0.7074966430664062, 0.7304534912109375, 0.7534103393554688, 0.7763671875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 12.0, 5.0, 24.0, 23.0, 37.0, 70.0, 108.0, 171.0, 261.0, 423.0, 604.0, 1117.0, 1773.0, 2849.0, 4900.0, 8457.0, 15187.0, 27707.0, 50495.0, 93891.0, 179794.0, 1318894.0, 181355.0, 94524.0, 50428.0, 27588.0, 15127.0, 8732.0, 5096.0, 2927.0, 1770.0, 1045.0, 656.0, 429.0, 239.0, 137.0, 99.0, 60.0, 41.0, 26.0, 14.0, 10.0, 11.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13031578063964844, -0.12574386596679688, -0.12117195129394531, -0.11660003662109375, -0.11202812194824219, -0.10745620727539062, -0.10288429260253906, -0.0983123779296875, -0.09374046325683594, -0.08916854858398438, -0.08459663391113281, -0.08002471923828125, -0.07545280456542969, -0.07088088989257812, -0.06630897521972656, -0.061737060546875, -0.05716514587402344, -0.052593231201171875, -0.04802131652832031, -0.04344940185546875, -0.03887748718261719, -0.034305572509765625, -0.029733657836914062, -0.0251617431640625, -0.020589828491210938, -0.016017913818359375, -0.011445999145507812, -0.00687408447265625, -0.0023021697998046875, 0.002269744873046875, 0.0068416595458984375, 0.01141357421875, 0.015985488891601562, 0.020557403564453125, 0.025129318237304688, 0.02970123291015625, 0.03427314758300781, 0.038845062255859375, 0.04341697692871094, 0.0479888916015625, 0.05256080627441406, 0.057132720947265625, 0.06170463562011719, 0.06627655029296875, 0.07084846496582031, 0.07542037963867188, 0.07999229431152344, 0.084564208984375, 0.08913612365722656, 0.09370803833007812, 0.09827995300292969, 0.10285186767578125, 0.10742378234863281, 0.11199569702148438, 0.11656761169433594, 0.1211395263671875, 0.12571144104003906, 0.13028335571289062, 0.1348552703857422, 0.13942718505859375, 0.1439990997314453, 0.14857101440429688, 0.15314292907714844, 0.15771484375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 4.0, 5.0, 5.0, 5.0, 11.0, 19.0, 20.0, 23.0, 31.0, 45.0, 55.0, 62.0, 68.0, 78.0, 84.0, 75.0, 78.0, 56.0, 53.0, 50.0, 38.0, 41.0, 18.0, 15.0, 9.0, 10.0, 11.0, 3.0, 8.0, 5.0, 1.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005235671997070312, -0.0005041211843490601, -0.00048467516899108887, -0.0004652291536331177, -0.0004457831382751465, -0.0004263371229171753, -0.0004068911075592041, -0.0003874450922012329, -0.0003679990768432617, -0.00034855306148529053, -0.00032910704612731934, -0.00030966103076934814, -0.00029021501541137695, -0.00027076900005340576, -0.00025132298469543457, -0.00023187696933746338, -0.0002124309539794922, -0.000192984938621521, -0.0001735389232635498, -0.0001540929079055786, -0.00013464689254760742, -0.00011520087718963623, -9.575486183166504e-05, -7.630884647369385e-05, -5.6862831115722656e-05, -3.7416815757751465e-05, -1.7970800399780273e-05, 1.475214958190918e-06, 2.092123031616211e-05, 4.03672456741333e-05, 5.981326103210449e-05, 7.925927639007568e-05, 9.870529174804688e-05, 0.00011815130710601807, 0.00013759732246398926, 0.00015704333782196045, 0.00017648935317993164, 0.00019593536853790283, 0.00021538138389587402, 0.00023482739925384521, 0.0002542734146118164, 0.0002737194299697876, 0.0002931654453277588, 0.00031261146068573, 0.00033205747604370117, 0.00035150349140167236, 0.00037094950675964355, 0.00039039552211761475, 0.00040984153747558594, 0.00042928755283355713, 0.0004487335681915283, 0.0004681795835494995, 0.0004876255989074707, 0.0005070716142654419, 0.0005265176296234131, 0.0005459636449813843, 0.0005654096603393555, 0.0005848556756973267, 0.0006043016910552979, 0.000623747706413269, 0.0006431937217712402, 0.0006626397371292114, 0.0006820857524871826, 0.0007015317678451538, 0.000720977783203125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 8.0, 11.0, 8.0, 17.0, 20.0, 18.0, 44.0, 50.0, 79.0, 103.0, 161.0, 281.0, 591.0, 4343.0, 1039524.0, 2126.0, 429.0, 260.0, 152.0, 88.0, 63.0, 55.0, 38.0, 16.0, 16.0, 14.0, 6.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0174407958984375, -0.016986966133117676, -0.01653313636779785, -0.016079306602478027, -0.015625476837158203, -0.015171647071838379, -0.014717817306518555, -0.01426398754119873, -0.013810157775878906, -0.013356328010559082, -0.012902498245239258, -0.012448668479919434, -0.01199483871459961, -0.011541008949279785, -0.011087179183959961, -0.010633349418640137, -0.010179519653320312, -0.009725689888000488, -0.009271860122680664, -0.00881803035736084, -0.008364200592041016, -0.007910370826721191, -0.007456541061401367, -0.007002711296081543, -0.006548881530761719, -0.0060950517654418945, -0.00564122200012207, -0.005187392234802246, -0.004733562469482422, -0.004279732704162598, -0.0038259029388427734, -0.0033720731735229492, -0.002918243408203125, -0.0024644136428833008, -0.0020105838775634766, -0.0015567541122436523, -0.0011029243469238281, -0.0006490945816040039, -0.0001952648162841797, 0.00025856494903564453, 0.0007123947143554688, 0.001166224479675293, 0.0016200542449951172, 0.0020738840103149414, 0.0025277137756347656, 0.00298154354095459, 0.003435373306274414, 0.0038892030715942383, 0.0043430328369140625, 0.004796862602233887, 0.005250692367553711, 0.005704522132873535, 0.006158351898193359, 0.006612181663513184, 0.007066011428833008, 0.007519841194152832, 0.007973670959472656, 0.00842750072479248, 0.008881330490112305, 0.009335160255432129, 0.009788990020751953, 0.010242819786071777, 0.010696649551391602, 0.011150479316711426, 0.01160430908203125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 23.0, 938.0, 57.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005855758674442768, -0.005739997606724501, -0.005624236539006233, -0.0055084750056266785, -0.005392713937908411, -0.005276952870190144, -0.005161191802471876, -0.005045430269092321, -0.004929669201374054, -0.0048139081336557865, -0.004698147065937519, -0.004582385532557964, -0.004466624464839697, -0.0043508633971214294, -0.004235102329403162, -0.004119340796023607, -0.00400357972830534, -0.0038878186605870724, -0.0037720573600381613, -0.003656296292319894, -0.0035405349917709827, -0.0034247739240527153, -0.003309012623503804, -0.0031932515557855368, -0.0030774904880672693, -0.002961729420349002, -0.002845968119800091, -0.0027302070520818233, -0.0026144457515329123, -0.002498684683814645, -0.0023829233832657337, -0.0022671623155474663, -0.002151401014998555, -0.0020356399472802877, -0.0019198786467313766, -0.0018041174625977874, -0.0016883562784641981, -0.0015725952107459307, -0.0014568339101970196, -0.0013410728424787521, -0.001225311541929841, -0.0011095503577962518, -0.0009937891736626625, -0.0008780279895290732, -0.000762266805395484, -0.0006465056794695556, -0.0005307444953359663, -0.0004149833112023771, -0.0002992221852764487, -0.00018346100114285946, -6.769983156118542e-05, 4.806133802048862e-05, 0.0001638225221540779, 0.0002795836771838367, 0.00039534486131742597, 0.0005111060454510152, 0.0006268672295846045, 0.0007426284137181938, 0.000858389597851783, 0.0009741507237777114, 0.0010899119079113007, 0.00120567309204489, 0.0013214342761784792, 0.0014371954603120685, 0.0015529566444456577]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 13.0, 17.0, 13.0, 15.0, 14.0, 23.0, 31.0, 21.0, 38.0, 26.0, 26.0, 36.0, 56.0, 55.0, 52.0, 46.0, 47.0, 54.0, 52.0, 44.0, 25.0, 44.0, 34.0, 32.0, 28.0, 21.0, 19.0, 18.0, 13.0, 15.0, 11.0, 12.0, 9.0, 2.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002983212471008301, -0.00028892606496810913, -0.0002795308828353882, -0.00027013570070266724, -0.0002607405185699463, -0.00025134533643722534, -0.0002419501543045044, -0.00023255497217178345, -0.0002231597900390625, -0.00021376460790634155, -0.0002043694257736206, -0.00019497424364089966, -0.0001855790615081787, -0.00017618387937545776, -0.00016678869724273682, -0.00015739351511001587, -0.00014799833297729492, -0.00013860315084457397, -0.00012920796871185303, -0.00011981278657913208, -0.00011041760444641113, -0.00010102242231369019, -9.162724018096924e-05, -8.223205804824829e-05, -7.283687591552734e-05, -6.34416937828064e-05, -5.404651165008545e-05, -4.46513295173645e-05, -3.5256147384643555e-05, -2.5860965251922607e-05, -1.646578311920166e-05, -7.070600986480713e-06, 2.3245811462402344e-06, 1.1719763278961182e-05, 2.111494541168213e-05, 3.0510127544403076e-05, 3.9905309677124023e-05, 4.930049180984497e-05, 5.869567394256592e-05, 6.809085607528687e-05, 7.748603820800781e-05, 8.688122034072876e-05, 9.627640247344971e-05, 0.00010567158460617065, 0.0001150667667388916, 0.00012446194887161255, 0.0001338571310043335, 0.00014325231313705444, 0.0001526474952697754, 0.00016204267740249634, 0.00017143785953521729, 0.00018083304166793823, 0.00019022822380065918, 0.00019962340593338013, 0.00020901858806610107, 0.00021841377019882202, 0.00022780895233154297, 0.00023720413446426392, 0.00024659931659698486, 0.0002559944987297058, 0.00026538968086242676, 0.0002747848629951477, 0.00028418004512786865, 0.0002935752272605896, 0.00030297040939331055]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 5.0, 13.0, 18.0, 19.0, 17.0, 22.0, 18.0, 33.0, 30.0, 28.0, 39.0, 43.0, 35.0, 38.0, 37.0, 53.0, 51.0, 39.0, 56.0, 41.0, 37.0, 48.0, 35.0, 27.0, 25.0, 34.0, 20.0, 22.0, 20.0, 18.0, 8.0, 7.0, 12.0, 14.0, 8.0, 9.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2894134521484375, -1.245819091796875, -1.2022247314453125, -1.15863037109375, -1.1150360107421875, -1.071441650390625, -1.0278472900390625, -0.9842529296875, -0.9406585693359375, -0.897064208984375, -0.8534698486328125, -0.80987548828125, -0.7662811279296875, -0.722686767578125, -0.6790924072265625, -0.635498046875, -0.5919036865234375, -0.548309326171875, -0.5047149658203125, -0.46112060546875, -0.4175262451171875, -0.373931884765625, -0.3303375244140625, -0.2867431640625, -0.2431488037109375, -0.199554443359375, -0.1559600830078125, -0.11236572265625, -0.0687713623046875, -0.025177001953125, 0.0184173583984375, 0.06201171875, 0.1056060791015625, 0.149200439453125, 0.1927947998046875, 0.23638916015625, 0.2799835205078125, 0.323577880859375, 0.3671722412109375, 0.4107666015625, 0.4543609619140625, 0.497955322265625, 0.5415496826171875, 0.58514404296875, 0.6287384033203125, 0.672332763671875, 0.7159271240234375, 0.759521484375, 0.8031158447265625, 0.846710205078125, 0.8903045654296875, 0.93389892578125, 0.9774932861328125, 1.021087646484375, 1.0646820068359375, 1.1082763671875, 1.1518707275390625, 1.195465087890625, 1.2390594482421875, 1.28265380859375, 1.3262481689453125, 1.369842529296875, 1.4134368896484375, 1.45703125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 13.0, 15.0, 17.0, 31.0, 39.0, 69.0, 99.0, 128.0, 163.0, 259.0, 388.0, 622.0, 1147.0, 1974.0, 3485.0, 6780.0, 13542.0, 29863.0, 74622.0, 199490.0, 385026.0, 198367.0, 74057.0, 29613.0, 13525.0, 6661.0, 3666.0, 1895.0, 1104.0, 690.0, 389.0, 259.0, 174.0, 112.0, 77.0, 59.0, 38.0, 36.0, 19.0, 16.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5927734375, -1.546600341796875, -1.50042724609375, -1.454254150390625, -1.4080810546875, -1.361907958984375, -1.31573486328125, -1.269561767578125, -1.223388671875, -1.177215576171875, -1.13104248046875, -1.084869384765625, -1.0386962890625, -0.992523193359375, -0.94635009765625, -0.900177001953125, -0.85400390625, -0.807830810546875, -0.76165771484375, -0.715484619140625, -0.6693115234375, -0.623138427734375, -0.57696533203125, -0.530792236328125, -0.484619140625, -0.438446044921875, -0.39227294921875, -0.346099853515625, -0.2999267578125, -0.253753662109375, -0.20758056640625, -0.161407470703125, -0.115234375, -0.069061279296875, -0.02288818359375, 0.023284912109375, 0.0694580078125, 0.115631103515625, 0.16180419921875, 0.207977294921875, 0.254150390625, 0.300323486328125, 0.34649658203125, 0.392669677734375, 0.4388427734375, 0.485015869140625, 0.53118896484375, 0.577362060546875, 0.62353515625, 0.669708251953125, 0.71588134765625, 0.762054443359375, 0.8082275390625, 0.854400634765625, 0.90057373046875, 0.946746826171875, 0.992919921875, 1.039093017578125, 1.08526611328125, 1.131439208984375, 1.1776123046875, 1.223785400390625, 1.26995849609375, 1.316131591796875, 1.3623046875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 9.0, 5.0, 15.0, 10.0, 17.0, 11.0, 15.0, 25.0, 32.0, 28.0, 37.0, 47.0, 38.0, 39.0, 44.0, 68.0, 103.0, 237.0, 1527.0, 234.0, 84.0, 55.0, 47.0, 35.0, 31.0, 32.0, 33.0, 30.0, 29.0, 26.0, 22.0, 23.0, 9.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.94140625, -4.7935791015625, -4.645751953125, -4.4979248046875, -4.35009765625, -4.2022705078125, -4.054443359375, -3.9066162109375, -3.7587890625, -3.6109619140625, -3.463134765625, -3.3153076171875, -3.16748046875, -3.0196533203125, -2.871826171875, -2.7239990234375, -2.576171875, -2.4283447265625, -2.280517578125, -2.1326904296875, -1.98486328125, -1.8370361328125, -1.689208984375, -1.5413818359375, -1.3935546875, -1.2457275390625, -1.097900390625, -0.9500732421875, -0.80224609375, -0.6544189453125, -0.506591796875, -0.3587646484375, -0.2109375, -0.0631103515625, 0.084716796875, 0.2325439453125, 0.38037109375, 0.5281982421875, 0.676025390625, 0.8238525390625, 0.9716796875, 1.1195068359375, 1.267333984375, 1.4151611328125, 1.56298828125, 1.7108154296875, 1.858642578125, 2.0064697265625, 2.154296875, 2.3021240234375, 2.449951171875, 2.5977783203125, 2.74560546875, 2.8934326171875, 3.041259765625, 3.1890869140625, 3.3369140625, 3.4847412109375, 3.632568359375, 3.7803955078125, 3.92822265625, 4.0760498046875, 4.223876953125, 4.3717041015625, 4.51953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 3.0, 11.0, 10.0, 6.0, 16.0, 28.0, 30.0, 44.0, 30.0, 68.0, 61.0, 91.0, 164.0, 258.0, 629.0, 1960.0, 20424.0, 1930017.0, 1172163.0, 16590.0, 1699.0, 496.0, 274.0, 155.0, 106.0, 89.0, 59.0, 41.0, 38.0, 23.0, 23.0, 17.0, 16.0, 14.0, 8.0, 7.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3125, -8.060302734375, -7.80810546875, -7.555908203125, -7.3037109375, -7.051513671875, -6.79931640625, -6.547119140625, -6.294921875, -6.042724609375, -5.79052734375, -5.538330078125, -5.2861328125, -5.033935546875, -4.78173828125, -4.529541015625, -4.27734375, -4.025146484375, -3.77294921875, -3.520751953125, -3.2685546875, -3.016357421875, -2.76416015625, -2.511962890625, -2.259765625, -2.007568359375, -1.75537109375, -1.503173828125, -1.2509765625, -0.998779296875, -0.74658203125, -0.494384765625, -0.2421875, 0.010009765625, 0.26220703125, 0.514404296875, 0.7666015625, 1.018798828125, 1.27099609375, 1.523193359375, 1.775390625, 2.027587890625, 2.27978515625, 2.531982421875, 2.7841796875, 3.036376953125, 3.28857421875, 3.540771484375, 3.79296875, 4.045166015625, 4.29736328125, 4.549560546875, 4.8017578125, 5.053955078125, 5.30615234375, 5.558349609375, 5.810546875, 6.062744140625, 6.31494140625, 6.567138671875, 6.8193359375, 7.071533203125, 7.32373046875, 7.575927734375, 7.828125]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 11.0, 69.0, 236.0, 379.0, 250.0, 62.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.540201187133789, -11.824516296386719, -11.108830451965332, -10.393145561218262, -9.677459716796875, -8.961774826049805, -8.246089935302734, -7.530404567718506, -6.814719200134277, -6.099033832550049, -5.38334846496582, -4.66766357421875, -3.9519782066345215, -3.236292839050293, -2.5206079483032227, -1.8049225807189941, -1.0892372131347656, -0.37355196475982666, 0.3421332836151123, 1.0578184127807617, 1.7735037803649902, 2.4891891479492188, 3.204874038696289, 3.9205594062805176, 4.636244773864746, 5.351930141448975, 6.067615509033203, 6.783300399780273, 7.498985767364502, 8.21467113494873, 8.9303560256958, 9.646041870117188, 10.36172866821289, 11.077413558959961, 11.793099403381348, 12.508784294128418, 13.224470138549805, 13.940155029296875, 14.655839920043945, 15.371524810791016, 16.08721160888672, 16.80289649963379, 17.51858139038086, 18.234268188476562, 18.949953079223633, 19.665637969970703, 20.381322860717773, 21.097007751464844, 21.812692642211914, 22.528377532958984, 23.244062423706055, 23.959747314453125, 24.675434112548828, 25.3911190032959, 26.10680389404297, 26.82248878479004, 27.53817367553711, 28.25385856628418, 28.96954345703125, 29.685230255126953, 30.400915145874023, 31.116600036621094, 31.832284927368164, 32.547969818115234, 33.26365661621094]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 8.0, 11.0, 18.0, 7.0, 15.0, 21.0, 24.0, 37.0, 26.0, 25.0, 33.0, 34.0, 39.0, 35.0, 42.0, 47.0, 30.0, 50.0, 38.0, 43.0, 46.0, 39.0, 37.0, 37.0, 27.0, 22.0, 25.0, 23.0, 27.0, 12.0, 23.0, 10.0, 14.0, 15.0, 13.0, 6.0, 12.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-16.035961151123047, -15.573179244995117, -15.110397338867188, -14.647616386413574, -14.184834480285645, -13.722052574157715, -13.259271621704102, -12.796489715576172, -12.333707809448242, -11.870925903320312, -11.408143997192383, -10.94536304473877, -10.48258113861084, -10.01979923248291, -9.557018280029297, -9.094236373901367, -8.631454467773438, -8.168672561645508, -7.705891132354736, -7.243109703063965, -6.780327796936035, -6.3175458908081055, -5.854764461517334, -5.3919830322265625, -4.929201126098633, -4.466419219970703, -4.003637790679932, -3.540856122970581, -3.0780744552612305, -2.61529278755188, -2.1525111198425293, -1.6897294521331787, -1.2269477844238281, -0.7641661167144775, -0.30138444900512695, 0.16139721870422363, 0.6241788864135742, 1.0869605541229248, 1.5497422218322754, 2.012523889541626, 2.4753055572509766, 2.938087224960327, 3.4008688926696777, 3.8636505603790283, 4.326432228088379, 4.789214134216309, 5.25199556350708, 5.714776992797852, 6.177558898925781, 6.640340805053711, 7.103122234344482, 7.565903663635254, 8.028685569763184, 8.491467475891113, 8.954248428344727, 9.417030334472656, 9.879812240600586, 10.342594146728516, 10.805376052856445, 11.268157005310059, 11.730938911437988, 12.193720817565918, 12.656501770019531, 13.119283676147461, 13.58206558227539]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 6.0, 11.0, 11.0, 9.0, 12.0, 19.0, 20.0, 19.0, 23.0, 32.0, 27.0, 23.0, 35.0, 40.0, 36.0, 32.0, 44.0, 56.0, 38.0, 57.0, 45.0, 43.0, 49.0, 39.0, 28.0, 32.0, 34.0, 24.0, 24.0, 28.0, 19.0, 13.0, 14.0, 14.0, 9.0, 13.0, 7.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4287109375, -1.382354736328125, -1.33599853515625, -1.289642333984375, -1.2432861328125, -1.196929931640625, -1.15057373046875, -1.104217529296875, -1.057861328125, -1.011505126953125, -0.96514892578125, -0.918792724609375, -0.8724365234375, -0.826080322265625, -0.77972412109375, -0.733367919921875, -0.68701171875, -0.640655517578125, -0.59429931640625, -0.547943115234375, -0.5015869140625, -0.455230712890625, -0.40887451171875, -0.362518310546875, -0.316162109375, -0.269805908203125, -0.22344970703125, -0.177093505859375, -0.1307373046875, -0.084381103515625, -0.03802490234375, 0.008331298828125, 0.0546875, 0.101043701171875, 0.14739990234375, 0.193756103515625, 0.2401123046875, 0.286468505859375, 0.33282470703125, 0.379180908203125, 0.425537109375, 0.471893310546875, 0.51824951171875, 0.564605712890625, 0.6109619140625, 0.657318115234375, 0.70367431640625, 0.750030517578125, 0.79638671875, 0.842742919921875, 0.88909912109375, 0.935455322265625, 0.9818115234375, 1.028167724609375, 1.07452392578125, 1.120880126953125, 1.167236328125, 1.213592529296875, 1.25994873046875, 1.306304931640625, 1.3526611328125, 1.399017333984375, 1.44537353515625, 1.491729736328125, 1.5380859375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 11.0, 8.0, 12.0, 13.0, 12.0, 15.0, 14.0, 16.0, 21.0, 28.0, 30.0, 31.0, 37.0, 82.0, 156.0, 480.0, 1818.0, 12125.0, 193414.0, 3238021.0, 713958.0, 29248.0, 3424.0, 693.0, 212.0, 93.0, 60.0, 42.0, 26.0, 25.0, 28.0, 25.0, 18.0, 22.0, 14.0, 7.0, 11.0, 7.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1796875, -5.984619140625, -5.78955078125, -5.594482421875, -5.3994140625, -5.204345703125, -5.00927734375, -4.814208984375, -4.619140625, -4.424072265625, -4.22900390625, -4.033935546875, -3.8388671875, -3.643798828125, -3.44873046875, -3.253662109375, -3.05859375, -2.863525390625, -2.66845703125, -2.473388671875, -2.2783203125, -2.083251953125, -1.88818359375, -1.693115234375, -1.498046875, -1.302978515625, -1.10791015625, -0.912841796875, -0.7177734375, -0.522705078125, -0.32763671875, -0.132568359375, 0.0625, 0.257568359375, 0.45263671875, 0.647705078125, 0.8427734375, 1.037841796875, 1.23291015625, 1.427978515625, 1.623046875, 1.818115234375, 2.01318359375, 2.208251953125, 2.4033203125, 2.598388671875, 2.79345703125, 2.988525390625, 3.18359375, 3.378662109375, 3.57373046875, 3.768798828125, 3.9638671875, 4.158935546875, 4.35400390625, 4.549072265625, 4.744140625, 4.939208984375, 5.13427734375, 5.329345703125, 5.5244140625, 5.719482421875, 5.91455078125, 6.109619140625, 6.3046875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 14.0, 20.0, 18.0, 30.0, 39.0, 53.0, 79.0, 117.0, 145.0, 238.0, 275.0, 403.0, 505.0, 459.0, 437.0, 332.0, 257.0, 188.0, 108.0, 95.0, 69.0, 40.0, 26.0, 32.0, 20.0, 18.0, 8.0, 9.0, 6.0, 10.0, 1.0, 3.0, 6.0, 0.0, 0.0, 1.0], "bins": [-5.4375, -5.305511474609375, -5.17352294921875, -5.041534423828125, -4.9095458984375, -4.777557373046875, -4.64556884765625, -4.513580322265625, -4.381591796875, -4.249603271484375, -4.11761474609375, -3.985626220703125, -3.8536376953125, -3.721649169921875, -3.58966064453125, -3.457672119140625, -3.32568359375, -3.193695068359375, -3.06170654296875, -2.929718017578125, -2.7977294921875, -2.665740966796875, -2.53375244140625, -2.401763916015625, -2.269775390625, -2.137786865234375, -2.00579833984375, -1.873809814453125, -1.7418212890625, -1.609832763671875, -1.47784423828125, -1.345855712890625, -1.2138671875, -1.081878662109375, -0.94989013671875, -0.817901611328125, -0.6859130859375, -0.553924560546875, -0.42193603515625, -0.289947509765625, -0.157958984375, -0.025970458984375, 0.10601806640625, 0.238006591796875, 0.3699951171875, 0.501983642578125, 0.63397216796875, 0.765960693359375, 0.89794921875, 1.029937744140625, 1.16192626953125, 1.293914794921875, 1.4259033203125, 1.557891845703125, 1.68988037109375, 1.821868896484375, 1.953857421875, 2.085845947265625, 2.21783447265625, 2.349822998046875, 2.4818115234375, 2.613800048828125, 2.74578857421875, 2.877777099609375, 3.009765625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 17.0, 15.0, 32.0, 33.0, 44.0, 65.0, 88.0, 160.0, 226.0, 389.0, 903.0, 2610.0, 11670.0, 106132.0, 1723480.0, 2188735.0, 140675.0, 14057.0, 2878.0, 989.0, 408.0, 223.0, 118.0, 89.0, 68.0, 51.0, 27.0, 27.0, 13.0, 11.0, 10.0, 5.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.027587890625, -5.76611328125, -5.504638671875, -5.2431640625, -4.981689453125, -4.72021484375, -4.458740234375, -4.197265625, -3.935791015625, -3.67431640625, -3.412841796875, -3.1513671875, -2.889892578125, -2.62841796875, -2.366943359375, -2.10546875, -1.843994140625, -1.58251953125, -1.321044921875, -1.0595703125, -0.798095703125, -0.53662109375, -0.275146484375, -0.013671875, 0.247802734375, 0.50927734375, 0.770751953125, 1.0322265625, 1.293701171875, 1.55517578125, 1.816650390625, 2.078125, 2.339599609375, 2.60107421875, 2.862548828125, 3.1240234375, 3.385498046875, 3.64697265625, 3.908447265625, 4.169921875, 4.431396484375, 4.69287109375, 4.954345703125, 5.2158203125, 5.477294921875, 5.73876953125, 6.000244140625, 6.26171875, 6.523193359375, 6.78466796875, 7.046142578125, 7.3076171875, 7.569091796875, 7.83056640625, 8.092041015625, 8.353515625, 8.614990234375, 8.87646484375, 9.137939453125, 9.3994140625, 9.660888671875, 9.92236328125, 10.183837890625, 10.4453125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 19.0, 25.0, 40.0, 74.0, 74.0, 101.0, 111.0, 142.0, 113.0, 101.0, 77.0, 53.0, 35.0, 19.0, 9.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.354969024658203, -28.734386444091797, -28.113805770874023, -27.493223190307617, -26.87264060974121, -26.252059936523438, -25.63147735595703, -25.010894775390625, -24.39031219482422, -23.769729614257812, -23.14914894104004, -22.528566360473633, -21.907983779907227, -21.287403106689453, -20.666820526123047, -20.04623794555664, -19.425657272338867, -18.80507469177246, -18.184494018554688, -17.56391143798828, -16.943328857421875, -16.32274627685547, -15.702165603637695, -15.081583023071289, -14.4610013961792, -13.84041976928711, -13.219837188720703, -12.599255561828613, -11.978673934936523, -11.358091354370117, -10.737509727478027, -10.116928100585938, -9.496347427368164, -8.875765800476074, -8.255183219909668, -7.634601593017578, -7.01401948928833, -6.393437385559082, -5.772855758666992, -5.152273654937744, -4.531691551208496, -3.911109447479248, -3.290527582168579, -2.66994571685791, -2.049363613128662, -1.428781509399414, -0.8081996440887451, -0.18761777877807617, 0.4329643249511719, 1.0535463094711304, 1.6741282939910889, 2.294710159301758, 2.915292263031006, 3.535874366760254, 4.156455993652344, 4.777038097381592, 5.39762020111084, 6.018202304840088, 6.638784408569336, 7.259366035461426, 7.879948139190674, 8.500530242919922, 9.121111869812012, 9.741693496704102, 10.362276077270508]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 10.0, 14.0, 12.0, 13.0, 16.0, 15.0, 26.0, 15.0, 24.0, 25.0, 27.0, 22.0, 28.0, 29.0, 34.0, 34.0, 41.0, 42.0, 38.0, 40.0, 40.0, 39.0, 42.0, 40.0, 36.0, 35.0, 29.0, 24.0, 18.0, 24.0, 13.0, 18.0, 23.0, 24.0, 13.0, 13.0, 8.0, 11.0, 9.0, 8.0, 6.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-12.049810409545898, -11.677988052368164, -11.30616569519043, -10.934343338012695, -10.562520980834961, -10.19069766998291, -9.818875312805176, -9.447052955627441, -9.075230598449707, -8.703408241271973, -8.331585884094238, -7.959763050079346, -7.587940692901611, -7.216118335723877, -6.844295501708984, -6.47247314453125, -6.100650787353516, -5.728828430175781, -5.357006072998047, -4.985183238983154, -4.61336088180542, -4.2415385246276855, -3.869715929031372, -3.4978933334350586, -3.126070976257324, -2.75424861907959, -2.3824260234832764, -2.010603427886963, -1.6387810707092285, -1.2669585943222046, -0.8951361179351807, -0.5233135223388672, -0.1514911651611328, 0.2203313112258911, 0.592153787612915, 0.963976263999939, 1.335798740386963, 1.7076212167739868, 2.0794436931610107, 2.451266288757324, 2.8230886459350586, 3.194911003112793, 3.5667335987091064, 3.93855619430542, 4.310378551483154, 4.682200908660889, 5.054023742675781, 5.425846099853516, 5.79766845703125, 6.169490814208984, 6.541313171386719, 6.913136005401611, 7.284958362579346, 7.65678071975708, 8.028603553771973, 8.400425910949707, 8.772248268127441, 9.144070625305176, 9.51589298248291, 9.887715339660645, 10.259538650512695, 10.63136100769043, 11.003183364868164, 11.375005722045898, 11.746828079223633]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 12.0, 9.0, 18.0, 17.0, 13.0, 22.0, 13.0, 15.0, 20.0, 29.0, 27.0, 30.0, 29.0, 40.0, 55.0, 46.0, 49.0, 35.0, 38.0, 42.0, 41.0, 45.0, 32.0, 34.0, 44.0, 29.0, 19.0, 33.0, 20.0, 20.0, 12.0, 15.0, 22.0, 14.0, 6.0, 8.0, 9.0, 5.0, 9.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2734375, -1.2295379638671875, -1.185638427734375, -1.1417388916015625, -1.09783935546875, -1.0539398193359375, -1.010040283203125, -0.9661407470703125, -0.9222412109375, -0.8783416748046875, -0.834442138671875, -0.7905426025390625, -0.74664306640625, -0.7027435302734375, -0.658843994140625, -0.6149444580078125, -0.571044921875, -0.5271453857421875, -0.483245849609375, -0.4393463134765625, -0.39544677734375, -0.3515472412109375, -0.307647705078125, -0.2637481689453125, -0.2198486328125, -0.1759490966796875, -0.132049560546875, -0.0881500244140625, -0.04425048828125, -0.0003509521484375, 0.043548583984375, 0.0874481201171875, 0.13134765625, 0.1752471923828125, 0.219146728515625, 0.2630462646484375, 0.30694580078125, 0.3508453369140625, 0.394744873046875, 0.4386444091796875, 0.4825439453125, 0.5264434814453125, 0.570343017578125, 0.6142425537109375, 0.65814208984375, 0.7020416259765625, 0.745941162109375, 0.7898406982421875, 0.833740234375, 0.8776397705078125, 0.921539306640625, 0.9654388427734375, 1.00933837890625, 1.0532379150390625, 1.097137451171875, 1.1410369873046875, 1.1849365234375, 1.2288360595703125, 1.272735595703125, 1.3166351318359375, 1.36053466796875, 1.4044342041015625, 1.448333740234375, 1.4922332763671875, 1.5361328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 15.0, 24.0, 41.0, 37.0, 56.0, 80.0, 115.0, 184.0, 225.0, 329.0, 469.0, 693.0, 1090.0, 1443.0, 2195.0, 3370.0, 5029.0, 7819.0, 12330.0, 19972.0, 32768.0, 56516.0, 99313.0, 175462.0, 242434.0, 161135.0, 91178.0, 51909.0, 30280.0, 18697.0, 11440.0, 7393.0, 4728.0, 3123.0, 2133.0, 1360.0, 965.0, 664.0, 477.0, 308.0, 214.0, 147.0, 111.0, 71.0, 73.0, 27.0, 26.0, 19.0, 14.0, 10.0, 11.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.166259765625, -0.1607952117919922, -0.15533065795898438, -0.14986610412597656, -0.14440155029296875, -0.13893699645996094, -0.13347244262695312, -0.1280078887939453, -0.1225433349609375, -0.11707878112792969, -0.11161422729492188, -0.10614967346191406, -0.10068511962890625, -0.09522056579589844, -0.08975601196289062, -0.08429145812988281, -0.078826904296875, -0.07336235046386719, -0.06789779663085938, -0.06243324279785156, -0.05696868896484375, -0.05150413513183594, -0.046039581298828125, -0.04057502746582031, -0.0351104736328125, -0.029645919799804688, -0.024181365966796875, -0.018716812133789062, -0.01325225830078125, -0.0077877044677734375, -0.002323150634765625, 0.0031414031982421875, 0.00860595703125, 0.014070510864257812, 0.019535064697265625, 0.024999618530273438, 0.03046417236328125, 0.03592872619628906, 0.041393280029296875, 0.04685783386230469, 0.0523223876953125, 0.05778694152832031, 0.06325149536132812, 0.06871604919433594, 0.07418060302734375, 0.07964515686035156, 0.08510971069335938, 0.09057426452636719, 0.096038818359375, 0.10150337219238281, 0.10696792602539062, 0.11243247985839844, 0.11789703369140625, 0.12336158752441406, 0.12882614135742188, 0.1342906951904297, 0.1397552490234375, 0.1452198028564453, 0.15068435668945312, 0.15614891052246094, 0.16161346435546875, 0.16707801818847656, 0.17254257202148438, 0.1780071258544922, 0.1834716796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 9.0, 3.0, 5.0, 8.0, 6.0, 7.0, 12.0, 8.0, 17.0, 12.0, 20.0, 19.0, 21.0, 29.0, 28.0, 18.0, 24.0, 36.0, 30.0, 54.0, 41.0, 48.0, 38.0, 1064.0, 39.0, 36.0, 35.0, 31.0, 37.0, 32.0, 25.0, 30.0, 40.0, 26.0, 22.0, 14.0, 13.0, 13.0, 21.0, 17.0, 7.0, 7.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8330841064453125, -0.805328369140625, -0.7775726318359375, -0.74981689453125, -0.7220611572265625, -0.694305419921875, -0.6665496826171875, -0.6387939453125, -0.6110382080078125, -0.583282470703125, -0.5555267333984375, -0.52777099609375, -0.5000152587890625, -0.472259521484375, -0.4445037841796875, -0.416748046875, -0.3889923095703125, -0.361236572265625, -0.3334808349609375, -0.30572509765625, -0.2779693603515625, -0.250213623046875, -0.2224578857421875, -0.1947021484375, -0.1669464111328125, -0.139190673828125, -0.1114349365234375, -0.08367919921875, -0.0559234619140625, -0.028167724609375, -0.0004119873046875, 0.02734375, 0.0550994873046875, 0.082855224609375, 0.1106109619140625, 0.13836669921875, 0.1661224365234375, 0.193878173828125, 0.2216339111328125, 0.2493896484375, 0.2771453857421875, 0.304901123046875, 0.3326568603515625, 0.36041259765625, 0.3881683349609375, 0.415924072265625, 0.4436798095703125, 0.471435546875, 0.4991912841796875, 0.526947021484375, 0.5547027587890625, 0.58245849609375, 0.6102142333984375, 0.637969970703125, 0.6657257080078125, 0.6934814453125, 0.7212371826171875, 0.748992919921875, 0.7767486572265625, 0.80450439453125, 0.8322601318359375, 0.860015869140625, 0.8877716064453125, 0.91552734375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 18.0, 22.0, 27.0, 49.0, 83.0, 110.0, 153.0, 240.0, 393.0, 585.0, 915.0, 1418.0, 2117.0, 3363.0, 5253.0, 8449.0, 14075.0, 22840.0, 38911.0, 67453.0, 122172.0, 230333.0, 1262001.0, 134550.0, 73876.0, 42468.0, 25419.0, 14965.0, 9328.0, 5536.0, 3633.0, 2210.0, 1426.0, 915.0, 610.0, 409.0, 255.0, 166.0, 133.0, 63.0, 61.0, 45.0, 31.0, 15.0, 11.0, 6.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1375732421875, -0.13299942016601562, -0.12842559814453125, -0.12385177612304688, -0.1192779541015625, -0.11470413208007812, -0.11013031005859375, -0.10555648803710938, -0.100982666015625, -0.09640884399414062, -0.09183502197265625, -0.08726119995117188, -0.0826873779296875, -0.07811355590820312, -0.07353973388671875, -0.06896591186523438, -0.06439208984375, -0.059818267822265625, -0.05524444580078125, -0.050670623779296875, -0.0460968017578125, -0.041522979736328125, -0.03694915771484375, -0.032375335693359375, -0.027801513671875, -0.023227691650390625, -0.01865386962890625, -0.014080047607421875, -0.0095062255859375, -0.004932403564453125, -0.00035858154296875, 0.004215240478515625, 0.0087890625, 0.013362884521484375, 0.01793670654296875, 0.022510528564453125, 0.0270843505859375, 0.031658172607421875, 0.03623199462890625, 0.040805816650390625, 0.045379638671875, 0.049953460693359375, 0.05452728271484375, 0.059101104736328125, 0.0636749267578125, 0.06824874877929688, 0.07282257080078125, 0.07739639282226562, 0.08197021484375, 0.08654403686523438, 0.09111785888671875, 0.09569168090820312, 0.1002655029296875, 0.10483932495117188, 0.10941314697265625, 0.11398696899414062, 0.118560791015625, 0.12313461303710938, 0.12770843505859375, 0.13228225708007812, 0.1368560791015625, 0.14142990112304688, 0.14600372314453125, 0.15057754516601562, 0.1551513671875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 1.0, 4.0, 13.0, 12.0, 13.0, 19.0, 34.0, 40.0, 56.0, 56.0, 64.0, 64.0, 61.0, 87.0, 87.0, 75.0, 62.0, 42.0, 46.0, 32.0, 21.0, 19.0, 19.0, 9.0, 10.0, 8.0, 11.0, 6.0, 3.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007195472717285156, -0.0006979405879974365, -0.0006763339042663574, -0.0006547272205352783, -0.0006331205368041992, -0.0006115138530731201, -0.000589907169342041, -0.0005683004856109619, -0.0005466938018798828, -0.0005250871181488037, -0.0005034804344177246, -0.0004818737506866455, -0.0004602670669555664, -0.0004386603832244873, -0.0004170536994934082, -0.0003954470157623291, -0.00037384033203125, -0.0003522336483001709, -0.0003306269645690918, -0.0003090202808380127, -0.0002874135971069336, -0.0002658069133758545, -0.0002442002296447754, -0.0002225935459136963, -0.0002009868621826172, -0.00017938017845153809, -0.00015777349472045898, -0.00013616681098937988, -0.00011456012725830078, -9.295344352722168e-05, -7.134675979614258e-05, -4.9740076065063477e-05, -2.8133392333984375e-05, -6.5267086029052734e-06, 1.5079975128173828e-05, 3.668665885925293e-05, 5.829334259033203e-05, 7.990002632141113e-05, 0.00010150671005249023, 0.00012311339378356934, 0.00014472007751464844, 0.00016632676124572754, 0.00018793344497680664, 0.00020954012870788574, 0.00023114681243896484, 0.00025275349617004395, 0.00027436017990112305, 0.00029596686363220215, 0.00031757354736328125, 0.00033918023109436035, 0.00036078691482543945, 0.00038239359855651855, 0.00040400028228759766, 0.00042560696601867676, 0.00044721364974975586, 0.00046882033348083496, 0.0004904270172119141, 0.0005120337009429932, 0.0005336403846740723, 0.0005552470684051514, 0.0005768537521362305, 0.0005984604358673096, 0.0006200671195983887, 0.0006416738033294678, 0.0006632804870605469]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 10.0, 6.0, 6.0, 9.0, 15.0, 15.0, 27.0, 31.0, 52.0, 53.0, 95.0, 113.0, 174.0, 353.0, 665.0, 6337.0, 1028132.0, 10690.0, 712.0, 327.0, 220.0, 160.0, 102.0, 58.0, 51.0, 28.0, 24.0, 24.0, 15.0, 11.0, 4.0, 9.0, 7.0, 6.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01235198974609375, -0.011919260025024414, -0.011486530303955078, -0.011053800582885742, -0.010621070861816406, -0.01018834114074707, -0.009755611419677734, -0.009322881698608398, -0.008890151977539062, -0.008457422256469727, -0.00802469253540039, -0.007591962814331055, -0.007159233093261719, -0.006726503372192383, -0.006293773651123047, -0.005861043930053711, -0.005428314208984375, -0.004995584487915039, -0.004562854766845703, -0.004130125045776367, -0.0036973953247070312, -0.0032646656036376953, -0.0028319358825683594, -0.0023992061614990234, -0.0019664764404296875, -0.0015337467193603516, -0.0011010169982910156, -0.0006682872772216797, -0.00023555755615234375, 0.0001971721649169922, 0.0006299018859863281, 0.001062631607055664, 0.001495361328125, 0.001928091049194336, 0.002360820770263672, 0.002793550491333008, 0.0032262802124023438, 0.0036590099334716797, 0.004091739654541016, 0.0045244693756103516, 0.0049571990966796875, 0.0053899288177490234, 0.005822658538818359, 0.006255388259887695, 0.006688117980957031, 0.007120847702026367, 0.007553577423095703, 0.007986307144165039, 0.008419036865234375, 0.008851766586303711, 0.009284496307373047, 0.009717226028442383, 0.010149955749511719, 0.010582685470581055, 0.01101541519165039, 0.011448144912719727, 0.011880874633789062, 0.012313604354858398, 0.012746334075927734, 0.01317906379699707, 0.013611793518066406, 0.014044523239135742, 0.014477252960205078, 0.014909982681274414, 0.01534271240234375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 59.0, 825.0, 133.0], "bins": [-0.007198513485491276, -0.007083520758897066, -0.0069685280323028564, -0.006853535771369934, -0.006738543044775724, -0.006623550318181515, -0.006508557591587305, -0.006393564864993095, -0.006278572138398886, -0.006163579411804676, -0.006048586685210466, -0.005933593958616257, -0.005818601697683334, -0.005703608971089125, -0.005588616244494915, -0.005473623517900705, -0.005358631256967783, -0.005243638530373573, -0.005128645803779364, -0.005013653077185154, -0.004898660816252232, -0.004783668089658022, -0.004668675363063812, -0.004553682636469603, -0.004438689909875393, -0.004323697183281183, -0.004208704456686974, -0.004093712195754051, -0.0039787194691598415, -0.003863726742565632, -0.003748734015971422, -0.0036337412893772125, -0.0035187487956136465, -0.003403756069019437, -0.003288763575255871, -0.003173770848661661, -0.0030587781220674515, -0.0029437856283038855, -0.002828792901709676, -0.0027138004079461098, -0.0025988076813519, -0.0024838149547576904, -0.0023688224609941244, -0.0022538297343999147, -0.002138837007805705, -0.002023844514042139, -0.0019088517874479294, -0.0017938591772690415, -0.0016788664506748319, -0.001563873840495944, -0.0014488811139017344, -0.0013338885037228465, -0.0012188958935439587, -0.001103903166949749, -0.0009889105567708611, -0.0008739179465919733, -0.0007589252199977636, -0.0006439325516112149, -0.000528939941432327, -0.0004139472730457783, -0.00029895463376306, -0.00018396199448034167, -6.896932609379292e-05, 4.602328408509493e-05, 0.00016101592336781323]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 4.0, 5.0, 8.0, 8.0, 11.0, 13.0, 20.0, 19.0, 26.0, 15.0, 30.0, 18.0, 35.0, 33.0, 33.0, 49.0, 42.0, 40.0, 31.0, 39.0, 42.0, 47.0, 36.0, 45.0, 30.0, 32.0, 27.0, 26.0, 24.0, 23.0, 15.0, 24.0, 28.0, 17.0, 13.0, 14.0, 10.0, 8.0, 14.0, 4.0, 7.0, 10.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002689361572265625, -0.0002603195607662201, -0.0002517029643058777, -0.00024308636784553528, -0.00023446977138519287, -0.00022585317492485046, -0.00021723657846450806, -0.00020861998200416565, -0.00020000338554382324, -0.00019138678908348083, -0.00018277019262313843, -0.00017415359616279602, -0.0001655369997024536, -0.0001569204032421112, -0.0001483038067817688, -0.0001396872103214264, -0.00013107061386108398, -0.00012245401740074158, -0.00011383742094039917, -0.00010522082448005676, -9.660422801971436e-05, -8.798763155937195e-05, -7.937103509902954e-05, -7.075443863868713e-05, -6.213784217834473e-05, -5.352124571800232e-05, -4.490464925765991e-05, -3.6288052797317505e-05, -2.7671456336975098e-05, -1.905485987663269e-05, -1.0438263416290283e-05, -1.821666955947876e-06, 6.794929504394531e-06, 1.541152596473694e-05, 2.4028122425079346e-05, 3.264471888542175e-05, 4.126131534576416e-05, 4.987791180610657e-05, 5.8494508266448975e-05, 6.711110472679138e-05, 7.572770118713379e-05, 8.43442976474762e-05, 9.29608941078186e-05, 0.00010157749056816101, 0.00011019408702850342, 0.00011881068348884583, 0.00012742727994918823, 0.00013604387640953064, 0.00014466047286987305, 0.00015327706933021545, 0.00016189366579055786, 0.00017051026225090027, 0.00017912685871124268, 0.00018774345517158508, 0.0001963600516319275, 0.0002049766480922699, 0.0002135932445526123, 0.0002222098410129547, 0.00023082643747329712, 0.00023944303393363953, 0.00024805963039398193, 0.00025667622685432434, 0.00026529282331466675, 0.00027390941977500916, 0.00028252601623535156]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 8.0, 12.0, 9.0, 18.0, 17.0, 13.0, 22.0, 13.0, 15.0, 20.0, 29.0, 27.0, 30.0, 29.0, 40.0, 55.0, 46.0, 49.0, 35.0, 38.0, 42.0, 41.0, 45.0, 32.0, 34.0, 44.0, 29.0, 19.0, 33.0, 20.0, 20.0, 12.0, 15.0, 22.0, 14.0, 6.0, 8.0, 9.0, 5.0, 9.0, 0.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2734375, -1.2295379638671875, -1.185638427734375, -1.1417388916015625, -1.09783935546875, -1.0539398193359375, -1.010040283203125, -0.9661407470703125, -0.9222412109375, -0.8783416748046875, -0.834442138671875, -0.7905426025390625, -0.74664306640625, -0.7027435302734375, -0.658843994140625, -0.6149444580078125, -0.571044921875, -0.5271453857421875, -0.483245849609375, -0.4393463134765625, -0.39544677734375, -0.3515472412109375, -0.307647705078125, -0.2637481689453125, -0.2198486328125, -0.1759490966796875, -0.132049560546875, -0.0881500244140625, -0.04425048828125, -0.0003509521484375, 0.043548583984375, 0.0874481201171875, 0.13134765625, 0.1752471923828125, 0.219146728515625, 0.2630462646484375, 0.30694580078125, 0.3508453369140625, 0.394744873046875, 0.4386444091796875, 0.4825439453125, 0.5264434814453125, 0.570343017578125, 0.6142425537109375, 0.65814208984375, 0.7020416259765625, 0.745941162109375, 0.7898406982421875, 0.833740234375, 0.8776397705078125, 0.921539306640625, 0.9654388427734375, 1.00933837890625, 1.0532379150390625, 1.097137451171875, 1.1410369873046875, 1.1849365234375, 1.2288360595703125, 1.272735595703125, 1.3166351318359375, 1.36053466796875, 1.4044342041015625, 1.448333740234375, 1.4922332763671875, 1.5361328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 5.0, 8.0, 8.0, 8.0, 15.0, 27.0, 30.0, 39.0, 48.0, 60.0, 105.0, 132.0, 195.0, 258.0, 371.0, 612.0, 1136.0, 2231.0, 5395.0, 14458.0, 47683.0, 193239.0, 480379.0, 220517.0, 54144.0, 15921.0, 5957.0, 2447.0, 1144.0, 640.0, 398.0, 279.0, 167.0, 126.0, 89.0, 80.0, 57.0, 39.0, 26.0, 21.0, 15.0, 11.0, 16.0, 8.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.7939453125, -1.7332305908203125, -1.672515869140625, -1.6118011474609375, -1.55108642578125, -1.4903717041015625, -1.429656982421875, -1.3689422607421875, -1.3082275390625, -1.2475128173828125, -1.186798095703125, -1.1260833740234375, -1.06536865234375, -1.0046539306640625, -0.943939208984375, -0.8832244873046875, -0.822509765625, -0.7617950439453125, -0.701080322265625, -0.6403656005859375, -0.57965087890625, -0.5189361572265625, -0.458221435546875, -0.3975067138671875, -0.3367919921875, -0.2760772705078125, -0.215362548828125, -0.1546478271484375, -0.09393310546875, -0.0332183837890625, 0.027496337890625, 0.0882110595703125, 0.14892578125, 0.2096405029296875, 0.270355224609375, 0.3310699462890625, 0.39178466796875, 0.4524993896484375, 0.513214111328125, 0.5739288330078125, 0.6346435546875, 0.6953582763671875, 0.756072998046875, 0.8167877197265625, 0.87750244140625, 0.9382171630859375, 0.998931884765625, 1.0596466064453125, 1.120361328125, 1.1810760498046875, 1.241790771484375, 1.3025054931640625, 1.36322021484375, 1.4239349365234375, 1.484649658203125, 1.5453643798828125, 1.6060791015625, 1.6667938232421875, 1.727508544921875, 1.7882232666015625, 1.84893798828125, 1.9096527099609375, 1.970367431640625, 2.0310821533203125, 2.091796875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 9.0, 7.0, 5.0, 5.0, 13.0, 10.0, 14.0, 9.0, 12.0, 19.0, 20.0, 27.0, 22.0, 28.0, 36.0, 27.0, 40.0, 49.0, 50.0, 74.0, 120.0, 330.0, 1438.0, 159.0, 77.0, 70.0, 49.0, 39.0, 30.0, 28.0, 33.0, 20.0, 23.0, 22.0, 18.0, 13.0, 16.0, 12.0, 15.0, 12.0, 11.0, 11.0, 3.0, 6.0, 0.0, 2.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-4.78515625, -4.6451416015625, -4.505126953125, -4.3651123046875, -4.22509765625, -4.0850830078125, -3.945068359375, -3.8050537109375, -3.6650390625, -3.5250244140625, -3.385009765625, -3.2449951171875, -3.10498046875, -2.9649658203125, -2.824951171875, -2.6849365234375, -2.544921875, -2.4049072265625, -2.264892578125, -2.1248779296875, -1.98486328125, -1.8448486328125, -1.704833984375, -1.5648193359375, -1.4248046875, -1.2847900390625, -1.144775390625, -1.0047607421875, -0.86474609375, -0.7247314453125, -0.584716796875, -0.4447021484375, -0.3046875, -0.1646728515625, -0.024658203125, 0.1153564453125, 0.25537109375, 0.3953857421875, 0.535400390625, 0.6754150390625, 0.8154296875, 0.9554443359375, 1.095458984375, 1.2354736328125, 1.37548828125, 1.5155029296875, 1.655517578125, 1.7955322265625, 1.935546875, 2.0755615234375, 2.215576171875, 2.3555908203125, 2.49560546875, 2.6356201171875, 2.775634765625, 2.9156494140625, 3.0556640625, 3.1956787109375, 3.335693359375, 3.4757080078125, 3.61572265625, 3.7557373046875, 3.895751953125, 4.0357666015625, 4.17578125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 7.0, 12.0, 17.0, 19.0, 26.0, 31.0, 31.0, 51.0, 51.0, 77.0, 119.0, 194.0, 380.0, 934.0, 4317.0, 98276.0, 2980788.0, 55237.0, 3370.0, 782.0, 329.0, 173.0, 125.0, 78.0, 52.0, 46.0, 32.0, 29.0, 20.0, 18.0, 12.0, 16.0, 14.0, 5.0, 8.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.5699462890625, -8.288330078125, -8.0067138671875, -7.72509765625, -7.4434814453125, -7.161865234375, -6.8802490234375, -6.5986328125, -6.3170166015625, -6.035400390625, -5.7537841796875, -5.47216796875, -5.1905517578125, -4.908935546875, -4.6273193359375, -4.345703125, -4.0640869140625, -3.782470703125, -3.5008544921875, -3.21923828125, -2.9376220703125, -2.656005859375, -2.3743896484375, -2.0927734375, -1.8111572265625, -1.529541015625, -1.2479248046875, -0.96630859375, -0.6846923828125, -0.403076171875, -0.1214599609375, 0.16015625, 0.4417724609375, 0.723388671875, 1.0050048828125, 1.28662109375, 1.5682373046875, 1.849853515625, 2.1314697265625, 2.4130859375, 2.6947021484375, 2.976318359375, 3.2579345703125, 3.53955078125, 3.8211669921875, 4.102783203125, 4.3843994140625, 4.666015625, 4.9476318359375, 5.229248046875, 5.5108642578125, 5.79248046875, 6.0740966796875, 6.355712890625, 6.6373291015625, 6.9189453125, 7.2005615234375, 7.482177734375, 7.7637939453125, 8.04541015625, 8.3270263671875, 8.608642578125, 8.8902587890625, 9.171875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [3.0, 5.0, 31.0, 211.0, 485.0, 233.0, 45.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.144052982330322, -3.2300913333892822, -2.316129684448242, -1.4021680355072021, -0.4882063865661621, 0.42575502395629883, 1.339716911315918, 2.253678798675537, 3.167640209197998, 4.081602096557617, 4.995563507080078, 5.909524917602539, 6.823486804962158, 7.737448215484619, 8.651410102844238, 9.565372467041016, 10.479333877563477, 11.393295288085938, 12.307256698608398, 13.221219062805176, 14.135180473327637, 15.049141883850098, 15.963104248046875, 16.877065658569336, 17.791027069091797, 18.704988479614258, 19.61894989013672, 20.53291130065918, 21.44687271118164, 22.360836029052734, 23.274797439575195, 24.188758850097656, 25.102718353271484, 26.016679763793945, 26.930641174316406, 27.844602584838867, 28.758563995361328, 29.672527313232422, 30.586488723754883, 31.500450134277344, 32.41441345214844, 33.32837677001953, 34.24233627319336, 35.15629959106445, 36.07025909423828, 36.984222412109375, 37.8981819152832, 38.8121452331543, 39.726104736328125, 40.64006805419922, 41.55402755737305, 42.46799087524414, 43.38195037841797, 44.29591369628906, 45.20987319946289, 46.123836517333984, 47.03779602050781, 47.951759338378906, 48.865718841552734, 49.77968215942383, 50.693641662597656, 51.60760498046875, 52.52156448364258, 53.43552780151367, 54.349491119384766]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 10.0, 13.0, 4.0, 9.0, 10.0, 16.0, 15.0, 18.0, 16.0, 23.0, 23.0, 23.0, 21.0, 20.0, 31.0, 32.0, 27.0, 35.0, 39.0, 31.0, 34.0, 41.0, 44.0, 34.0, 28.0, 30.0, 31.0, 39.0, 35.0, 31.0, 26.0, 25.0, 30.0, 20.0, 16.0, 23.0, 11.0, 8.0, 14.0, 11.0, 10.0, 11.0, 3.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0], "bins": [-14.873390197753906, -14.422867774963379, -13.972346305847168, -13.52182388305664, -13.071301460266113, -12.620779037475586, -12.170257568359375, -11.719735145568848, -11.26921272277832, -10.818690299987793, -10.368168830871582, -9.917646408081055, -9.467123985290527, -9.0166015625, -8.566080093383789, -8.115557670593262, -7.665035724639893, -7.214513778686523, -6.763991355895996, -6.313469409942627, -5.8629469871521, -5.4124250411987305, -4.961902618408203, -4.511380672454834, -4.060858726501465, -3.6103365421295166, -3.1598143577575684, -2.709292411804199, -2.258769989013672, -1.8082480430603027, -1.3577258586883545, -0.9072036743164062, -0.4566812515258789, -0.006159096956253052, 0.4443630576133728, 0.8948851823806763, 1.3454073667526245, 1.7959294319152832, 2.2464516162872314, 2.6969738006591797, 3.147495985031128, 3.598018169403076, 4.048540115356445, 4.499062538146973, 4.949584484100342, 5.400106430053711, 5.850628852844238, 6.301151275634766, 6.751673221588135, 7.202195167541504, 7.652717590332031, 8.103240013122559, 8.55376148223877, 9.004283905029297, 9.454806327819824, 9.905328750610352, 10.355850219726562, 10.80637264251709, 11.2568941116333, 11.707416534423828, 12.157938957214355, 12.608461380004883, 13.058982849121094, 13.509505271911621, 13.960027694702148]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 6.0, 2.0, 5.0, 14.0, 9.0, 9.0, 14.0, 16.0, 18.0, 10.0, 14.0, 15.0, 27.0, 21.0, 21.0, 32.0, 38.0, 34.0, 34.0, 33.0, 50.0, 51.0, 45.0, 42.0, 35.0, 43.0, 31.0, 37.0, 42.0, 30.0, 32.0, 31.0, 22.0, 26.0, 18.0, 15.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.33203125, -1.28704833984375, -1.2420654296875, -1.19708251953125, -1.152099609375, -1.10711669921875, -1.0621337890625, -1.01715087890625, -0.97216796875, -0.92718505859375, -0.8822021484375, -0.83721923828125, -0.792236328125, -0.74725341796875, -0.7022705078125, -0.65728759765625, -0.6123046875, -0.56732177734375, -0.5223388671875, -0.47735595703125, -0.432373046875, -0.38739013671875, -0.3424072265625, -0.29742431640625, -0.25244140625, -0.20745849609375, -0.1624755859375, -0.11749267578125, -0.072509765625, -0.02752685546875, 0.0174560546875, 0.06243896484375, 0.107421875, 0.15240478515625, 0.1973876953125, 0.24237060546875, 0.287353515625, 0.33233642578125, 0.3773193359375, 0.42230224609375, 0.46728515625, 0.51226806640625, 0.5572509765625, 0.60223388671875, 0.647216796875, 0.69219970703125, 0.7371826171875, 0.78216552734375, 0.8271484375, 0.87213134765625, 0.9171142578125, 0.96209716796875, 1.007080078125, 1.05206298828125, 1.0970458984375, 1.14202880859375, 1.18701171875, 1.23199462890625, 1.2769775390625, 1.32196044921875, 1.366943359375, 1.41192626953125, 1.4569091796875, 1.50189208984375, 1.546875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 2.0, 7.0, 10.0, 14.0, 12.0, 17.0, 15.0, 29.0, 30.0, 47.0, 75.0, 117.0, 209.0, 514.0, 1385.0, 4384.0, 16195.0, 75600.0, 517653.0, 2254480.0, 1125309.0, 157741.0, 29269.0, 7370.0, 2261.0, 783.0, 311.0, 137.0, 91.0, 56.0, 32.0, 21.0, 17.0, 19.0, 15.0, 16.0, 14.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.060546875, -2.95391845703125, -2.8472900390625, -2.74066162109375, -2.634033203125, -2.52740478515625, -2.4207763671875, -2.31414794921875, -2.20751953125, -2.10089111328125, -1.9942626953125, -1.88763427734375, -1.781005859375, -1.67437744140625, -1.5677490234375, -1.46112060546875, -1.3544921875, -1.24786376953125, -1.1412353515625, -1.03460693359375, -0.927978515625, -0.82135009765625, -0.7147216796875, -0.60809326171875, -0.50146484375, -0.39483642578125, -0.2882080078125, -0.18157958984375, -0.074951171875, 0.03167724609375, 0.1383056640625, 0.24493408203125, 0.3515625, 0.45819091796875, 0.5648193359375, 0.67144775390625, 0.778076171875, 0.88470458984375, 0.9913330078125, 1.09796142578125, 1.20458984375, 1.31121826171875, 1.4178466796875, 1.52447509765625, 1.631103515625, 1.73773193359375, 1.8443603515625, 1.95098876953125, 2.0576171875, 2.16424560546875, 2.2708740234375, 2.37750244140625, 2.484130859375, 2.59075927734375, 2.6973876953125, 2.80401611328125, 2.91064453125, 3.01727294921875, 3.1239013671875, 3.23052978515625, 3.337158203125, 3.44378662109375, 3.5504150390625, 3.65704345703125, 3.763671875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 14.0, 15.0, 26.0, 35.0, 37.0, 53.0, 79.0, 99.0, 118.0, 154.0, 233.0, 263.0, 359.0, 431.0, 412.0, 353.0, 340.0, 244.0, 189.0, 137.0, 107.0, 82.0, 53.0, 61.0, 35.0, 27.0, 32.0, 25.0, 10.0, 7.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.43157958984375, -3.3143310546875, -3.19708251953125, -3.079833984375, -2.96258544921875, -2.8453369140625, -2.72808837890625, -2.61083984375, -2.49359130859375, -2.3763427734375, -2.25909423828125, -2.141845703125, -2.02459716796875, -1.9073486328125, -1.79010009765625, -1.6728515625, -1.55560302734375, -1.4383544921875, -1.32110595703125, -1.203857421875, -1.08660888671875, -0.9693603515625, -0.85211181640625, -0.73486328125, -0.61761474609375, -0.5003662109375, -0.38311767578125, -0.265869140625, -0.14862060546875, -0.0313720703125, 0.08587646484375, 0.203125, 0.32037353515625, 0.4376220703125, 0.55487060546875, 0.672119140625, 0.78936767578125, 0.9066162109375, 1.02386474609375, 1.14111328125, 1.25836181640625, 1.3756103515625, 1.49285888671875, 1.610107421875, 1.72735595703125, 1.8446044921875, 1.96185302734375, 2.0791015625, 2.19635009765625, 2.3135986328125, 2.43084716796875, 2.548095703125, 2.66534423828125, 2.7825927734375, 2.89984130859375, 3.01708984375, 3.13433837890625, 3.2515869140625, 3.36883544921875, 3.486083984375, 3.60333251953125, 3.7205810546875, 3.83782958984375, 3.955078125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 11.0, 31.0, 33.0, 72.0, 168.0, 389.0, 1566.0, 16975.0, 768467.0, 3313250.0, 88018.0, 4119.0, 726.0, 237.0, 111.0, 44.0, 27.0, 13.0, 11.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-18.515625, -18.11517333984375, -17.7147216796875, -17.31427001953125, -16.913818359375, -16.51336669921875, -16.1129150390625, -15.71246337890625, -15.31201171875, -14.91156005859375, -14.5111083984375, -14.11065673828125, -13.710205078125, -13.30975341796875, -12.9093017578125, -12.50885009765625, -12.1083984375, -11.70794677734375, -11.3074951171875, -10.90704345703125, -10.506591796875, -10.10614013671875, -9.7056884765625, -9.30523681640625, -8.90478515625, -8.50433349609375, -8.1038818359375, -7.70343017578125, -7.302978515625, -6.90252685546875, -6.5020751953125, -6.10162353515625, -5.701171875, -5.30072021484375, -4.9002685546875, -4.49981689453125, -4.099365234375, -3.69891357421875, -3.2984619140625, -2.89801025390625, -2.49755859375, -2.09710693359375, -1.6966552734375, -1.29620361328125, -0.895751953125, -0.49530029296875, -0.0948486328125, 0.30560302734375, 0.7060546875, 1.10650634765625, 1.5069580078125, 1.90740966796875, 2.307861328125, 2.70831298828125, 3.1087646484375, 3.50921630859375, 3.90966796875, 4.31011962890625, 4.7105712890625, 5.11102294921875, 5.511474609375, 5.91192626953125, 6.3123779296875, 6.71282958984375, 7.11328125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 20.0, 38.0, 61.0, 93.0, 159.0, 182.0, 176.0, 122.0, 77.0, 49.0, 19.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.47494888305664, -39.52104949951172, -38.56714630126953, -37.61324691772461, -36.65934371948242, -35.7054443359375, -34.75154113769531, -33.79764175415039, -32.84374237060547, -31.889841079711914, -30.93593978881836, -29.982040405273438, -29.028139114379883, -28.074237823486328, -27.120336532592773, -26.16643524169922, -25.212533950805664, -24.25863265991211, -23.304731369018555, -22.350830078125, -21.396930694580078, -20.443029403686523, -19.48912811279297, -18.535226821899414, -17.58132553100586, -16.627424240112305, -15.673523902893066, -14.719622611999512, -13.765722274780273, -12.811820983886719, -11.857919692993164, -10.90401840209961, -9.950117111206055, -8.9962158203125, -8.042315483093262, -7.088414192199707, -6.1345133781433105, -5.180612564086914, -4.226711273193359, -3.272810459136963, -2.3189096450805664, -1.3650087118148804, -0.41110777854919434, 0.5427932739257812, 1.4966940879821777, 2.450594902038574, 3.404496192932129, 4.358397006988525, 5.312297821044922, 6.266198635101318, 7.220099449157715, 8.17400074005127, 9.127901077270508, 10.081802368164062, 11.035703659057617, 11.989604949951172, 12.94350528717041, 13.897406578063965, 14.851306915283203, 15.805208206176758, 16.759109497070312, 17.713008880615234, 18.666912078857422, 19.620811462402344, 20.5747127532959]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 5.0, 8.0, 5.0, 5.0, 14.0, 13.0, 13.0, 12.0, 25.0, 21.0, 18.0, 20.0, 21.0, 31.0, 25.0, 30.0, 31.0, 35.0, 45.0, 29.0, 37.0, 41.0, 43.0, 43.0, 39.0, 32.0, 31.0, 35.0, 27.0, 27.0, 27.0, 32.0, 32.0, 23.0, 21.0, 18.0, 19.0, 16.0, 7.0, 9.0, 8.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-12.98921012878418, -12.58332633972168, -12.177443504333496, -11.771559715270996, -11.365676879882812, -10.959793090820312, -10.553909301757812, -10.148026466369629, -9.742143630981445, -9.336259841918945, -8.930377006530762, -8.524493217468262, -8.118610382080078, -7.712726593017578, -7.306843280792236, -6.9009599685668945, -6.4950761795043945, -6.089192867279053, -5.683309555053711, -5.277425765991211, -4.871542930603027, -4.465659141540527, -4.0597758293151855, -3.6538925170898438, -3.248009204864502, -2.84212589263916, -2.4362425804138184, -2.0303590297698975, -1.6244757175445557, -1.2185924053192139, -0.812708854675293, -0.40682554244995117, -0.000942230224609375, 0.4049411416053772, 0.8108245134353638, 1.2167079448699951, 1.622591257095337, 2.0284745693206787, 2.4343581199645996, 2.8402414321899414, 3.246124744415283, 3.652008056640625, 4.057891368865967, 4.463774681091309, 4.869658470153809, 5.275541305541992, 5.681425094604492, 6.087308406829834, 6.493191719055176, 6.899075031280518, 7.304958343505859, 7.710842132568359, 8.116724967956543, 8.522608757019043, 8.928491592407227, 9.334375381469727, 9.740259170532227, 10.146142959594727, 10.55202579498291, 10.95790958404541, 11.363792419433594, 11.769676208496094, 12.175559997558594, 12.581442832946777, 12.987325668334961]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 10.0, 2.0, 4.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 19.0, 23.0, 14.0, 32.0, 29.0, 40.0, 39.0, 25.0, 49.0, 41.0, 51.0, 36.0, 38.0, 36.0, 37.0, 36.0, 44.0, 33.0, 37.0, 33.0, 42.0, 22.0, 23.0, 17.0, 18.0, 11.0, 12.0, 10.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4853363037109375, -1.438446044921875, -1.3915557861328125, -1.34466552734375, -1.2977752685546875, -1.250885009765625, -1.2039947509765625, -1.1571044921875, -1.1102142333984375, -1.063323974609375, -1.0164337158203125, -0.96954345703125, -0.9226531982421875, -0.875762939453125, -0.8288726806640625, -0.781982421875, -0.7350921630859375, -0.688201904296875, -0.6413116455078125, -0.59442138671875, -0.5475311279296875, -0.500640869140625, -0.4537506103515625, -0.4068603515625, -0.3599700927734375, -0.313079833984375, -0.2661895751953125, -0.21929931640625, -0.1724090576171875, -0.125518798828125, -0.0786285400390625, -0.03173828125, 0.0151519775390625, 0.062042236328125, 0.1089324951171875, 0.15582275390625, 0.2027130126953125, 0.249603271484375, 0.2964935302734375, 0.3433837890625, 0.3902740478515625, 0.437164306640625, 0.4840545654296875, 0.53094482421875, 0.5778350830078125, 0.624725341796875, 0.6716156005859375, 0.718505859375, 0.7653961181640625, 0.812286376953125, 0.8591766357421875, 0.90606689453125, 0.9529571533203125, 0.999847412109375, 1.0467376708984375, 1.0936279296875, 1.1405181884765625, 1.187408447265625, 1.2342987060546875, 1.28118896484375, 1.3280792236328125, 1.374969482421875, 1.4218597412109375, 1.46875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 8.0, 9.0, 12.0, 16.0, 14.0, 19.0, 25.0, 47.0, 72.0, 100.0, 134.0, 248.0, 275.0, 431.0, 527.0, 849.0, 1217.0, 1769.0, 2623.0, 3923.0, 5699.0, 8573.0, 13125.0, 20907.0, 33252.0, 55572.0, 96692.0, 173062.0, 234694.0, 161654.0, 91091.0, 52600.0, 31396.0, 19741.0, 12683.0, 8287.0, 5569.0, 3606.0, 2439.0, 1754.0, 1159.0, 809.0, 556.0, 366.0, 266.0, 220.0, 146.0, 95.0, 71.0, 42.0, 42.0, 18.0, 19.0, 13.0, 10.0, 11.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.1795654296875, -0.17385482788085938, -0.16814422607421875, -0.16243362426757812, -0.1567230224609375, -0.15101242065429688, -0.14530181884765625, -0.13959121704101562, -0.133880615234375, -0.12817001342773438, -0.12245941162109375, -0.11674880981445312, -0.1110382080078125, -0.10532760620117188, -0.09961700439453125, -0.09390640258789062, -0.08819580078125, -0.08248519897460938, -0.07677459716796875, -0.07106399536132812, -0.0653533935546875, -0.059642791748046875, -0.05393218994140625, -0.048221588134765625, -0.042510986328125, -0.036800384521484375, -0.03108978271484375, -0.025379180908203125, -0.0196685791015625, -0.013957977294921875, -0.00824737548828125, -0.002536773681640625, 0.003173828125, 0.008884429931640625, 0.01459503173828125, 0.020305633544921875, 0.0260162353515625, 0.031726837158203125, 0.03743743896484375, 0.043148040771484375, 0.048858642578125, 0.054569244384765625, 0.06027984619140625, 0.06599044799804688, 0.0717010498046875, 0.07741165161132812, 0.08312225341796875, 0.08883285522460938, 0.09454345703125, 0.10025405883789062, 0.10596466064453125, 0.11167526245117188, 0.1173858642578125, 0.12309646606445312, 0.12880706787109375, 0.13451766967773438, 0.140228271484375, 0.14593887329101562, 0.15164947509765625, 0.15736007690429688, 0.1630706787109375, 0.16878128051757812, 0.17449188232421875, 0.18020248413085938, 0.1859130859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 3.0, 6.0, 6.0, 12.0, 10.0, 13.0, 15.0, 15.0, 16.0, 28.0, 18.0, 31.0, 33.0, 37.0, 38.0, 33.0, 39.0, 36.0, 33.0, 48.0, 1057.0, 42.0, 34.0, 35.0, 32.0, 29.0, 35.0, 31.0, 21.0, 23.0, 28.0, 32.0, 19.0, 21.0, 19.0, 15.0, 9.0, 12.0, 6.0, 7.0, 8.0, 9.0, 8.0, 3.0, 1.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.8679733276367188, -0.8399505615234375, -0.8119277954101562, -0.783905029296875, -0.7558822631835938, -0.7278594970703125, -0.6998367309570312, -0.67181396484375, -0.6437911987304688, -0.6157684326171875, -0.5877456665039062, -0.559722900390625, -0.5317001342773438, -0.5036773681640625, -0.47565460205078125, -0.4476318359375, -0.41960906982421875, -0.3915863037109375, -0.36356353759765625, -0.335540771484375, -0.30751800537109375, -0.2794952392578125, -0.25147247314453125, -0.22344970703125, -0.19542694091796875, -0.1674041748046875, -0.13938140869140625, -0.111358642578125, -0.08333587646484375, -0.0553131103515625, -0.02729034423828125, 0.000732421875, 0.02875518798828125, 0.0567779541015625, 0.08480072021484375, 0.112823486328125, 0.14084625244140625, 0.1688690185546875, 0.19689178466796875, 0.22491455078125, 0.25293731689453125, 0.2809600830078125, 0.30898284912109375, 0.337005615234375, 0.36502838134765625, 0.3930511474609375, 0.42107391357421875, 0.4490966796875, 0.47711944580078125, 0.5051422119140625, 0.5331649780273438, 0.561187744140625, 0.5892105102539062, 0.6172332763671875, 0.6452560424804688, 0.67327880859375, 0.7013015747070312, 0.7293243408203125, 0.7573471069335938, 0.785369873046875, 0.8133926391601562, 0.8414154052734375, 0.8694381713867188, 0.8974609375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 13.0, 13.0, 28.0, 35.0, 42.0, 63.0, 115.0, 146.0, 223.0, 331.0, 456.0, 746.0, 1070.0, 1657.0, 2500.0, 3789.0, 5844.0, 9139.0, 14025.0, 22658.0, 36649.0, 61013.0, 103994.0, 176672.0, 1269919.0, 155068.0, 90264.0, 53379.0, 32201.0, 19736.0, 12219.0, 7871.0, 5125.0, 3354.0, 2220.0, 1408.0, 994.0, 679.0, 475.0, 355.0, 225.0, 132.0, 92.0, 58.0, 52.0, 43.0, 20.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.145751953125, -0.1412487030029297, -0.13674545288085938, -0.13224220275878906, -0.12773895263671875, -0.12323570251464844, -0.11873245239257812, -0.11422920227050781, -0.1097259521484375, -0.10522270202636719, -0.10071945190429688, -0.09621620178222656, -0.09171295166015625, -0.08720970153808594, -0.08270645141601562, -0.07820320129394531, -0.073699951171875, -0.06919670104980469, -0.06469345092773438, -0.06019020080566406, -0.05568695068359375, -0.05118370056152344, -0.046680450439453125, -0.04217720031738281, -0.0376739501953125, -0.03317070007324219, -0.028667449951171875, -0.024164199829101562, -0.01966094970703125, -0.015157699584960938, -0.010654449462890625, -0.0061511993408203125, -0.00164794921875, 0.0028553009033203125, 0.007358551025390625, 0.011861801147460938, 0.01636505126953125, 0.020868301391601562, 0.025371551513671875, 0.029874801635742188, 0.0343780517578125, 0.03888130187988281, 0.043384552001953125, 0.04788780212402344, 0.05239105224609375, 0.05689430236816406, 0.061397552490234375, 0.06590080261230469, 0.070404052734375, 0.07490730285644531, 0.07941055297851562, 0.08391380310058594, 0.08841705322265625, 0.09292030334472656, 0.09742355346679688, 0.10192680358886719, 0.1064300537109375, 0.11093330383300781, 0.11543655395507812, 0.11993980407714844, 0.12444305419921875, 0.12894630432128906, 0.13344955444335938, 0.1379528045654297, 0.1424560546875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 4.0, 8.0, 4.0, 7.0, 6.0, 12.0, 14.0, 9.0, 12.0, 24.0, 20.0, 33.0, 38.0, 40.0, 56.0, 49.0, 63.0, 61.0, 59.0, 50.0, 62.0, 46.0, 35.0, 55.0, 32.0, 27.0, 24.0, 19.0, 18.0, 16.0, 16.0, 13.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005083084106445312, -0.0004926994442939758, -0.0004770904779434204, -0.000461481511592865, -0.00044587254524230957, -0.00043026357889175415, -0.00041465461254119873, -0.0003990456461906433, -0.0003834366798400879, -0.00036782771348953247, -0.00035221874713897705, -0.00033660978078842163, -0.0003210008144378662, -0.0003053918480873108, -0.00028978288173675537, -0.00027417391538619995, -0.00025856494903564453, -0.0002429559826850891, -0.0002273470163345337, -0.00021173804998397827, -0.00019612908363342285, -0.00018052011728286743, -0.000164911150932312, -0.0001493021845817566, -0.00013369321823120117, -0.00011808425188064575, -0.00010247528553009033, -8.686631917953491e-05, -7.125735282897949e-05, -5.564838647842407e-05, -4.003942012786865e-05, -2.4430453777313232e-05, -8.821487426757812e-06, 6.787478923797607e-06, 2.2396445274353027e-05, 3.800541162490845e-05, 5.361437797546387e-05, 6.922334432601929e-05, 8.483231067657471e-05, 0.00010044127702713013, 0.00011605024337768555, 0.00013165920972824097, 0.0001472681760787964, 0.0001628771424293518, 0.00017848610877990723, 0.00019409507513046265, 0.00020970404148101807, 0.00022531300783157349, 0.0002409219741821289, 0.0002565309405326843, 0.00027213990688323975, 0.00028774887323379517, 0.0003033578395843506, 0.000318966805934906, 0.0003345757722854614, 0.00035018473863601685, 0.00036579370498657227, 0.0003814026713371277, 0.0003970116376876831, 0.0004126206040382385, 0.00042822957038879395, 0.00044383853673934937, 0.0004594475030899048, 0.0004750564694404602, 0.0004906654357910156]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 4.0, 5.0, 4.0, 10.0, 20.0, 17.0, 37.0, 36.0, 45.0, 83.0, 143.0, 219.0, 470.0, 1595.0, 882784.0, 161042.0, 1024.0, 388.0, 217.0, 131.0, 73.0, 44.0, 37.0, 19.0, 15.0, 14.0, 11.0, 11.0, 4.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01273345947265625, -0.01229238510131836, -0.011851310729980469, -0.011410236358642578, -0.010969161987304688, -0.010528087615966797, -0.010087013244628906, -0.009645938873291016, -0.009204864501953125, -0.008763790130615234, -0.008322715759277344, -0.007881641387939453, -0.0074405670166015625, -0.006999492645263672, -0.006558418273925781, -0.006117343902587891, -0.00567626953125, -0.005235195159912109, -0.004794120788574219, -0.004353046417236328, -0.0039119720458984375, -0.003470897674560547, -0.0030298233032226562, -0.0025887489318847656, -0.002147674560546875, -0.0017066001892089844, -0.0012655258178710938, -0.0008244514465332031, -0.0003833770751953125, 5.7697296142578125e-05, 0.0004987716674804688, 0.0009398460388183594, 0.00138092041015625, 0.0018219947814941406, 0.0022630691528320312, 0.002704143524169922, 0.0031452178955078125, 0.003586292266845703, 0.004027366638183594, 0.004468441009521484, 0.004909515380859375, 0.005350589752197266, 0.005791664123535156, 0.006232738494873047, 0.0066738128662109375, 0.007114887237548828, 0.007555961608886719, 0.00799703598022461, 0.0084381103515625, 0.00887918472290039, 0.009320259094238281, 0.009761333465576172, 0.010202407836914062, 0.010643482208251953, 0.011084556579589844, 0.011525630950927734, 0.011966705322265625, 0.012407779693603516, 0.012848854064941406, 0.013289928436279297, 0.013731002807617188, 0.014172077178955078, 0.014613151550292969, 0.01505422592163086, 0.01549530029296875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 20.0, 404.0, 551.0, 41.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037929017562419176, -0.003706950694322586, -0.003620999399572611, -0.0035350483376532793, -0.003449097042903304, -0.0033631459809839725, -0.0032771946862339973, -0.003191243624314666, -0.0031052925623953342, -0.0030193415004760027, -0.0029333902057260275, -0.002847439143806696, -0.0027614878490567207, -0.002675536787137389, -0.0025895857252180576, -0.0025036344304680824, -0.0024176831357181072, -0.0023317320737987757, -0.0022457807790488005, -0.002159829717129469, -0.0020738784223794937, -0.001987927360460162, -0.0019019761821255088, -0.0018160250037908554, -0.001730073825456202, -0.0016441226471215487, -0.0015581714687868953, -0.001472220290452242, -0.0013862692285329103, -0.0013003179337829351, -0.0012143668718636036, -0.0011284156935289502, -0.0010424646316096187, -0.0009565134532749653, -0.0008705622749403119, -0.0007846111548133194, -0.0006986599764786661, -0.0006127087981440127, -0.0005267576780170202, -0.00044080649968236685, -0.00035485532134771347, -0.0002689041430130601, -0.00018295299378223717, -9.700184455141425e-05, -1.1050666216760874e-05, 7.49005121178925e-05, 0.00016085163224488497, 0.00024680281057953835, 0.0003327539889141917, 0.0004187051672488451, 0.0005046563455834985, 0.0005906074657104909, 0.0006765586440451443, 0.0007625098223797977, 0.0008484609425067902, 0.0009344121208414435, 0.001020363299176097, 0.0011063144775107503, 0.0011922656558454037, 0.0012782167177647352, 0.0013641680125147104, 0.001450119074434042, 0.0015360702527686954, 0.0016220214311033487, 0.0017079726094380021]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 4.0, 4.0, 8.0, 8.0, 14.0, 5.0, 14.0, 14.0, 16.0, 18.0, 22.0, 32.0, 34.0, 30.0, 23.0, 32.0, 41.0, 32.0, 46.0, 48.0, 49.0, 33.0, 47.0, 41.0, 42.0, 38.0, 42.0, 32.0, 30.0, 31.0, 25.0, 18.0, 19.0, 15.0, 21.0, 10.0, 13.0, 15.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00027120113372802734, -0.0002622026950120926, -0.00025320425629615784, -0.0002442058175802231, -0.00023520737886428833, -0.00022620894014835358, -0.00021721050143241882, -0.00020821206271648407, -0.00019921362400054932, -0.00019021518528461456, -0.0001812167465686798, -0.00017221830785274506, -0.0001632198691368103, -0.00015422143042087555, -0.0001452229917049408, -0.00013622455298900604, -0.0001272261142730713, -0.00011822767555713654, -0.00010922923684120178, -0.00010023079812526703, -9.123235940933228e-05, -8.223392069339752e-05, -7.323548197746277e-05, -6.423704326152802e-05, -5.523860454559326e-05, -4.624016582965851e-05, -3.7241727113723755e-05, -2.8243288397789e-05, -1.9244849681854248e-05, -1.0246410965919495e-05, -1.2479722499847412e-06, 7.750466465950012e-06, 1.6748905181884766e-05, 2.574734389781952e-05, 3.474578261375427e-05, 4.3744221329689026e-05, 5.274266004562378e-05, 6.174109876155853e-05, 7.073953747749329e-05, 7.973797619342804e-05, 8.873641490936279e-05, 9.773485362529755e-05, 0.0001067332923412323, 0.00011573173105716705, 0.0001247301697731018, 0.00013372860848903656, 0.0001427270472049713, 0.00015172548592090607, 0.00016072392463684082, 0.00016972236335277557, 0.00017872080206871033, 0.00018771924078464508, 0.00019671767950057983, 0.0002057161182165146, 0.00021471455693244934, 0.0002237129956483841, 0.00023271143436431885, 0.0002417098730802536, 0.00025070831179618835, 0.0002597067505121231, 0.00026870518922805786, 0.0002777036279439926, 0.00028670206665992737, 0.0002957005053758621, 0.0003046989440917969]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 10.0, 2.0, 4.0, 12.0, 12.0, 14.0, 12.0, 19.0, 19.0, 19.0, 23.0, 14.0, 32.0, 29.0, 40.0, 39.0, 25.0, 49.0, 41.0, 51.0, 36.0, 38.0, 36.0, 37.0, 36.0, 45.0, 32.0, 37.0, 33.0, 41.0, 23.0, 23.0, 17.0, 17.0, 12.0, 12.0, 10.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5322265625, -1.4853363037109375, -1.438446044921875, -1.3915557861328125, -1.34466552734375, -1.2977752685546875, -1.250885009765625, -1.2039947509765625, -1.1571044921875, -1.1102142333984375, -1.063323974609375, -1.0164337158203125, -0.96954345703125, -0.9226531982421875, -0.875762939453125, -0.8288726806640625, -0.781982421875, -0.7350921630859375, -0.688201904296875, -0.6413116455078125, -0.59442138671875, -0.5475311279296875, -0.500640869140625, -0.4537506103515625, -0.4068603515625, -0.3599700927734375, -0.313079833984375, -0.2661895751953125, -0.21929931640625, -0.1724090576171875, -0.125518798828125, -0.0786285400390625, -0.03173828125, 0.0151519775390625, 0.062042236328125, 0.1089324951171875, 0.15582275390625, 0.2027130126953125, 0.249603271484375, 0.2964935302734375, 0.3433837890625, 0.3902740478515625, 0.437164306640625, 0.4840545654296875, 0.53094482421875, 0.5778350830078125, 0.624725341796875, 0.6716156005859375, 0.718505859375, 0.7653961181640625, 0.812286376953125, 0.8591766357421875, 0.90606689453125, 0.9529571533203125, 0.999847412109375, 1.0467376708984375, 1.0936279296875, 1.1405181884765625, 1.187408447265625, 1.2342987060546875, 1.28118896484375, 1.3280792236328125, 1.374969482421875, 1.4218597412109375, 1.46875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 7.0, 12.0, 11.0, 13.0, 14.0, 27.0, 36.0, 47.0, 52.0, 109.0, 165.0, 270.0, 390.0, 669.0, 1139.0, 1973.0, 3481.0, 6453.0, 12397.0, 25961.0, 55279.0, 117059.0, 212650.0, 256665.0, 178235.0, 91419.0, 42281.0, 19866.0, 9766.0, 5146.0, 2797.0, 1581.0, 989.0, 574.0, 340.0, 217.0, 158.0, 108.0, 52.0, 46.0, 31.0, 24.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.119140625, -1.0809783935546875, -1.042816162109375, -1.0046539306640625, -0.96649169921875, -0.9283294677734375, -0.890167236328125, -0.8520050048828125, -0.8138427734375, -0.7756805419921875, -0.737518310546875, -0.6993560791015625, -0.66119384765625, -0.6230316162109375, -0.584869384765625, -0.5467071533203125, -0.508544921875, -0.4703826904296875, -0.432220458984375, -0.3940582275390625, -0.35589599609375, -0.3177337646484375, -0.279571533203125, -0.2414093017578125, -0.2032470703125, -0.1650848388671875, -0.126922607421875, -0.0887603759765625, -0.05059814453125, -0.0124359130859375, 0.025726318359375, 0.0638885498046875, 0.10205078125, 0.1402130126953125, 0.178375244140625, 0.2165374755859375, 0.25469970703125, 0.2928619384765625, 0.331024169921875, 0.3691864013671875, 0.4073486328125, 0.4455108642578125, 0.483673095703125, 0.5218353271484375, 0.55999755859375, 0.5981597900390625, 0.636322021484375, 0.6744842529296875, 0.712646484375, 0.7508087158203125, 0.788970947265625, 0.8271331787109375, 0.86529541015625, 0.9034576416015625, 0.941619873046875, 0.9797821044921875, 1.0179443359375, 1.0561065673828125, 1.094268798828125, 1.1324310302734375, 1.17059326171875, 1.2087554931640625, 1.246917724609375, 1.2850799560546875, 1.3232421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 6.0, 9.0, 8.0, 8.0, 14.0, 16.0, 19.0, 26.0, 16.0, 27.0, 30.0, 38.0, 28.0, 39.0, 38.0, 71.0, 84.0, 213.0, 1431.0, 313.0, 146.0, 70.0, 66.0, 40.0, 38.0, 26.0, 28.0, 29.0, 28.0, 21.0, 17.0, 23.0, 11.0, 15.0, 16.0, 7.0, 9.0, 8.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.58984375, -5.41943359375, -5.2490234375, -5.07861328125, -4.908203125, -4.73779296875, -4.5673828125, -4.39697265625, -4.2265625, -4.05615234375, -3.8857421875, -3.71533203125, -3.544921875, -3.37451171875, -3.2041015625, -3.03369140625, -2.86328125, -2.69287109375, -2.5224609375, -2.35205078125, -2.181640625, -2.01123046875, -1.8408203125, -1.67041015625, -1.5, -1.32958984375, -1.1591796875, -0.98876953125, -0.818359375, -0.64794921875, -0.4775390625, -0.30712890625, -0.13671875, 0.03369140625, 0.2041015625, 0.37451171875, 0.544921875, 0.71533203125, 0.8857421875, 1.05615234375, 1.2265625, 1.39697265625, 1.5673828125, 1.73779296875, 1.908203125, 2.07861328125, 2.2490234375, 2.41943359375, 2.58984375, 2.76025390625, 2.9306640625, 3.10107421875, 3.271484375, 3.44189453125, 3.6123046875, 3.78271484375, 3.953125, 4.12353515625, 4.2939453125, 4.46435546875, 4.634765625, 4.80517578125, 4.9755859375, 5.14599609375, 5.31640625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 13.0, 8.0, 9.0, 21.0, 12.0, 25.0, 43.0, 32.0, 54.0, 48.0, 82.0, 76.0, 132.0, 213.0, 434.0, 1239.0, 7341.0, 228587.0, 2832601.0, 68871.0, 3798.0, 944.0, 337.0, 219.0, 139.0, 89.0, 61.0, 49.0, 51.0, 30.0, 32.0, 26.0, 13.0, 15.0, 18.0, 4.0, 8.0, 4.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-9.09375, -8.8211669921875, -8.548583984375, -8.2760009765625, -8.00341796875, -7.7308349609375, -7.458251953125, -7.1856689453125, -6.9130859375, -6.6405029296875, -6.367919921875, -6.0953369140625, -5.82275390625, -5.5501708984375, -5.277587890625, -5.0050048828125, -4.732421875, -4.4598388671875, -4.187255859375, -3.9146728515625, -3.64208984375, -3.3695068359375, -3.096923828125, -2.8243408203125, -2.5517578125, -2.2791748046875, -2.006591796875, -1.7340087890625, -1.46142578125, -1.1888427734375, -0.916259765625, -0.6436767578125, -0.37109375, -0.0985107421875, 0.174072265625, 0.4466552734375, 0.71923828125, 0.9918212890625, 1.264404296875, 1.5369873046875, 1.8095703125, 2.0821533203125, 2.354736328125, 2.6273193359375, 2.89990234375, 3.1724853515625, 3.445068359375, 3.7176513671875, 3.990234375, 4.2628173828125, 4.535400390625, 4.8079833984375, 5.08056640625, 5.3531494140625, 5.625732421875, 5.8983154296875, 6.1708984375, 6.4434814453125, 6.716064453125, 6.9886474609375, 7.26123046875, 7.5338134765625, 7.806396484375, 8.0789794921875, 8.3515625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 131.0, 771.0, 113.0, 2.0], "bins": [-140.50949096679688, -138.22354125976562, -135.93759155273438, -133.65164184570312, -131.36569213867188, -129.07974243164062, -126.7938003540039, -124.50785064697266, -122.2219009399414, -119.93595123291016, -117.6500015258789, -115.36405944824219, -113.07810974121094, -110.79216003417969, -108.50621032714844, -106.22026062011719, -103.93431091308594, -101.64836120605469, -99.36241149902344, -97.07646179199219, -94.79051971435547, -92.50457000732422, -90.21862030029297, -87.93267059326172, -85.646728515625, -83.36077880859375, -81.0748291015625, -78.78887939453125, -76.50293731689453, -74.21698760986328, -71.93103790283203, -69.64508819580078, -67.35913848876953, -65.07318878173828, -62.7872428894043, -60.50129318237305, -58.2153434753418, -55.92939758300781, -53.64344787597656, -51.35749816894531, -49.07155227661133, -46.78560256958008, -44.499656677246094, -42.213706970214844, -39.927757263183594, -37.641807556152344, -35.35586166381836, -33.06991195678711, -30.783966064453125, -28.498018264770508, -26.212068557739258, -23.92612075805664, -21.64017105102539, -19.354223251342773, -17.068275451660156, -14.782325744628906, -12.496376991271973, -10.210428237915039, -7.924479961395264, -5.638531684875488, -3.3525829315185547, -1.066634178161621, 1.219313621520996, 3.505263328552246, 5.791211128234863]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 3.0, 9.0, 11.0, 19.0, 18.0, 14.0, 24.0, 19.0, 26.0, 28.0, 42.0, 24.0, 49.0, 38.0, 35.0, 47.0, 37.0, 42.0, 39.0, 53.0, 53.0, 39.0, 42.0, 26.0, 30.0, 32.0, 26.0, 31.0, 23.0, 25.0, 9.0, 13.0, 13.0, 6.0, 6.0, 7.0, 6.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.028182983398438, -17.48043441772461, -16.932687759399414, -16.384939193725586, -15.837190628051758, -15.289443016052246, -14.741695404052734, -14.193946838378906, -13.646199226379395, -13.098451614379883, -12.550703048706055, -12.002955436706543, -11.455207824707031, -10.907459259033203, -10.359711647033691, -9.81196403503418, -9.264215469360352, -8.71646785736084, -8.168719291687012, -7.6209716796875, -7.07322359085083, -6.52547550201416, -5.977727890014648, -5.4299798011779785, -4.882231712341309, -4.334483623504639, -3.786735773086548, -3.238987922668457, -2.691239833831787, -2.143491744995117, -1.5957438945770264, -1.0479960441589355, -0.5002479553222656, 0.047500014305114746, 0.5952479839324951, 1.1429959535598755, 1.6907439231872559, 2.238492012023926, 2.7862398624420166, 3.3339877128601074, 3.8817358016967773, 4.429483890533447, 4.977231979370117, 5.524979591369629, 6.072727680206299, 6.620475769042969, 7.1682233810424805, 7.71597146987915, 8.26371955871582, 8.811467170715332, 9.35921573638916, 9.906963348388672, 10.4547119140625, 11.002459526062012, 11.550207138061523, 12.097955703735352, 12.645703315734863, 13.193450927734375, 13.741199493408203, 14.288947105407715, 14.836694717407227, 15.384443283081055, 15.932190895080566, 16.479938507080078, 17.027687072753906]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 11.0, 8.0, 12.0, 25.0, 14.0, 24.0, 19.0, 29.0, 22.0, 33.0, 43.0, 28.0, 41.0, 37.0, 48.0, 43.0, 38.0, 30.0, 40.0, 45.0, 37.0, 42.0, 43.0, 36.0, 29.0, 26.0, 28.0, 27.0, 16.0, 15.0, 10.0, 17.0, 16.0, 6.0, 11.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.578948974609375, -1.52899169921875, -1.479034423828125, -1.4290771484375, -1.379119873046875, -1.32916259765625, -1.279205322265625, -1.229248046875, -1.179290771484375, -1.12933349609375, -1.079376220703125, -1.0294189453125, -0.979461669921875, -0.92950439453125, -0.879547119140625, -0.82958984375, -0.779632568359375, -0.72967529296875, -0.679718017578125, -0.6297607421875, -0.579803466796875, -0.52984619140625, -0.479888916015625, -0.429931640625, -0.379974365234375, -0.33001708984375, -0.280059814453125, -0.2301025390625, -0.180145263671875, -0.13018798828125, -0.080230712890625, -0.0302734375, 0.019683837890625, 0.06964111328125, 0.119598388671875, 0.1695556640625, 0.219512939453125, 0.26947021484375, 0.319427490234375, 0.369384765625, 0.419342041015625, 0.46929931640625, 0.519256591796875, 0.5692138671875, 0.619171142578125, 0.66912841796875, 0.719085693359375, 0.76904296875, 0.819000244140625, 0.86895751953125, 0.918914794921875, 0.9688720703125, 1.018829345703125, 1.06878662109375, 1.118743896484375, 1.168701171875, 1.218658447265625, 1.26861572265625, 1.318572998046875, 1.3685302734375, 1.418487548828125, 1.46844482421875, 1.518402099609375, 1.568359375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 6.0, 10.0, 5.0, 8.0, 10.0, 13.0, 11.0, 17.0, 20.0, 28.0, 28.0, 33.0, 55.0, 80.0, 121.0, 235.0, 510.0, 1434.0, 5189.0, 24824.0, 166595.0, 1343461.0, 2189094.0, 398327.0, 50829.0, 9285.0, 2422.0, 770.0, 315.0, 159.0, 102.0, 66.0, 40.0, 45.0, 27.0, 17.0, 24.0, 13.0, 14.0, 12.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.00390625, -3.88330078125, -3.7626953125, -3.64208984375, -3.521484375, -3.40087890625, -3.2802734375, -3.15966796875, -3.0390625, -2.91845703125, -2.7978515625, -2.67724609375, -2.556640625, -2.43603515625, -2.3154296875, -2.19482421875, -2.07421875, -1.95361328125, -1.8330078125, -1.71240234375, -1.591796875, -1.47119140625, -1.3505859375, -1.22998046875, -1.109375, -0.98876953125, -0.8681640625, -0.74755859375, -0.626953125, -0.50634765625, -0.3857421875, -0.26513671875, -0.14453125, -0.02392578125, 0.0966796875, 0.21728515625, 0.337890625, 0.45849609375, 0.5791015625, 0.69970703125, 0.8203125, 0.94091796875, 1.0615234375, 1.18212890625, 1.302734375, 1.42333984375, 1.5439453125, 1.66455078125, 1.78515625, 1.90576171875, 2.0263671875, 2.14697265625, 2.267578125, 2.38818359375, 2.5087890625, 2.62939453125, 2.75, 2.87060546875, 2.9912109375, 3.11181640625, 3.232421875, 3.35302734375, 3.4736328125, 3.59423828125, 3.71484375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 11.0, 20.0, 28.0, 27.0, 36.0, 69.0, 66.0, 109.0, 135.0, 196.0, 228.0, 302.0, 366.0, 416.0, 416.0, 344.0, 310.0, 249.0, 177.0, 138.0, 109.0, 65.0, 54.0, 49.0, 38.0, 13.0, 17.0, 15.0, 9.0, 8.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.509063720703125, -3.38336181640625, -3.257659912109375, -3.1319580078125, -3.006256103515625, -2.88055419921875, -2.754852294921875, -2.629150390625, -2.503448486328125, -2.37774658203125, -2.252044677734375, -2.1263427734375, -2.000640869140625, -1.87493896484375, -1.749237060546875, -1.62353515625, -1.497833251953125, -1.37213134765625, -1.246429443359375, -1.1207275390625, -0.995025634765625, -0.86932373046875, -0.743621826171875, -0.617919921875, -0.492218017578125, -0.36651611328125, -0.240814208984375, -0.1151123046875, 0.010589599609375, 0.13629150390625, 0.261993408203125, 0.3876953125, 0.513397216796875, 0.63909912109375, 0.764801025390625, 0.8905029296875, 1.016204833984375, 1.14190673828125, 1.267608642578125, 1.393310546875, 1.519012451171875, 1.64471435546875, 1.770416259765625, 1.8961181640625, 2.021820068359375, 2.14752197265625, 2.273223876953125, 2.39892578125, 2.524627685546875, 2.65032958984375, 2.776031494140625, 2.9017333984375, 3.027435302734375, 3.15313720703125, 3.278839111328125, 3.404541015625, 3.530242919921875, 3.65594482421875, 3.781646728515625, 3.9073486328125, 4.033050537109375, 4.15875244140625, 4.284454345703125, 4.41015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 9.0, 5.0, 17.0, 28.0, 27.0, 46.0, 58.0, 71.0, 125.0, 170.0, 323.0, 569.0, 1468.0, 4415.0, 19605.0, 141518.0, 1328928.0, 2344974.0, 304018.0, 37199.0, 6875.0, 1955.0, 831.0, 382.0, 208.0, 131.0, 81.0, 60.0, 49.0, 38.0, 24.0, 21.0, 10.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.20703125, -5.9942626953125, -5.781494140625, -5.5687255859375, -5.35595703125, -5.1431884765625, -4.930419921875, -4.7176513671875, -4.5048828125, -4.2921142578125, -4.079345703125, -3.8665771484375, -3.65380859375, -3.4410400390625, -3.228271484375, -3.0155029296875, -2.802734375, -2.5899658203125, -2.377197265625, -2.1644287109375, -1.95166015625, -1.7388916015625, -1.526123046875, -1.3133544921875, -1.1005859375, -0.8878173828125, -0.675048828125, -0.4622802734375, -0.24951171875, -0.0367431640625, 0.176025390625, 0.3887939453125, 0.6015625, 0.8143310546875, 1.027099609375, 1.2398681640625, 1.45263671875, 1.6654052734375, 1.878173828125, 2.0909423828125, 2.3037109375, 2.5164794921875, 2.729248046875, 2.9420166015625, 3.15478515625, 3.3675537109375, 3.580322265625, 3.7930908203125, 4.005859375, 4.2186279296875, 4.431396484375, 4.6441650390625, 4.85693359375, 5.0697021484375, 5.282470703125, 5.4952392578125, 5.7080078125, 5.9207763671875, 6.133544921875, 6.3463134765625, 6.55908203125, 6.7718505859375, 6.984619140625, 7.1973876953125, 7.41015625]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 9.0, 14.0, 25.0, 44.0, 58.0, 81.0, 111.0, 122.0, 117.0, 119.0, 113.0, 70.0, 51.0, 34.0, 18.0, 14.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.385751724243164, -11.62949275970459, -10.873233795166016, -10.116975784301758, -9.360716819763184, -8.60445785522461, -7.848199367523193, -7.091940879821777, -6.335681915283203, -5.579422950744629, -4.823164463043213, -4.066905975341797, -3.3106470108032227, -2.5543882846832275, -1.7981295585632324, -1.0418710708618164, -0.2856121063232422, 0.47064661979675293, 1.226905345916748, 1.9831640720367432, 2.7394227981567383, 3.4956815242767334, 4.2519402503967285, 5.0081987380981445, 5.764457702636719, 6.520716667175293, 7.276975154876709, 8.033233642578125, 8.7894926071167, 9.545751571655273, 10.302009582519531, 11.058268547058105, 11.814529418945312, 12.570788383483887, 13.327047348022461, 14.083305358886719, 14.839564323425293, 15.595823287963867, 16.352081298828125, 17.108341217041016, 17.864599227905273, 18.62085723876953, 19.377117156982422, 20.13337516784668, 20.889633178710938, 21.645893096923828, 22.402151107788086, 23.158409118652344, 23.914669036865234, 24.670927047729492, 25.427186965942383, 26.18344497680664, 26.93970489501953, 27.69596290588379, 28.452220916748047, 29.208480834960938, 29.964738845825195, 30.720996856689453, 31.477256774902344, 32.233516693115234, 32.98977279663086, 33.74603271484375, 34.50229263305664, 35.258548736572266, 36.014808654785156]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 10.0, 5.0, 11.0, 10.0, 16.0, 12.0, 21.0, 26.0, 29.0, 35.0, 31.0, 27.0, 22.0, 33.0, 38.0, 50.0, 33.0, 48.0, 35.0, 35.0, 33.0, 43.0, 38.0, 32.0, 31.0, 36.0, 31.0, 23.0, 24.0, 24.0, 22.0, 17.0, 18.0, 9.0, 8.0, 9.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.570337295532227, -11.171588897705078, -10.77284049987793, -10.374092102050781, -9.975343704223633, -9.576595306396484, -9.177846908569336, -8.779098510742188, -8.380350112915039, -7.981601715087891, -7.582853317260742, -7.184104919433594, -6.785356521606445, -6.386608123779297, -5.98785924911499, -5.589110851287842, -5.190361976623535, -4.791613578796387, -4.392865180969238, -3.9941165447235107, -3.5953681468963623, -3.196619749069214, -2.7978711128234863, -2.399122714996338, -2.0003743171691895, -1.601625919342041, -1.202877402305603, -0.804128885269165, -0.4053804874420166, -0.006632089614868164, 0.3921165466308594, 0.7908649444580078, 1.1896123886108398, 1.5883607864379883, 1.9871093034744263, 2.3858578205108643, 2.7846062183380127, 3.183354616165161, 3.5821032524108887, 3.980851650238037, 4.3796000480651855, 4.778348445892334, 5.177096843719482, 5.575845718383789, 5.9745941162109375, 6.373342514038086, 6.772090911865234, 7.170839309692383, 7.569587707519531, 7.96833610534668, 8.367084503173828, 8.765832901000977, 9.164581298828125, 9.563329696655273, 9.962078094482422, 10.36082649230957, 10.759574890136719, 11.158323287963867, 11.557071685791016, 11.955820083618164, 12.354568481445312, 12.753316879272461, 13.15206527709961, 13.550813674926758, 13.949563026428223]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 10.0, 18.0, 10.0, 17.0, 19.0, 23.0, 23.0, 30.0, 27.0, 28.0, 38.0, 24.0, 28.0, 47.0, 39.0, 33.0, 33.0, 54.0, 39.0, 46.0, 36.0, 30.0, 40.0, 23.0, 22.0, 31.0, 29.0, 15.0, 20.0, 10.0, 12.0, 17.0, 14.0, 8.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-1.46875, -1.4231719970703125, -1.377593994140625, -1.3320159912109375, -1.28643798828125, -1.2408599853515625, -1.195281982421875, -1.1497039794921875, -1.1041259765625, -1.0585479736328125, -1.012969970703125, -0.9673919677734375, -0.92181396484375, -0.8762359619140625, -0.830657958984375, -0.7850799560546875, -0.739501953125, -0.6939239501953125, -0.648345947265625, -0.6027679443359375, -0.55718994140625, -0.5116119384765625, -0.466033935546875, -0.4204559326171875, -0.3748779296875, -0.3292999267578125, -0.283721923828125, -0.2381439208984375, -0.19256591796875, -0.1469879150390625, -0.101409912109375, -0.0558319091796875, -0.01025390625, 0.0353240966796875, 0.080902099609375, 0.1264801025390625, 0.17205810546875, 0.2176361083984375, 0.263214111328125, 0.3087921142578125, 0.3543701171875, 0.3999481201171875, 0.445526123046875, 0.4911041259765625, 0.53668212890625, 0.5822601318359375, 0.627838134765625, 0.6734161376953125, 0.718994140625, 0.7645721435546875, 0.810150146484375, 0.8557281494140625, 0.90130615234375, 0.9468841552734375, 0.992462158203125, 1.0380401611328125, 1.0836181640625, 1.1291961669921875, 1.174774169921875, 1.2203521728515625, 1.26593017578125, 1.3115081787109375, 1.357086181640625, 1.4026641845703125, 1.4482421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 15.0, 13.0, 40.0, 52.0, 84.0, 112.0, 169.0, 294.0, 408.0, 644.0, 1030.0, 1669.0, 2544.0, 4185.0, 6656.0, 10647.0, 17680.0, 30003.0, 53821.0, 100919.0, 194447.0, 263882.0, 163053.0, 84374.0, 45708.0, 25894.0, 15296.0, 9373.0, 5677.0, 3625.0, 2248.0, 1389.0, 895.0, 597.0, 406.0, 252.0, 148.0, 89.0, 87.0, 46.0, 24.0, 22.0, 7.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-0.243896484375, -0.2365856170654297, -0.22927474975585938, -0.22196388244628906, -0.21465301513671875, -0.20734214782714844, -0.20003128051757812, -0.1927204132080078, -0.1854095458984375, -0.1780986785888672, -0.17078781127929688, -0.16347694396972656, -0.15616607666015625, -0.14885520935058594, -0.14154434204101562, -0.1342334747314453, -0.126922607421875, -0.11961174011230469, -0.11230087280273438, -0.10499000549316406, -0.09767913818359375, -0.09036827087402344, -0.08305740356445312, -0.07574653625488281, -0.0684356689453125, -0.06112480163574219, -0.053813934326171875, -0.04650306701660156, -0.03919219970703125, -0.03188133239746094, -0.024570465087890625, -0.017259597778320312, -0.00994873046875, -0.0026378631591796875, 0.004673004150390625, 0.011983871459960938, 0.01929473876953125, 0.026605606079101562, 0.033916473388671875, 0.04122734069824219, 0.0485382080078125, 0.05584907531738281, 0.06315994262695312, 0.07047080993652344, 0.07778167724609375, 0.08509254455566406, 0.09240341186523438, 0.09971427917480469, 0.107025146484375, 0.11433601379394531, 0.12164688110351562, 0.12895774841308594, 0.13626861572265625, 0.14357948303222656, 0.15089035034179688, 0.1582012176513672, 0.1655120849609375, 0.1728229522705078, 0.18013381958007812, 0.18744468688964844, 0.19475555419921875, 0.20206642150878906, 0.20937728881835938, 0.2166881561279297, 0.2239990234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 1.0, 6.0, 10.0, 6.0, 10.0, 18.0, 26.0, 24.0, 18.0, 23.0, 30.0, 24.0, 29.0, 41.0, 33.0, 36.0, 33.0, 41.0, 1082.0, 45.0, 50.0, 47.0, 48.0, 46.0, 26.0, 31.0, 28.0, 26.0, 36.0, 21.0, 24.0, 17.0, 14.0, 13.0, 15.0, 7.0, 5.0, 4.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1409225463867188, -1.1070404052734375, -1.0731582641601562, -1.039276123046875, -1.0053939819335938, -0.9715118408203125, -0.9376296997070312, -0.90374755859375, -0.8698654174804688, -0.8359832763671875, -0.8021011352539062, -0.768218994140625, -0.7343368530273438, -0.7004547119140625, -0.6665725708007812, -0.6326904296875, -0.5988082885742188, -0.5649261474609375, -0.5310440063476562, -0.497161865234375, -0.46327972412109375, -0.4293975830078125, -0.39551544189453125, -0.36163330078125, -0.32775115966796875, -0.2938690185546875, -0.25998687744140625, -0.226104736328125, -0.19222259521484375, -0.1583404541015625, -0.12445831298828125, -0.090576171875, -0.05669403076171875, -0.0228118896484375, 0.01107025146484375, 0.044952392578125, 0.07883453369140625, 0.1127166748046875, 0.14659881591796875, 0.18048095703125, 0.21436309814453125, 0.2482452392578125, 0.28212738037109375, 0.316009521484375, 0.34989166259765625, 0.3837738037109375, 0.41765594482421875, 0.4515380859375, 0.48542022705078125, 0.5193023681640625, 0.5531845092773438, 0.587066650390625, 0.6209487915039062, 0.6548309326171875, 0.6887130737304688, 0.72259521484375, 0.7564773559570312, 0.7903594970703125, 0.8242416381835938, 0.858123779296875, 0.8920059204101562, 0.9258880615234375, 0.9597702026367188, 0.99365234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 9.0, 11.0, 22.0, 19.0, 28.0, 40.0, 66.0, 94.0, 119.0, 183.0, 255.0, 362.0, 568.0, 856.0, 1182.0, 1754.0, 2603.0, 3985.0, 5901.0, 9147.0, 14641.0, 22826.0, 37450.0, 63234.0, 108955.0, 190209.0, 1275113.0, 144850.0, 82674.0, 48316.0, 29522.0, 18422.0, 11648.0, 7446.0, 4751.0, 3243.0, 2124.0, 1443.0, 952.0, 618.0, 460.0, 302.0, 235.0, 158.0, 106.0, 79.0, 37.0, 40.0, 29.0, 21.0, 12.0, 9.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.1719970703125, -0.1669750213623047, -0.16195297241210938, -0.15693092346191406, -0.15190887451171875, -0.14688682556152344, -0.14186477661132812, -0.1368427276611328, -0.1318206787109375, -0.1267986297607422, -0.12177658081054688, -0.11675453186035156, -0.11173248291015625, -0.10671043395996094, -0.10168838500976562, -0.09666633605957031, -0.091644287109375, -0.08662223815917969, -0.08160018920898438, -0.07657814025878906, -0.07155609130859375, -0.06653404235839844, -0.061511993408203125, -0.05648994445800781, -0.0514678955078125, -0.04644584655761719, -0.041423797607421875, -0.03640174865722656, -0.03137969970703125, -0.026357650756835938, -0.021335601806640625, -0.016313552856445312, -0.01129150390625, -0.0062694549560546875, -0.001247406005859375, 0.0037746429443359375, 0.00879669189453125, 0.013818740844726562, 0.018840789794921875, 0.023862838745117188, 0.0288848876953125, 0.03390693664550781, 0.038928985595703125, 0.04395103454589844, 0.04897308349609375, 0.05399513244628906, 0.059017181396484375, 0.06403923034667969, 0.069061279296875, 0.07408332824707031, 0.07910537719726562, 0.08412742614746094, 0.08914947509765625, 0.09417152404785156, 0.09919357299804688, 0.10421562194824219, 0.1092376708984375, 0.11425971984863281, 0.11928176879882812, 0.12430381774902344, 0.12932586669921875, 0.13434791564941406, 0.13936996459960938, 0.1443920135498047, 0.1494140625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 5.0, 7.0, 13.0, 7.0, 14.0, 24.0, 26.0, 38.0, 38.0, 52.0, 67.0, 85.0, 72.0, 86.0, 90.0, 64.0, 58.0, 59.0, 41.0, 28.0, 20.0, 24.0, 17.0, 11.0, 6.0, 8.0, 6.0, 9.0, 5.0, 4.0, 6.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007219314575195312, -0.0006989911198616028, -0.0006760507822036743, -0.0006531104445457458, -0.0006301701068878174, -0.0006072297692298889, -0.0005842894315719604, -0.000561349093914032, -0.0005384087562561035, -0.000515468418598175, -0.0004925280809402466, -0.0004695877432823181, -0.00044664740562438965, -0.0004237070679664612, -0.0004007667303085327, -0.00037782639265060425, -0.0003548860549926758, -0.0003319457173347473, -0.00030900537967681885, -0.0002860650420188904, -0.0002631247043609619, -0.00024018436670303345, -0.00021724402904510498, -0.00019430369138717651, -0.00017136335372924805, -0.00014842301607131958, -0.0001254826784133911, -0.00010254234075546265, -7.960200309753418e-05, -5.666166543960571e-05, -3.3721327781677246e-05, -1.078099012374878e-05, 1.2159347534179688e-05, 3.5099685192108154e-05, 5.804002285003662e-05, 8.098036050796509e-05, 0.00010392069816589355, 0.00012686103582382202, 0.0001498013734817505, 0.00017274171113967896, 0.00019568204879760742, 0.0002186223864555359, 0.00024156272411346436, 0.0002645030617713928, 0.0002874433994293213, 0.00031038373708724976, 0.0003333240747451782, 0.0003562644124031067, 0.00037920475006103516, 0.0004021450877189636, 0.0004250854253768921, 0.00044802576303482056, 0.000470966100692749, 0.0004939064383506775, 0.000516846776008606, 0.0005397871136665344, 0.0005627274513244629, 0.0005856677889823914, 0.0006086081266403198, 0.0006315484642982483, 0.0006544888019561768, 0.0006774291396141052, 0.0007003694772720337, 0.0007233098149299622, 0.0007462501525878906]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 5.0, 10.0, 11.0, 6.0, 19.0, 21.0, 25.0, 52.0, 74.0, 142.0, 270.0, 622.0, 4829.0, 1028240.0, 12827.0, 654.0, 316.0, 147.0, 89.0, 61.0, 26.0, 18.0, 18.0, 9.0, 8.0, 7.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0178985595703125, -0.017365455627441406, -0.016832351684570312, -0.01629924774169922, -0.015766143798828125, -0.015233039855957031, -0.014699935913085938, -0.014166831970214844, -0.01363372802734375, -0.013100624084472656, -0.012567520141601562, -0.012034416198730469, -0.011501312255859375, -0.010968208312988281, -0.010435104370117188, -0.009902000427246094, -0.009368896484375, -0.008835792541503906, -0.008302688598632812, -0.007769584655761719, -0.007236480712890625, -0.006703376770019531, -0.0061702728271484375, -0.005637168884277344, -0.00510406494140625, -0.004570960998535156, -0.0040378570556640625, -0.0035047531127929688, -0.002971649169921875, -0.0024385452270507812, -0.0019054412841796875, -0.0013723373413085938, -0.0008392333984375, -0.00030612945556640625, 0.0002269744873046875, 0.0007600784301757812, 0.001293182373046875, 0.0018262863159179688, 0.0023593902587890625, 0.0028924942016601562, 0.00342559814453125, 0.003958702087402344, 0.0044918060302734375, 0.005024909973144531, 0.005558013916015625, 0.006091117858886719, 0.0066242218017578125, 0.007157325744628906, 0.0076904296875, 0.008223533630371094, 0.008756637573242188, 0.009289741516113281, 0.009822845458984375, 0.010355949401855469, 0.010889053344726562, 0.011422157287597656, 0.01195526123046875, 0.012488365173339844, 0.013021469116210938, 0.013554573059082031, 0.014087677001953125, 0.014620780944824219, 0.015153884887695312, 0.015686988830566406, 0.0162200927734375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 71.0, 334.0, 454.0, 137.0, 13.0, 4.0], "bins": [-0.0037722978740930557, -0.003709677839651704, -0.003647057805210352, -0.003584437770769, -0.003521817736327648, -0.0034591974690556526, -0.0033965776674449444, -0.003333957400172949, -0.003271337365731597, -0.003208717331290245, -0.003146097296848893, -0.0030834772624075413, -0.0030208572279661894, -0.0029582371935248375, -0.002895616926252842, -0.00283299689181149, -0.002770376857370138, -0.0027077568229287863, -0.0026451367884874344, -0.0025825167540460825, -0.0025198967196047306, -0.002457276452332735, -0.002394656650722027, -0.0023320363834500313, -0.002269416581839323, -0.002206796547397971, -0.0021441765129566193, -0.0020815564785152674, -0.0020189364440739155, -0.00195631617680192, -0.0018936962587758899, -0.001831076224334538, -0.001768456306308508, -0.001705836271867156, -0.0016432162374258041, -0.0015805962029844522, -0.0015179760521277785, -0.0014553560176864266, -0.0013927359832450747, -0.0013301159488037229, -0.0012674957979470491, -0.0012048757635056973, -0.0011422557290643454, -0.0010796356946229935, -0.0010170155437663198, -0.0009543955093249679, -0.000891775474883616, -0.0008291554404422641, -0.0007665353477932513, -0.0007039153133518994, -0.0006412952207028866, -0.0005786751862615347, -0.0005160551518201828, -0.00045343505917117, -0.0003908150247298181, -0.00032819496118463576, -0.0002655748976394534, -0.00020295483409427106, -0.00014033478510100394, -7.771473610773683e-05, -1.5094672562554479e-05, 4.752539098262787e-05, 0.00011014542542397976, 0.0001727654889691621, 0.00023538555251434445]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 7.0, 10.0, 12.0, 13.0, 11.0, 27.0, 32.0, 29.0, 36.0, 39.0, 51.0, 37.0, 37.0, 51.0, 52.0, 47.0, 55.0, 54.0, 45.0, 47.0, 42.0, 37.0, 37.0, 45.0, 23.0, 23.0, 12.0, 18.0, 18.0, 14.0, 11.0, 5.0, 8.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003330707550048828, -0.0003205714747309685, -0.00030807219445705414, -0.0002955729141831398, -0.00028307363390922546, -0.0002705743536353111, -0.0002580750733613968, -0.00024557579308748245, -0.00023307651281356812, -0.00022057723253965378, -0.00020807795226573944, -0.0001955786719918251, -0.00018307939171791077, -0.00017058011144399643, -0.0001580808311700821, -0.00014558155089616776, -0.00013308227062225342, -0.00012058299034833908, -0.00010808371007442474, -9.55844298005104e-05, -8.308514952659607e-05, -7.058586925268173e-05, -5.8086588978767395e-05, -4.558730870485306e-05, -3.308802843093872e-05, -2.0588748157024384e-05, -8.089467883110046e-06, 4.409812390804291e-06, 1.6909092664718628e-05, 2.9408372938632965e-05, 4.19076532125473e-05, 5.440693348646164e-05, 6.690621376037598e-05, 7.940549403429031e-05, 9.190477430820465e-05, 0.00010440405458211899, 0.00011690333485603333, 0.00012940261512994766, 0.000141901895403862, 0.00015440117567777634, 0.00016690045595169067, 0.000179399736225605, 0.00019189901649951935, 0.00020439829677343369, 0.00021689757704734802, 0.00022939685732126236, 0.0002418961375951767, 0.00025439541786909103, 0.00026689469814300537, 0.0002793939784169197, 0.00029189325869083405, 0.0003043925389647484, 0.0003168918192386627, 0.00032939109951257706, 0.0003418903797864914, 0.00035438966006040573, 0.00036688894033432007, 0.0003793882206082344, 0.00039188750088214874, 0.0004043867811560631, 0.0004168860614299774, 0.00042938534170389175, 0.0004418846219778061, 0.00045438390225172043, 0.00046688318252563477]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 6.0, 6.0, 12.0, 10.0, 10.0, 18.0, 10.0, 17.0, 19.0, 23.0, 23.0, 30.0, 27.0, 28.0, 38.0, 24.0, 28.0, 47.0, 39.0, 33.0, 33.0, 54.0, 39.0, 46.0, 36.0, 30.0, 40.0, 23.0, 22.0, 31.0, 29.0, 15.0, 20.0, 10.0, 12.0, 17.0, 14.0, 8.0, 14.0, 10.0, 5.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0], "bins": [-1.46875, -1.4231719970703125, -1.377593994140625, -1.3320159912109375, -1.28643798828125, -1.2408599853515625, -1.195281982421875, -1.1497039794921875, -1.1041259765625, -1.0585479736328125, -1.012969970703125, -0.9673919677734375, -0.92181396484375, -0.8762359619140625, -0.830657958984375, -0.7850799560546875, -0.739501953125, -0.6939239501953125, -0.648345947265625, -0.6027679443359375, -0.55718994140625, -0.5116119384765625, -0.466033935546875, -0.4204559326171875, -0.3748779296875, -0.3292999267578125, -0.283721923828125, -0.2381439208984375, -0.19256591796875, -0.1469879150390625, -0.101409912109375, -0.0558319091796875, -0.01025390625, 0.0353240966796875, 0.080902099609375, 0.1264801025390625, 0.17205810546875, 0.2176361083984375, 0.263214111328125, 0.3087921142578125, 0.3543701171875, 0.3999481201171875, 0.445526123046875, 0.4911041259765625, 0.53668212890625, 0.5822601318359375, 0.627838134765625, 0.6734161376953125, 0.718994140625, 0.7645721435546875, 0.810150146484375, 0.8557281494140625, 0.90130615234375, 0.9468841552734375, 0.992462158203125, 1.0380401611328125, 1.0836181640625, 1.1291961669921875, 1.174774169921875, 1.2203521728515625, 1.26593017578125, 1.3115081787109375, 1.357086181640625, 1.4026641845703125, 1.4482421875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 3.0, 7.0, 16.0, 13.0, 18.0, 26.0, 35.0, 47.0, 71.0, 92.0, 134.0, 184.0, 270.0, 389.0, 636.0, 1155.0, 1787.0, 3395.0, 6426.0, 13177.0, 31195.0, 86137.0, 293858.0, 407911.0, 124686.0, 42007.0, 16991.0, 7915.0, 4132.0, 2237.0, 1310.0, 780.0, 511.0, 300.0, 214.0, 128.0, 113.0, 63.0, 47.0, 41.0, 26.0, 18.0, 16.0, 13.0, 7.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.34765625, -2.272308349609375, -2.19696044921875, -2.121612548828125, -2.0462646484375, -1.970916748046875, -1.89556884765625, -1.820220947265625, -1.744873046875, -1.669525146484375, -1.59417724609375, -1.518829345703125, -1.4434814453125, -1.368133544921875, -1.29278564453125, -1.217437744140625, -1.14208984375, -1.066741943359375, -0.99139404296875, -0.916046142578125, -0.8406982421875, -0.765350341796875, -0.69000244140625, -0.614654541015625, -0.539306640625, -0.463958740234375, -0.38861083984375, -0.313262939453125, -0.2379150390625, -0.162567138671875, -0.08721923828125, -0.011871337890625, 0.0634765625, 0.138824462890625, 0.21417236328125, 0.289520263671875, 0.3648681640625, 0.440216064453125, 0.51556396484375, 0.590911865234375, 0.666259765625, 0.741607666015625, 0.81695556640625, 0.892303466796875, 0.9676513671875, 1.042999267578125, 1.11834716796875, 1.193695068359375, 1.26904296875, 1.344390869140625, 1.41973876953125, 1.495086669921875, 1.5704345703125, 1.645782470703125, 1.72113037109375, 1.796478271484375, 1.871826171875, 1.947174072265625, 2.02252197265625, 2.097869873046875, 2.1732177734375, 2.248565673828125, 2.32391357421875, 2.399261474609375, 2.474609375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 8.0, 8.0, 7.0, 10.0, 7.0, 8.0, 10.0, 13.0, 11.0, 18.0, 17.0, 18.0, 22.0, 31.0, 41.0, 26.0, 35.0, 59.0, 62.0, 73.0, 119.0, 207.0, 1390.0, 245.0, 113.0, 81.0, 57.0, 51.0, 45.0, 32.0, 30.0, 27.0, 24.0, 17.0, 22.0, 12.0, 25.0, 16.0, 11.0, 7.0, 15.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.46484375, -5.2918701171875, -5.118896484375, -4.9459228515625, -4.77294921875, -4.5999755859375, -4.427001953125, -4.2540283203125, -4.0810546875, -3.9080810546875, -3.735107421875, -3.5621337890625, -3.38916015625, -3.2161865234375, -3.043212890625, -2.8702392578125, -2.697265625, -2.5242919921875, -2.351318359375, -2.1783447265625, -2.00537109375, -1.8323974609375, -1.659423828125, -1.4864501953125, -1.3134765625, -1.1405029296875, -0.967529296875, -0.7945556640625, -0.62158203125, -0.4486083984375, -0.275634765625, -0.1026611328125, 0.0703125, 0.2432861328125, 0.416259765625, 0.5892333984375, 0.76220703125, 0.9351806640625, 1.108154296875, 1.2811279296875, 1.4541015625, 1.6270751953125, 1.800048828125, 1.9730224609375, 2.14599609375, 2.3189697265625, 2.491943359375, 2.6649169921875, 2.837890625, 3.0108642578125, 3.183837890625, 3.3568115234375, 3.52978515625, 3.7027587890625, 3.875732421875, 4.0487060546875, 4.2216796875, 4.3946533203125, 4.567626953125, 4.7406005859375, 4.91357421875, 5.0865478515625, 5.259521484375, 5.4324951171875, 5.60546875]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 16.0, 16.0, 18.0, 43.0, 50.0, 80.0, 134.0, 269.0, 749.0, 7972.0, 3087682.0, 46628.0, 1194.0, 377.0, 172.0, 105.0, 69.0, 43.0, 25.0, 25.0, 10.0, 11.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.925048828125, -25.13134765625, -24.337646484375, -23.5439453125, -22.750244140625, -21.95654296875, -21.162841796875, -20.369140625, -19.575439453125, -18.78173828125, -17.988037109375, -17.1943359375, -16.400634765625, -15.60693359375, -14.813232421875, -14.01953125, -13.225830078125, -12.43212890625, -11.638427734375, -10.8447265625, -10.051025390625, -9.25732421875, -8.463623046875, -7.669921875, -6.876220703125, -6.08251953125, -5.288818359375, -4.4951171875, -3.701416015625, -2.90771484375, -2.114013671875, -1.3203125, -0.526611328125, 0.26708984375, 1.060791015625, 1.8544921875, 2.648193359375, 3.44189453125, 4.235595703125, 5.029296875, 5.822998046875, 6.61669921875, 7.410400390625, 8.2041015625, 8.997802734375, 9.79150390625, 10.585205078125, 11.37890625, 12.172607421875, 12.96630859375, 13.760009765625, 14.5537109375, 15.347412109375, 16.14111328125, 16.934814453125, 17.728515625, 18.522216796875, 19.31591796875, 20.109619140625, 20.9033203125, 21.697021484375, 22.49072265625, 23.284423828125, 24.078125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 115.0, 692.0, 206.0, 0.0, 4.0], "bins": [-142.136962890625, -139.78981018066406, -137.4426727294922, -135.09552001953125, -132.7483673095703, -130.40122985839844, -128.0540771484375, -125.7069320678711, -123.35978698730469, -121.01264190673828, -118.66548919677734, -116.31834411621094, -113.97119903564453, -111.62405395507812, -109.27690124511719, -106.92975616455078, -104.58260345458984, -102.23545837402344, -99.8883056640625, -97.5411605834961, -95.19401550292969, -92.84686279296875, -90.49971771240234, -88.15257263183594, -85.805419921875, -83.4582748413086, -81.11112213134766, -78.76397705078125, -76.41683197021484, -74.06968688964844, -71.7225341796875, -69.3753890991211, -67.02824401855469, -64.68109893798828, -62.33395004272461, -59.98680114746094, -57.63965606689453, -55.29250717163086, -52.94535827636719, -50.59821319580078, -48.251060485839844, -45.90391159057617, -43.556766510009766, -41.209617614746094, -38.86247253417969, -36.515323638916016, -34.168174743652344, -31.821027755737305, -29.473880767822266, -27.126733779907227, -24.779586791992188, -22.432437896728516, -20.085290908813477, -17.738143920898438, -15.390995979309082, -13.043848037719727, -10.696701049804688, -8.349554061889648, -6.002406120300293, -3.6552586555480957, -1.3081111907958984, 1.0390357971191406, 3.386183738708496, 5.733331680297852, 8.08047866821289]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 6.0, 7.0, 8.0, 10.0, 6.0, 6.0, 9.0, 6.0, 18.0, 18.0, 20.0, 23.0, 22.0, 20.0, 30.0, 21.0, 32.0, 28.0, 22.0, 32.0, 26.0, 36.0, 36.0, 35.0, 24.0, 29.0, 50.0, 38.0, 48.0, 41.0, 27.0, 25.0, 32.0, 21.0, 25.0, 27.0, 20.0, 24.0, 15.0, 12.0, 10.0, 11.0, 11.0, 0.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.860115051269531, -13.372802734375, -12.885491371154785, -12.39818000793457, -11.910867691040039, -11.423555374145508, -10.936244010925293, -10.448932647705078, -9.961620330810547, -9.474308013916016, -8.9869966506958, -8.499685287475586, -8.012372970581055, -7.525061130523682, -7.037749290466309, -6.5504374504089355, -6.0631256103515625, -5.5758137702941895, -5.088501930236816, -4.601190090179443, -4.11387825012207, -3.6265664100646973, -3.139254570007324, -2.651942729949951, -2.164630889892578, -1.677319049835205, -1.190007209777832, -0.702695369720459, -0.21538352966308594, 0.2719283103942871, 0.7592401504516602, 1.2465519905090332, 1.7338638305664062, 2.2211756706237793, 2.7084875106811523, 3.1957993507385254, 3.6831111907958984, 4.1704230308532715, 4.6577348709106445, 5.145046710968018, 5.632358551025391, 6.119670391082764, 6.606982231140137, 7.09429407119751, 7.581605911254883, 8.068918228149414, 8.556229591369629, 9.043540954589844, 9.530853271484375, 10.018165588378906, 10.505476951599121, 10.992788314819336, 11.480100631713867, 11.967412948608398, 12.454724311828613, 12.942035675048828, 13.42934799194336, 13.91666030883789, 14.403971672058105, 14.89128303527832, 15.378595352172852, 15.865907669067383, 16.35321807861328, 16.840530395507812, 17.327842712402344]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 6.0, 2.0, 4.0, 4.0, 10.0, 4.0, 10.0, 10.0, 12.0, 13.0, 6.0, 15.0, 19.0, 26.0, 23.0, 22.0, 25.0, 29.0, 23.0, 33.0, 44.0, 33.0, 33.0, 47.0, 39.0, 42.0, 45.0, 43.0, 39.0, 31.0, 39.0, 25.0, 26.0, 34.0, 24.0, 21.0, 20.0, 19.0, 16.0, 16.0, 13.0, 14.0, 9.0, 8.0, 7.0, 10.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.6572265625, -1.6068878173828125, -1.556549072265625, -1.5062103271484375, -1.45587158203125, -1.4055328369140625, -1.355194091796875, -1.3048553466796875, -1.2545166015625, -1.2041778564453125, -1.153839111328125, -1.1035003662109375, -1.05316162109375, -1.0028228759765625, -0.952484130859375, -0.9021453857421875, -0.851806640625, -0.8014678955078125, -0.751129150390625, -0.7007904052734375, -0.65045166015625, -0.6001129150390625, -0.549774169921875, -0.4994354248046875, -0.4490966796875, -0.3987579345703125, -0.348419189453125, -0.2980804443359375, -0.24774169921875, -0.1974029541015625, -0.147064208984375, -0.0967254638671875, -0.04638671875, 0.0039520263671875, 0.054290771484375, 0.1046295166015625, 0.15496826171875, 0.2053070068359375, 0.255645751953125, 0.3059844970703125, 0.3563232421875, 0.4066619873046875, 0.457000732421875, 0.5073394775390625, 0.55767822265625, 0.6080169677734375, 0.658355712890625, 0.7086944580078125, 0.759033203125, 0.8093719482421875, 0.859710693359375, 0.9100494384765625, 0.96038818359375, 1.0107269287109375, 1.061065673828125, 1.1114044189453125, 1.1617431640625, 1.2120819091796875, 1.262420654296875, 1.3127593994140625, 1.36309814453125, 1.4134368896484375, 1.463775634765625, 1.5141143798828125, 1.564453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 12.0, 11.0, 14.0, 15.0, 27.0, 18.0, 28.0, 51.0, 69.0, 100.0, 130.0, 206.0, 367.0, 647.0, 1141.0, 2390.0, 5170.0, 12430.0, 32695.0, 92402.0, 285713.0, 786094.0, 1355849.0, 997766.0, 409716.0, 135200.0, 45424.0, 16840.0, 7032.0, 3128.0, 1549.0, 794.0, 401.0, 273.0, 186.0, 99.0, 76.0, 47.0, 35.0, 34.0, 30.0, 13.0, 20.0, 6.0, 2.0, 4.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.115234375, -2.05047607421875, -1.9857177734375, -1.92095947265625, -1.856201171875, -1.79144287109375, -1.7266845703125, -1.66192626953125, -1.59716796875, -1.53240966796875, -1.4676513671875, -1.40289306640625, -1.338134765625, -1.27337646484375, -1.2086181640625, -1.14385986328125, -1.0791015625, -1.01434326171875, -0.9495849609375, -0.88482666015625, -0.820068359375, -0.75531005859375, -0.6905517578125, -0.62579345703125, -0.56103515625, -0.49627685546875, -0.4315185546875, -0.36676025390625, -0.302001953125, -0.23724365234375, -0.1724853515625, -0.10772705078125, -0.04296875, 0.02178955078125, 0.0865478515625, 0.15130615234375, 0.216064453125, 0.28082275390625, 0.3455810546875, 0.41033935546875, 0.47509765625, 0.53985595703125, 0.6046142578125, 0.66937255859375, 0.734130859375, 0.79888916015625, 0.8636474609375, 0.92840576171875, 0.9931640625, 1.05792236328125, 1.1226806640625, 1.18743896484375, 1.252197265625, 1.31695556640625, 1.3817138671875, 1.44647216796875, 1.51123046875, 1.57598876953125, 1.6407470703125, 1.70550537109375, 1.770263671875, 1.83502197265625, 1.8997802734375, 1.96453857421875, 2.029296875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 9.0, 6.0, 7.0, 3.0, 12.0, 9.0, 19.0, 14.0, 27.0, 33.0, 42.0, 67.0, 90.0, 114.0, 136.0, 164.0, 219.0, 254.0, 352.0, 321.0, 370.0, 349.0, 270.0, 255.0, 221.0, 165.0, 117.0, 107.0, 81.0, 52.0, 44.0, 37.0, 31.0, 20.0, 13.0, 14.0, 8.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.841827392578125, -3.72662353515625, -3.611419677734375, -3.4962158203125, -3.381011962890625, -3.26580810546875, -3.150604248046875, -3.035400390625, -2.920196533203125, -2.80499267578125, -2.689788818359375, -2.5745849609375, -2.459381103515625, -2.34417724609375, -2.228973388671875, -2.11376953125, -1.998565673828125, -1.88336181640625, -1.768157958984375, -1.6529541015625, -1.537750244140625, -1.42254638671875, -1.307342529296875, -1.192138671875, -1.076934814453125, -0.96173095703125, -0.846527099609375, -0.7313232421875, -0.616119384765625, -0.50091552734375, -0.385711669921875, -0.2705078125, -0.155303955078125, -0.04010009765625, 0.075103759765625, 0.1903076171875, 0.305511474609375, 0.42071533203125, 0.535919189453125, 0.651123046875, 0.766326904296875, 0.88153076171875, 0.996734619140625, 1.1119384765625, 1.227142333984375, 1.34234619140625, 1.457550048828125, 1.57275390625, 1.687957763671875, 1.80316162109375, 1.918365478515625, 2.0335693359375, 2.148773193359375, 2.26397705078125, 2.379180908203125, 2.494384765625, 2.609588623046875, 2.72479248046875, 2.839996337890625, 2.9552001953125, 3.070404052734375, 3.18560791015625, 3.300811767578125, 3.416015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 16.0, 19.0, 22.0, 44.0, 58.0, 67.0, 96.0, 131.0, 260.0, 577.0, 1574.0, 6323.0, 40973.0, 402640.0, 2652225.0, 979291.0, 93953.0, 11799.0, 2429.0, 824.0, 376.0, 200.0, 104.0, 75.0, 51.0, 37.0, 28.0, 20.0, 13.0, 15.0, 9.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.49609375, -6.2696533203125, -6.043212890625, -5.8167724609375, -5.59033203125, -5.3638916015625, -5.137451171875, -4.9110107421875, -4.6845703125, -4.4581298828125, -4.231689453125, -4.0052490234375, -3.77880859375, -3.5523681640625, -3.325927734375, -3.0994873046875, -2.873046875, -2.6466064453125, -2.420166015625, -2.1937255859375, -1.96728515625, -1.7408447265625, -1.514404296875, -1.2879638671875, -1.0615234375, -0.8350830078125, -0.608642578125, -0.3822021484375, -0.15576171875, 0.0706787109375, 0.297119140625, 0.5235595703125, 0.75, 0.9764404296875, 1.202880859375, 1.4293212890625, 1.65576171875, 1.8822021484375, 2.108642578125, 2.3350830078125, 2.5615234375, 2.7879638671875, 3.014404296875, 3.2408447265625, 3.46728515625, 3.6937255859375, 3.920166015625, 4.1466064453125, 4.373046875, 4.5994873046875, 4.825927734375, 5.0523681640625, 5.27880859375, 5.5052490234375, 5.731689453125, 5.9581298828125, 6.1845703125, 6.4110107421875, 6.637451171875, 6.8638916015625, 7.09033203125, 7.3167724609375, 7.543212890625, 7.7696533203125, 7.99609375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 26.0, 68.0, 147.0, 224.0, 245.0, 174.0, 82.0, 31.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.302536010742188, -8.842288970947266, -7.3820414543151855, -5.9217939376831055, -4.461546897888184, -3.0012998580932617, -1.5410518646240234, -0.08080482482910156, 1.3794422149658203, 2.8396894931793213, 4.299936771392822, 5.760184288024902, 7.220431327819824, 8.680678367614746, 10.140926361083984, 11.601173400878906, 13.061420440673828, 14.52166748046875, 15.981914520263672, 17.442161560058594, 18.902408599853516, 20.362655639648438, 21.822904586791992, 23.283151626586914, 24.743398666381836, 26.203645706176758, 27.66389274597168, 29.124141693115234, 30.584388732910156, 32.04463577270508, 33.5048828125, 34.96512985229492, 36.425376892089844, 37.885623931884766, 39.34587097167969, 40.80611801147461, 42.26636505126953, 43.72661209106445, 45.186859130859375, 46.64710998535156, 48.10735321044922, 49.56760025024414, 51.02784729003906, 52.488094329833984, 53.948341369628906, 55.40858840942383, 56.86883544921875, 58.32908630371094, 59.78933334350586, 61.24958038330078, 62.7098274230957, 64.17007446289062, 65.63032531738281, 67.09056854248047, 68.55081939697266, 70.01106262207031, 71.4713134765625, 72.93156433105469, 74.39180755615234, 75.85205841064453, 77.31230163574219, 78.77255249023438, 80.23279571533203, 81.69304656982422, 83.15328979492188]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 15.0, 13.0, 14.0, 6.0, 21.0, 16.0, 19.0, 28.0, 30.0, 32.0, 40.0, 34.0, 45.0, 45.0, 47.0, 38.0, 40.0, 41.0, 58.0, 44.0, 36.0, 34.0, 36.0, 28.0, 24.0, 30.0, 24.0, 24.0, 23.0, 19.0, 18.0, 14.0, 15.0, 5.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.236427307128906, -15.772708892822266, -15.308990478515625, -14.8452730178833, -14.38155460357666, -13.91783618927002, -13.454117774963379, -12.990400314331055, -12.526681900024414, -12.062963485717773, -11.599245071411133, -11.135527610778809, -10.671809196472168, -10.208090782165527, -9.744372367858887, -9.280654907226562, -8.816936492919922, -8.353218078613281, -7.889500141143799, -7.425781726837158, -6.962063789367676, -6.498345375061035, -6.0346269607543945, -5.570909023284912, -5.107190132141113, -4.643471717834473, -4.17975378036499, -3.7160353660583496, -3.252317428588867, -2.7885990142822266, -2.324880838394165, -1.8611626625061035, -1.397444725036621, -0.9337265491485596, -0.47000831365585327, -0.006290078163146973, 0.45742809772491455, 0.9211463928222656, 1.3848645687103271, 1.8485827445983887, 2.31230092048645, 2.7760190963745117, 3.2397372722625732, 3.7034554481506348, 4.167173862457275, 4.630891799926758, 5.094610214233398, 5.558328628540039, 6.0220465660095215, 6.485764980316162, 6.9494829177856445, 7.413201332092285, 7.876919269561768, 8.34063720703125, 8.80435562133789, 9.268074035644531, 9.731792449951172, 10.195510864257812, 10.659229278564453, 11.122946739196777, 11.586665153503418, 12.050383567810059, 12.5141019821167, 12.977819442749023, 13.441537857055664]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 0.0, 8.0, 6.0, 13.0, 4.0, 4.0, 11.0, 13.0, 10.0, 23.0, 26.0, 23.0, 23.0, 29.0, 27.0, 35.0, 41.0, 33.0, 37.0, 36.0, 41.0, 40.0, 45.0, 38.0, 45.0, 45.0, 45.0, 35.0, 31.0, 40.0, 23.0, 19.0, 19.0, 21.0, 18.0, 16.0, 13.0, 12.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.658203125, -1.6042938232421875, -1.550384521484375, -1.4964752197265625, -1.44256591796875, -1.3886566162109375, -1.334747314453125, -1.2808380126953125, -1.2269287109375, -1.1730194091796875, -1.119110107421875, -1.0652008056640625, -1.01129150390625, -0.9573822021484375, -0.903472900390625, -0.8495635986328125, -0.795654296875, -0.7417449951171875, -0.687835693359375, -0.6339263916015625, -0.58001708984375, -0.5261077880859375, -0.472198486328125, -0.4182891845703125, -0.3643798828125, -0.3104705810546875, -0.256561279296875, -0.2026519775390625, -0.14874267578125, -0.0948333740234375, -0.040924072265625, 0.0129852294921875, 0.06689453125, 0.1208038330078125, 0.174713134765625, 0.2286224365234375, 0.28253173828125, 0.3364410400390625, 0.390350341796875, 0.4442596435546875, 0.4981689453125, 0.5520782470703125, 0.605987548828125, 0.6598968505859375, 0.71380615234375, 0.7677154541015625, 0.821624755859375, 0.8755340576171875, 0.929443359375, 0.9833526611328125, 1.037261962890625, 1.0911712646484375, 1.14508056640625, 1.1989898681640625, 1.252899169921875, 1.3068084716796875, 1.3607177734375, 1.4146270751953125, 1.468536376953125, 1.5224456787109375, 1.57635498046875, 1.6302642822265625, 1.684173583984375, 1.7380828857421875, 1.7919921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 11.0, 14.0, 21.0, 29.0, 54.0, 67.0, 94.0, 171.0, 253.0, 321.0, 497.0, 800.0, 1140.0, 1722.0, 2495.0, 3814.0, 5843.0, 8904.0, 14292.0, 23064.0, 38850.0, 69216.0, 132918.0, 247915.0, 225332.0, 116475.0, 61082.0, 34957.0, 21040.0, 12980.0, 8284.0, 5285.0, 3477.0, 2410.0, 1548.0, 1001.0, 686.0, 531.0, 285.0, 210.0, 151.0, 112.0, 70.0, 42.0, 32.0, 20.0, 16.0, 8.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2420654296875, -0.23423194885253906, -0.22639846801757812, -0.2185649871826172, -0.21073150634765625, -0.2028980255126953, -0.19506454467773438, -0.18723106384277344, -0.1793975830078125, -0.17156410217285156, -0.16373062133789062, -0.1558971405029297, -0.14806365966796875, -0.1402301788330078, -0.13239669799804688, -0.12456321716308594, -0.116729736328125, -0.10889625549316406, -0.10106277465820312, -0.09322929382324219, -0.08539581298828125, -0.07756233215332031, -0.06972885131835938, -0.06189537048339844, -0.0540618896484375, -0.04622840881347656, -0.038394927978515625, -0.030561447143554688, -0.02272796630859375, -0.014894485473632812, -0.007061004638671875, 0.0007724761962890625, 0.00860595703125, 0.016439437866210938, 0.024272918701171875, 0.03210639953613281, 0.03993988037109375, 0.04777336120605469, 0.055606842041015625, 0.06344032287597656, 0.0712738037109375, 0.07910728454589844, 0.08694076538085938, 0.09477424621582031, 0.10260772705078125, 0.11044120788574219, 0.11827468872070312, 0.12610816955566406, 0.133941650390625, 0.14177513122558594, 0.14960861206054688, 0.1574420928955078, 0.16527557373046875, 0.1731090545654297, 0.18094253540039062, 0.18877601623535156, 0.1966094970703125, 0.20444297790527344, 0.21227645874023438, 0.2201099395751953, 0.22794342041015625, 0.2357769012451172, 0.24361038208007812, 0.25144386291503906, 0.25927734375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 5.0, 15.0, 15.0, 16.0, 16.0, 11.0, 20.0, 24.0, 32.0, 36.0, 35.0, 37.0, 30.0, 53.0, 35.0, 34.0, 43.0, 1061.0, 40.0, 45.0, 39.0, 42.0, 39.0, 31.0, 41.0, 30.0, 31.0, 34.0, 32.0, 14.0, 9.0, 16.0, 10.0, 15.0, 6.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2939453125, -1.2555999755859375, -1.217254638671875, -1.1789093017578125, -1.14056396484375, -1.1022186279296875, -1.063873291015625, -1.0255279541015625, -0.9871826171875, -0.9488372802734375, -0.910491943359375, -0.8721466064453125, -0.83380126953125, -0.7954559326171875, -0.757110595703125, -0.7187652587890625, -0.680419921875, -0.6420745849609375, -0.603729248046875, -0.5653839111328125, -0.52703857421875, -0.4886932373046875, -0.450347900390625, -0.4120025634765625, -0.3736572265625, -0.3353118896484375, -0.296966552734375, -0.2586212158203125, -0.22027587890625, -0.1819305419921875, -0.143585205078125, -0.1052398681640625, -0.06689453125, -0.0285491943359375, 0.009796142578125, 0.0481414794921875, 0.08648681640625, 0.1248321533203125, 0.163177490234375, 0.2015228271484375, 0.2398681640625, 0.2782135009765625, 0.316558837890625, 0.3549041748046875, 0.39324951171875, 0.4315948486328125, 0.469940185546875, 0.5082855224609375, 0.546630859375, 0.5849761962890625, 0.623321533203125, 0.6616668701171875, 0.70001220703125, 0.7383575439453125, 0.776702880859375, 0.8150482177734375, 0.8533935546875, 0.8917388916015625, 0.930084228515625, 0.9684295654296875, 1.00677490234375, 1.0451202392578125, 1.083465576171875, 1.1218109130859375, 1.16015625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 11.0, 14.0, 21.0, 29.0, 56.0, 68.0, 97.0, 154.0, 186.0, 269.0, 404.0, 641.0, 850.0, 1348.0, 2073.0, 3263.0, 5138.0, 8063.0, 13326.0, 22475.0, 38225.0, 67067.0, 124130.0, 235823.0, 1261601.0, 135348.0, 73457.0, 40880.0, 23580.0, 14064.0, 8700.0, 5497.0, 3390.0, 2288.0, 1509.0, 994.0, 677.0, 448.0, 303.0, 222.0, 143.0, 88.0, 73.0, 40.0, 30.0, 22.0, 21.0, 11.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.202880859375, -0.19692611694335938, -0.19097137451171875, -0.18501663208007812, -0.1790618896484375, -0.17310714721679688, -0.16715240478515625, -0.16119766235351562, -0.155242919921875, -0.14928817749023438, -0.14333343505859375, -0.13737869262695312, -0.1314239501953125, -0.12546920776367188, -0.11951446533203125, -0.11355972290039062, -0.10760498046875, -0.10165023803710938, -0.09569549560546875, -0.08974075317382812, -0.0837860107421875, -0.07783126831054688, -0.07187652587890625, -0.06592178344726562, -0.059967041015625, -0.054012298583984375, -0.04805755615234375, -0.042102813720703125, -0.0361480712890625, -0.030193328857421875, -0.02423858642578125, -0.018283843994140625, -0.0123291015625, -0.006374359130859375, -0.00041961669921875, 0.005535125732421875, 0.0114898681640625, 0.017444610595703125, 0.02339935302734375, 0.029354095458984375, 0.035308837890625, 0.041263580322265625, 0.04721832275390625, 0.053173065185546875, 0.0591278076171875, 0.06508255004882812, 0.07103729248046875, 0.07699203491210938, 0.08294677734375, 0.08890151977539062, 0.09485626220703125, 0.10081100463867188, 0.1067657470703125, 0.11272048950195312, 0.11867523193359375, 0.12462997436523438, 0.130584716796875, 0.13653945922851562, 0.14249420166015625, 0.14844894409179688, 0.1544036865234375, 0.16035842895507812, 0.16631317138671875, 0.17226791381835938, 0.17822265625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 3.0, 9.0, 14.0, 9.0, 20.0, 17.0, 9.0, 23.0, 34.0, 56.0, 51.0, 74.0, 77.0, 78.0, 79.0, 68.0, 57.0, 57.0, 42.0, 38.0, 36.0, 20.0, 18.0, 13.0, 19.0, 9.0, 10.0, 6.0, 6.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00090789794921875, -0.000881493091583252, -0.0008550882339477539, -0.0008286833763122559, -0.0008022785186767578, -0.0007758736610412598, -0.0007494688034057617, -0.0007230639457702637, -0.0006966590881347656, -0.0006702542304992676, -0.0006438493728637695, -0.0006174445152282715, -0.0005910396575927734, -0.0005646347999572754, -0.0005382299423217773, -0.0005118250846862793, -0.00048542022705078125, -0.0004590153694152832, -0.00043261051177978516, -0.0004062056541442871, -0.00037980079650878906, -0.000353395938873291, -0.00032699108123779297, -0.0003005862236022949, -0.0002741813659667969, -0.00024777650833129883, -0.00022137165069580078, -0.00019496679306030273, -0.0001685619354248047, -0.00014215707778930664, -0.0001157522201538086, -8.934736251831055e-05, -6.29425048828125e-05, -3.653764724731445e-05, -1.0132789611816406e-05, 1.627206802368164e-05, 4.267692565917969e-05, 6.908178329467773e-05, 9.548664093017578e-05, 0.00012189149856567383, 0.00014829635620117188, 0.00017470121383666992, 0.00020110607147216797, 0.00022751092910766602, 0.00025391578674316406, 0.0002803206443786621, 0.00030672550201416016, 0.0003331303596496582, 0.00035953521728515625, 0.0003859400749206543, 0.00041234493255615234, 0.0004387497901916504, 0.00046515464782714844, 0.0004915595054626465, 0.0005179643630981445, 0.0005443692207336426, 0.0005707740783691406, 0.0005971789360046387, 0.0006235837936401367, 0.0006499886512756348, 0.0006763935089111328, 0.0007027983665466309, 0.0007292032241821289, 0.000755608081817627, 0.000782012939453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 4.0, 9.0, 5.0, 9.0, 10.0, 18.0, 28.0, 32.0, 32.0, 56.0, 86.0, 114.0, 225.0, 409.0, 1133.0, 181806.0, 861221.0, 2049.0, 519.0, 266.0, 153.0, 107.0, 62.0, 46.0, 26.0, 25.0, 17.0, 13.0, 12.0, 10.0, 6.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01611328125, -0.015560150146484375, -0.01500701904296875, -0.014453887939453125, -0.0139007568359375, -0.013347625732421875, -0.01279449462890625, -0.012241363525390625, -0.011688232421875, -0.011135101318359375, -0.01058197021484375, -0.010028839111328125, -0.0094757080078125, -0.008922576904296875, -0.00836944580078125, -0.007816314697265625, -0.00726318359375, -0.006710052490234375, -0.00615692138671875, -0.005603790283203125, -0.0050506591796875, -0.004497528076171875, -0.00394439697265625, -0.003391265869140625, -0.002838134765625, -0.002285003662109375, -0.00173187255859375, -0.001178741455078125, -0.0006256103515625, -7.2479248046875e-05, 0.00048065185546875, 0.001033782958984375, 0.0015869140625, 0.002140045166015625, 0.00269317626953125, 0.003246307373046875, 0.0037994384765625, 0.004352569580078125, 0.00490570068359375, 0.005458831787109375, 0.006011962890625, 0.006565093994140625, 0.00711822509765625, 0.007671356201171875, 0.0082244873046875, 0.008777618408203125, 0.00933074951171875, 0.009883880615234375, 0.01043701171875, 0.010990142822265625, 0.01154327392578125, 0.012096405029296875, 0.0126495361328125, 0.013202667236328125, 0.01375579833984375, 0.014308929443359375, 0.014862060546875, 0.015415191650390625, 0.01596832275390625, 0.016521453857421875, 0.0170745849609375, 0.017627716064453125, 0.01818084716796875, 0.018733978271484375, 0.019287109375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 48.0, 219.0, 397.0, 262.0, 62.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022262653801590204, -0.002165293786674738, -0.0021043221931904554, -0.0020433503668755293, -0.001982378773391247, -0.0019214071799069643, -0.0018604355864226818, -0.0017994639929383993, -0.001738492283038795, -0.0016775206895545125, -0.0016165489796549082, -0.0015555773861706257, -0.0014946057926863432, -0.0014336340827867389, -0.0013726624893024564, -0.001311690779402852, -0.0012507191859185696, -0.001189747592434287, -0.0011287758825346828, -0.0010678042890504003, -0.001006832579150796, -0.0009458609856665134, -0.000884889392182231, -0.0008239177404902875, -0.0007629460887983441, -0.0007019744371064007, -0.0006410027854144573, -0.0005800311919301748, -0.0005190595402382314, -0.000458087888546288, -0.00039711626595817506, -0.0003361446433700621, -0.00027517310809344053, -0.00021420147095341235, -0.00015322983381338418, -9.2258196673356e-05, -3.128655953332782e-05, 2.968509215861559e-05, 9.065671474672854e-05, 0.0001516283373348415, 0.0002125999890267849, 0.0002735716407187283, 0.00033454326330684125, 0.0003955148858949542, 0.0004564865375868976, 0.000517458189278841, 0.0005784297827631235, 0.0006394014344550669, 0.0007003730861470103, 0.0007613447378389537, 0.0008223163895308971, 0.0008832879830151796, 0.000944259634707123, 0.0010052312863990664, 0.001066202879883349, 0.0011271745897829533, 0.0011881461832672358, 0.0012491177767515182, 0.0013100894866511226, 0.001371061080135405, 0.0014320327900350094, 0.0014930043835192919, 0.0015539759770035744, 0.0016149475704878569, 0.0016759192803874612]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 5.0, 7.0, 4.0, 14.0, 10.0, 10.0, 18.0, 18.0, 29.0, 22.0, 18.0, 30.0, 26.0, 31.0, 40.0, 21.0, 36.0, 50.0, 45.0, 52.0, 48.0, 37.0, 47.0, 27.0, 39.0, 35.0, 35.0, 35.0, 25.0, 22.0, 25.0, 18.0, 27.0, 13.0, 7.0, 11.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.0003914833068847656, -0.0003781011328101158, -0.000364718958735466, -0.0003513367846608162, -0.0003379546105861664, -0.00032457243651151657, -0.00031119026243686676, -0.00029780808836221695, -0.00028442591428756714, -0.00027104374021291733, -0.0002576615661382675, -0.0002442793920636177, -0.0002308972179889679, -0.00021751504391431808, -0.00020413286983966827, -0.00019075069576501846, -0.00017736852169036865, -0.00016398634761571884, -0.00015060417354106903, -0.00013722199946641922, -0.0001238398253917694, -0.0001104576513171196, -9.707547724246979e-05, -8.369330316781998e-05, -7.031112909317017e-05, -5.6928955018520355e-05, -4.3546780943870544e-05, -3.0164606869220734e-05, -1.6782432794570923e-05, -3.400258719921112e-06, 9.981915354728699e-06, 2.336408942937851e-05, 3.674626350402832e-05, 5.012843757867813e-05, 6.351061165332794e-05, 7.689278572797775e-05, 9.027495980262756e-05, 0.00010365713387727737, 0.00011703930795192719, 0.000130421482026577, 0.0001438036561012268, 0.00015718583017587662, 0.00017056800425052643, 0.00018395017832517624, 0.00019733235239982605, 0.00021071452647447586, 0.00022409670054912567, 0.00023747887462377548, 0.0002508610486984253, 0.0002642432227730751, 0.0002776253968477249, 0.0002910075709223747, 0.00030438974499702454, 0.00031777191907167435, 0.00033115409314632416, 0.00034453626722097397, 0.0003579184412956238, 0.0003713006153702736, 0.0003846827894449234, 0.0003980649635195732, 0.000411447137594223, 0.00042482931166887283, 0.00043821148574352264, 0.00045159365981817245, 0.00046497583389282227]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 0.0, 8.0, 6.0, 13.0, 4.0, 4.0, 11.0, 13.0, 10.0, 23.0, 26.0, 23.0, 23.0, 29.0, 27.0, 35.0, 41.0, 33.0, 37.0, 36.0, 41.0, 40.0, 45.0, 38.0, 45.0, 45.0, 45.0, 35.0, 31.0, 40.0, 23.0, 19.0, 19.0, 21.0, 18.0, 16.0, 13.0, 12.0, 11.0, 7.0, 3.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.658203125, -1.6042938232421875, -1.550384521484375, -1.4964752197265625, -1.44256591796875, -1.3886566162109375, -1.334747314453125, -1.2808380126953125, -1.2269287109375, -1.1730194091796875, -1.119110107421875, -1.0652008056640625, -1.01129150390625, -0.9573822021484375, -0.903472900390625, -0.8495635986328125, -0.795654296875, -0.7417449951171875, -0.687835693359375, -0.6339263916015625, -0.58001708984375, -0.5261077880859375, -0.472198486328125, -0.4182891845703125, -0.3643798828125, -0.3104705810546875, -0.256561279296875, -0.2026519775390625, -0.14874267578125, -0.0948333740234375, -0.040924072265625, 0.0129852294921875, 0.06689453125, 0.1208038330078125, 0.174713134765625, 0.2286224365234375, 0.28253173828125, 0.3364410400390625, 0.390350341796875, 0.4442596435546875, 0.4981689453125, 0.5520782470703125, 0.605987548828125, 0.6598968505859375, 0.71380615234375, 0.7677154541015625, 0.821624755859375, 0.8755340576171875, 0.929443359375, 0.9833526611328125, 1.037261962890625, 1.0911712646484375, 1.14508056640625, 1.1989898681640625, 1.252899169921875, 1.3068084716796875, 1.3607177734375, 1.4146270751953125, 1.468536376953125, 1.5224456787109375, 1.57635498046875, 1.6302642822265625, 1.684173583984375, 1.7380828857421875, 1.7919921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 4.0, 7.0, 10.0, 8.0, 25.0, 31.0, 43.0, 61.0, 74.0, 107.0, 191.0, 266.0, 412.0, 634.0, 1019.0, 1639.0, 3078.0, 5166.0, 9586.0, 19286.0, 44239.0, 118925.0, 316471.0, 319434.0, 121476.0, 44417.0, 19305.0, 9746.0, 5309.0, 2953.0, 1771.0, 1005.0, 634.0, 388.0, 263.0, 166.0, 123.0, 74.0, 58.0, 36.0, 32.0, 20.0, 14.0, 9.0, 8.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9658203125, -1.9024200439453125, -1.839019775390625, -1.7756195068359375, -1.71221923828125, -1.6488189697265625, -1.585418701171875, -1.5220184326171875, -1.4586181640625, -1.3952178955078125, -1.331817626953125, -1.2684173583984375, -1.20501708984375, -1.1416168212890625, -1.078216552734375, -1.0148162841796875, -0.951416015625, -0.8880157470703125, -0.824615478515625, -0.7612152099609375, -0.69781494140625, -0.6344146728515625, -0.571014404296875, -0.5076141357421875, -0.4442138671875, -0.3808135986328125, -0.317413330078125, -0.2540130615234375, -0.19061279296875, -0.1272125244140625, -0.063812255859375, -0.0004119873046875, 0.06298828125, 0.1263885498046875, 0.189788818359375, 0.2531890869140625, 0.31658935546875, 0.3799896240234375, 0.443389892578125, 0.5067901611328125, 0.5701904296875, 0.6335906982421875, 0.696990966796875, 0.7603912353515625, 0.82379150390625, 0.8871917724609375, 0.950592041015625, 1.0139923095703125, 1.077392578125, 1.1407928466796875, 1.204193115234375, 1.2675933837890625, 1.33099365234375, 1.3943939208984375, 1.457794189453125, 1.5211944580078125, 1.5845947265625, 1.6479949951171875, 1.711395263671875, 1.7747955322265625, 1.83819580078125, 1.9015960693359375, 1.964996337890625, 2.0283966064453125, 2.091796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 6.0, 6.0, 4.0, 10.0, 10.0, 9.0, 9.0, 16.0, 18.0, 18.0, 25.0, 39.0, 27.0, 36.0, 53.0, 53.0, 65.0, 79.0, 174.0, 1390.0, 330.0, 181.0, 81.0, 51.0, 47.0, 43.0, 44.0, 31.0, 35.0, 27.0, 24.0, 18.0, 15.0, 12.0, 11.0, 6.0, 9.0, 8.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.6341552734375, -6.412841796875, -6.1915283203125, -5.97021484375, -5.7489013671875, -5.527587890625, -5.3062744140625, -5.0849609375, -4.8636474609375, -4.642333984375, -4.4210205078125, -4.19970703125, -3.9783935546875, -3.757080078125, -3.5357666015625, -3.314453125, -3.0931396484375, -2.871826171875, -2.6505126953125, -2.42919921875, -2.2078857421875, -1.986572265625, -1.7652587890625, -1.5439453125, -1.3226318359375, -1.101318359375, -0.8800048828125, -0.65869140625, -0.4373779296875, -0.216064453125, 0.0052490234375, 0.2265625, 0.4478759765625, 0.669189453125, 0.8905029296875, 1.11181640625, 1.3331298828125, 1.554443359375, 1.7757568359375, 1.9970703125, 2.2183837890625, 2.439697265625, 2.6610107421875, 2.88232421875, 3.1036376953125, 3.324951171875, 3.5462646484375, 3.767578125, 3.9888916015625, 4.210205078125, 4.4315185546875, 4.65283203125, 4.8741455078125, 5.095458984375, 5.3167724609375, 5.5380859375, 5.7593994140625, 5.980712890625, 6.2020263671875, 6.42333984375, 6.6446533203125, 6.865966796875, 7.0872802734375, 7.30859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 8.0, 22.0, 20.0, 30.0, 41.0, 74.0, 109.0, 157.0, 315.0, 814.0, 7764.0, 3101311.0, 33003.0, 1127.0, 367.0, 182.0, 122.0, 63.0, 56.0, 31.0, 16.0, 19.0, 16.0, 9.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-33.59375, -32.74609375, -31.8984375, -31.05078125, -30.203125, -29.35546875, -28.5078125, -27.66015625, -26.8125, -25.96484375, -25.1171875, -24.26953125, -23.421875, -22.57421875, -21.7265625, -20.87890625, -20.03125, -19.18359375, -18.3359375, -17.48828125, -16.640625, -15.79296875, -14.9453125, -14.09765625, -13.25, -12.40234375, -11.5546875, -10.70703125, -9.859375, -9.01171875, -8.1640625, -7.31640625, -6.46875, -5.62109375, -4.7734375, -3.92578125, -3.078125, -2.23046875, -1.3828125, -0.53515625, 0.3125, 1.16015625, 2.0078125, 2.85546875, 3.703125, 4.55078125, 5.3984375, 6.24609375, 7.09375, 7.94140625, 8.7890625, 9.63671875, 10.484375, 11.33203125, 12.1796875, 13.02734375, 13.875, 14.72265625, 15.5703125, 16.41796875, 17.265625, 18.11328125, 18.9609375, 19.80859375, 20.65625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [859.0, 155.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.426872730255127, 1.045492172241211, 5.517857074737549, 9.990222930908203, 14.462587356567383, 18.934951782226562, 23.407318115234375, 27.879682540893555, 32.352046966552734, 36.82441329956055, 41.296775817871094, 45.769142150878906, 50.24150848388672, 54.713871002197266, 59.18623733520508, 63.658599853515625, 68.13096618652344, 72.60333251953125, 77.07569885253906, 81.54806518554688, 86.02042388916016, 90.49279022216797, 94.96515655517578, 99.4375228881836, 103.90988159179688, 108.38224792480469, 112.8546142578125, 117.32698059082031, 121.7993392944336, 126.2717056274414, 130.74407958984375, 135.2164306640625, 139.6887969970703, 144.16116333007812, 148.63352966308594, 153.10589599609375, 157.57826232910156, 162.05062866210938, 166.52297973632812, 170.99534606933594, 175.46771240234375, 179.94007873535156, 184.41244506835938, 188.8848114013672, 193.357177734375, 197.82952880859375, 202.30191040039062, 206.77426147460938, 211.24664306640625, 215.71900939941406, 220.19137573242188, 224.6637420654297, 229.1361083984375, 233.60845947265625, 238.08084106445312, 242.55319213867188, 247.0255584716797, 251.4979248046875, 255.9702911376953, 260.4426574707031, 264.9150085449219, 269.38739013671875, 273.8597412109375, 278.3321228027344, 282.8044738769531]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 5.0, 13.0, 10.0, 9.0, 11.0, 16.0, 11.0, 21.0, 17.0, 19.0, 23.0, 24.0, 24.0, 26.0, 36.0, 27.0, 35.0, 40.0, 29.0, 39.0, 42.0, 39.0, 40.0, 46.0, 37.0, 32.0, 35.0, 22.0, 18.0, 38.0, 24.0, 30.0, 23.0, 27.0, 14.0, 17.0, 13.0, 8.0, 11.0, 8.0, 7.0, 8.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-16.991905212402344, -16.486116409301758, -15.980329513549805, -15.474541664123535, -14.968753814697266, -14.46296501159668, -13.95717716217041, -13.45138931274414, -12.945601463317871, -12.439813613891602, -11.934025764465332, -11.428237915039062, -10.922449111938477, -10.416662216186523, -9.910873413085938, -9.405085563659668, -8.899297714233398, -8.393509864807129, -7.887722015380859, -7.381933689117432, -6.876145839691162, -6.370357990264893, -5.864569664001465, -5.358781814575195, -4.852993965148926, -4.347206115722656, -3.8414180278778076, -3.335629940032959, -2.8298420906066895, -2.32405424118042, -1.8182661533355713, -1.3124780654907227, -0.8066921234130859, -0.30090415477752686, 0.20488381385803223, 0.7106717824935913, 1.2164597511291504, 1.72224760055542, 2.2280356884002686, 2.733823776245117, 3.2396116256713867, 3.7453994750976562, 4.251187324523926, 4.7569756507873535, 5.262763500213623, 5.768551349639893, 6.27433967590332, 6.78012752532959, 7.285915374755859, 7.791703224182129, 8.297491073608398, 8.803278923034668, 9.309066772460938, 9.814855575561523, 10.320643424987793, 10.826431274414062, 11.332219123840332, 11.838006973266602, 12.343794822692871, 12.84958267211914, 13.355371475219727, 13.86115837097168, 14.366947174072266, 14.872735023498535, 15.378522872924805]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 9.0, 10.0, 8.0, 18.0, 8.0, 19.0, 21.0, 25.0, 19.0, 21.0, 31.0, 33.0, 26.0, 33.0, 36.0, 35.0, 34.0, 41.0, 36.0, 41.0, 34.0, 47.0, 45.0, 41.0, 41.0, 38.0, 40.0, 26.0, 27.0, 20.0, 10.0, 14.0, 14.0, 21.0, 10.0, 11.0, 5.0, 4.0, 7.0, 6.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.697265625, -1.640472412109375, -1.58367919921875, -1.526885986328125, -1.4700927734375, -1.413299560546875, -1.35650634765625, -1.299713134765625, -1.242919921875, -1.186126708984375, -1.12933349609375, -1.072540283203125, -1.0157470703125, -0.958953857421875, -0.90216064453125, -0.845367431640625, -0.78857421875, -0.731781005859375, -0.67498779296875, -0.618194580078125, -0.5614013671875, -0.504608154296875, -0.44781494140625, -0.391021728515625, -0.334228515625, -0.277435302734375, -0.22064208984375, -0.163848876953125, -0.1070556640625, -0.050262451171875, 0.00653076171875, 0.063323974609375, 0.1201171875, 0.176910400390625, 0.23370361328125, 0.290496826171875, 0.3472900390625, 0.404083251953125, 0.46087646484375, 0.517669677734375, 0.574462890625, 0.631256103515625, 0.68804931640625, 0.744842529296875, 0.8016357421875, 0.858428955078125, 0.91522216796875, 0.972015380859375, 1.02880859375, 1.085601806640625, 1.14239501953125, 1.199188232421875, 1.2559814453125, 1.312774658203125, 1.36956787109375, 1.426361083984375, 1.483154296875, 1.539947509765625, 1.59674072265625, 1.653533935546875, 1.7103271484375, 1.767120361328125, 1.82391357421875, 1.880706787109375, 1.9375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 6.0, 7.0, 12.0, 8.0, 13.0, 25.0, 20.0, 24.0, 28.0, 41.0, 45.0, 40.0, 54.0, 58.0, 70.0, 112.0, 176.0, 405.0, 1579.0, 14027.0, 453125.0, 3371785.0, 338773.0, 11274.0, 1398.0, 374.0, 196.0, 140.0, 86.0, 61.0, 44.0, 32.0, 33.0, 39.0, 35.0, 29.0, 10.0, 10.0, 13.0, 17.0, 8.0, 14.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1171875, -6.8756103515625, -6.634033203125, -6.3924560546875, -6.15087890625, -5.9093017578125, -5.667724609375, -5.4261474609375, -5.1845703125, -4.9429931640625, -4.701416015625, -4.4598388671875, -4.21826171875, -3.9766845703125, -3.735107421875, -3.4935302734375, -3.251953125, -3.0103759765625, -2.768798828125, -2.5272216796875, -2.28564453125, -2.0440673828125, -1.802490234375, -1.5609130859375, -1.3193359375, -1.0777587890625, -0.836181640625, -0.5946044921875, -0.35302734375, -0.1114501953125, 0.130126953125, 0.3717041015625, 0.61328125, 0.8548583984375, 1.096435546875, 1.3380126953125, 1.57958984375, 1.8211669921875, 2.062744140625, 2.3043212890625, 2.5458984375, 2.7874755859375, 3.029052734375, 3.2706298828125, 3.51220703125, 3.7537841796875, 3.995361328125, 4.2369384765625, 4.478515625, 4.7200927734375, 4.961669921875, 5.2032470703125, 5.44482421875, 5.6864013671875, 5.927978515625, 6.1695556640625, 6.4111328125, 6.6527099609375, 6.894287109375, 7.1358642578125, 7.37744140625, 7.6190185546875, 7.860595703125, 8.1021728515625, 8.34375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 10.0, 9.0, 23.0, 32.0, 51.0, 63.0, 95.0, 127.0, 194.0, 256.0, 388.0, 441.0, 514.0, 464.0, 426.0, 303.0, 207.0, 136.0, 97.0, 70.0, 49.0, 34.0, 26.0, 17.0, 9.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29296875, -5.1197509765625, -4.946533203125, -4.7733154296875, -4.60009765625, -4.4268798828125, -4.253662109375, -4.0804443359375, -3.9072265625, -3.7340087890625, -3.560791015625, -3.3875732421875, -3.21435546875, -3.0411376953125, -2.867919921875, -2.6947021484375, -2.521484375, -2.3482666015625, -2.175048828125, -2.0018310546875, -1.82861328125, -1.6553955078125, -1.482177734375, -1.3089599609375, -1.1357421875, -0.9625244140625, -0.789306640625, -0.6160888671875, -0.44287109375, -0.2696533203125, -0.096435546875, 0.0767822265625, 0.25, 0.4232177734375, 0.596435546875, 0.7696533203125, 0.94287109375, 1.1160888671875, 1.289306640625, 1.4625244140625, 1.6357421875, 1.8089599609375, 1.982177734375, 2.1553955078125, 2.32861328125, 2.5018310546875, 2.675048828125, 2.8482666015625, 3.021484375, 3.1947021484375, 3.367919921875, 3.5411376953125, 3.71435546875, 3.8875732421875, 4.060791015625, 4.2340087890625, 4.4072265625, 4.5804443359375, 4.753662109375, 4.9268798828125, 5.10009765625, 5.2733154296875, 5.446533203125, 5.6197509765625, 5.79296875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 10.0, 13.0, 22.0, 34.0, 41.0, 74.0, 99.0, 182.0, 266.0, 509.0, 1590.0, 23170.0, 2131487.0, 2012358.0, 21617.0, 1606.0, 487.0, 259.0, 149.0, 94.0, 77.0, 49.0, 23.0, 24.0, 11.0, 8.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4296875, -14.9473876953125, -14.465087890625, -13.9827880859375, -13.50048828125, -13.0181884765625, -12.535888671875, -12.0535888671875, -11.5712890625, -11.0889892578125, -10.606689453125, -10.1243896484375, -9.64208984375, -9.1597900390625, -8.677490234375, -8.1951904296875, -7.712890625, -7.2305908203125, -6.748291015625, -6.2659912109375, -5.78369140625, -5.3013916015625, -4.819091796875, -4.3367919921875, -3.8544921875, -3.3721923828125, -2.889892578125, -2.4075927734375, -1.92529296875, -1.4429931640625, -0.960693359375, -0.4783935546875, 0.00390625, 0.4862060546875, 0.968505859375, 1.4508056640625, 1.93310546875, 2.4154052734375, 2.897705078125, 3.3800048828125, 3.8623046875, 4.3446044921875, 4.826904296875, 5.3092041015625, 5.79150390625, 6.2738037109375, 6.756103515625, 7.2384033203125, 7.720703125, 8.2030029296875, 8.685302734375, 9.1676025390625, 9.64990234375, 10.1322021484375, 10.614501953125, 11.0968017578125, 11.5791015625, 12.0614013671875, 12.543701171875, 13.0260009765625, 13.50830078125, 13.9906005859375, 14.472900390625, 14.9552001953125, 15.4375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 185.0, 674.0, 148.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.9256134033203, -189.0108642578125, -184.09613037109375, -179.18138122558594, -174.26663208007812, -169.3518829345703, -164.4371337890625, -159.52239990234375, -154.60765075683594, -149.69290161132812, -144.77816772460938, -139.86341857910156, -134.94866943359375, -130.03392028808594, -125.11917877197266, -120.20443725585938, -115.28968811035156, -110.37493896484375, -105.46019744873047, -100.54545593261719, -95.63070678710938, -90.71595764160156, -85.80121612548828, -80.886474609375, -75.97172546386719, -71.05697631835938, -66.1422348022461, -61.22748947143555, -56.312744140625, -51.39799880981445, -46.483253479003906, -41.56850814819336, -36.65374755859375, -31.739002227783203, -26.824256896972656, -21.90951156616211, -16.994766235351562, -12.080020904541016, -7.165275573730469, -2.250530242919922, 2.664215087890625, 7.578960418701172, 12.493705749511719, 17.408451080322266, 22.323196411132812, 27.23794174194336, 32.152687072753906, 37.06743240356445, 41.982177734375, 46.89692306518555, 51.811668395996094, 56.72641372680664, 61.64115905761719, 66.555908203125, 71.47064971923828, 76.38539123535156, 81.30014038085938, 86.21488952636719, 91.12963104248047, 96.04437255859375, 100.95912170410156, 105.87387084960938, 110.78861236572266, 115.70335388183594, 120.61810302734375]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 6.0, 9.0, 15.0, 15.0, 15.0, 18.0, 24.0, 25.0, 20.0, 26.0, 28.0, 36.0, 41.0, 44.0, 40.0, 51.0, 48.0, 41.0, 47.0, 36.0, 30.0, 45.0, 35.0, 34.0, 43.0, 36.0, 32.0, 22.0, 25.0, 23.0, 19.0, 7.0, 6.0, 9.0, 11.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.537100791931152, -15.014609336853027, -14.492117881774902, -13.969627380371094, -13.447135925292969, -12.924644470214844, -12.402153015136719, -11.879661560058594, -11.357170104980469, -10.834678649902344, -10.312187194824219, -9.789695739746094, -9.267205238342285, -8.74471378326416, -8.222222328186035, -7.69973087310791, -7.177240371704102, -6.654748916625977, -6.13225793838501, -5.609766483306885, -5.087275505065918, -4.564784049987793, -4.042292594909668, -3.519801378250122, -2.997310161590576, -2.4748189449310303, -1.9523276090621948, -1.4298362731933594, -0.9073450565338135, -0.3848538398742676, 0.13763761520385742, 0.6601288318634033, 1.1826190948486328, 1.7051103115081787, 2.2276015281677246, 2.7500929832458496, 3.2725841999053955, 3.7950754165649414, 4.317566871643066, 4.840058326721191, 5.362549304962158, 5.885040760040283, 6.40753173828125, 6.930023193359375, 7.4525146484375, 7.975005626678467, 8.49749755859375, 9.019988059997559, 9.542479515075684, 10.064970970153809, 10.587462425231934, 11.109952926635742, 11.632444381713867, 12.154935836791992, 12.677427291870117, 13.199918746948242, 13.722410202026367, 14.244901657104492, 14.767393112182617, 15.289884567260742, 15.81237506866455, 16.33486557006836, 16.857357025146484, 17.37984848022461, 17.902339935302734]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 6.0, 6.0, 7.0, 8.0, 12.0, 10.0, 13.0, 13.0, 19.0, 17.0, 22.0, 19.0, 23.0, 25.0, 29.0, 30.0, 37.0, 50.0, 37.0, 38.0, 50.0, 42.0, 31.0, 39.0, 44.0, 47.0, 30.0, 39.0, 37.0, 19.0, 27.0, 24.0, 26.0, 21.0, 16.0, 16.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.654296875, -1.596221923828125, -1.53814697265625, -1.480072021484375, -1.4219970703125, -1.363922119140625, -1.30584716796875, -1.247772216796875, -1.189697265625, -1.131622314453125, -1.07354736328125, -1.015472412109375, -0.9573974609375, -0.899322509765625, -0.84124755859375, -0.783172607421875, -0.72509765625, -0.667022705078125, -0.60894775390625, -0.550872802734375, -0.4927978515625, -0.434722900390625, -0.37664794921875, -0.318572998046875, -0.260498046875, -0.202423095703125, -0.14434814453125, -0.086273193359375, -0.0281982421875, 0.029876708984375, 0.08795166015625, 0.146026611328125, 0.2041015625, 0.262176513671875, 0.32025146484375, 0.378326416015625, 0.4364013671875, 0.494476318359375, 0.55255126953125, 0.610626220703125, 0.668701171875, 0.726776123046875, 0.78485107421875, 0.842926025390625, 0.9010009765625, 0.959075927734375, 1.01715087890625, 1.075225830078125, 1.13330078125, 1.191375732421875, 1.24945068359375, 1.307525634765625, 1.3656005859375, 1.423675537109375, 1.48175048828125, 1.539825439453125, 1.597900390625, 1.655975341796875, 1.71405029296875, 1.772125244140625, 1.8302001953125, 1.888275146484375, 1.94635009765625, 2.004425048828125, 2.0625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 3.0, 8.0, 4.0, 8.0, 12.0, 17.0, 43.0, 54.0, 62.0, 106.0, 164.0, 245.0, 329.0, 528.0, 795.0, 1192.0, 1809.0, 2693.0, 4110.0, 6046.0, 9370.0, 14634.0, 23034.0, 38353.0, 65895.0, 115754.0, 205618.0, 228907.0, 135649.0, 75413.0, 43918.0, 26431.0, 16602.0, 10506.0, 6838.0, 4444.0, 2986.0, 2001.0, 1329.0, 851.0, 583.0, 388.0, 292.0, 184.0, 137.0, 70.0, 43.0, 35.0, 27.0, 13.0, 15.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.236083984375, -0.22824859619140625, -0.2204132080078125, -0.21257781982421875, -0.204742431640625, -0.19690704345703125, -0.1890716552734375, -0.18123626708984375, -0.17340087890625, -0.16556549072265625, -0.1577301025390625, -0.14989471435546875, -0.142059326171875, -0.13422393798828125, -0.1263885498046875, -0.11855316162109375, -0.1107177734375, -0.10288238525390625, -0.0950469970703125, -0.08721160888671875, -0.079376220703125, -0.07154083251953125, -0.0637054443359375, -0.05587005615234375, -0.04803466796875, -0.04019927978515625, -0.0323638916015625, -0.02452850341796875, -0.016693115234375, -0.00885772705078125, -0.0010223388671875, 0.00681304931640625, 0.0146484375, 0.02248382568359375, 0.0303192138671875, 0.03815460205078125, 0.045989990234375, 0.05382537841796875, 0.0616607666015625, 0.06949615478515625, 0.07733154296875, 0.08516693115234375, 0.0930023193359375, 0.10083770751953125, 0.108673095703125, 0.11650848388671875, 0.1243438720703125, 0.13217926025390625, 0.1400146484375, 0.14785003662109375, 0.1556854248046875, 0.16352081298828125, 0.171356201171875, 0.17919158935546875, 0.1870269775390625, 0.19486236572265625, 0.20269775390625, 0.21053314208984375, 0.2183685302734375, 0.22620391845703125, 0.234039306640625, 0.24187469482421875, 0.2497100830078125, 0.25754547119140625, 0.265380859375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 7.0, 5.0, 6.0, 7.0, 4.0, 8.0, 7.0, 23.0, 16.0, 18.0, 11.0, 21.0, 23.0, 25.0, 32.0, 26.0, 24.0, 52.0, 27.0, 38.0, 47.0, 38.0, 1077.0, 46.0, 37.0, 38.0, 41.0, 28.0, 29.0, 28.0, 33.0, 22.0, 25.0, 16.0, 10.0, 18.0, 17.0, 22.0, 19.0, 12.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.19921875, -1.1625823974609375, -1.125946044921875, -1.0893096923828125, -1.05267333984375, -1.0160369873046875, -0.979400634765625, -0.9427642822265625, -0.9061279296875, -0.8694915771484375, -0.832855224609375, -0.7962188720703125, -0.75958251953125, -0.7229461669921875, -0.686309814453125, -0.6496734619140625, -0.613037109375, -0.5764007568359375, -0.539764404296875, -0.5031280517578125, -0.46649169921875, -0.4298553466796875, -0.393218994140625, -0.3565826416015625, -0.3199462890625, -0.2833099365234375, -0.246673583984375, -0.2100372314453125, -0.17340087890625, -0.1367645263671875, -0.100128173828125, -0.0634918212890625, -0.02685546875, 0.0097808837890625, 0.046417236328125, 0.0830535888671875, 0.11968994140625, 0.1563262939453125, 0.192962646484375, 0.2295989990234375, 0.2662353515625, 0.3028717041015625, 0.339508056640625, 0.3761444091796875, 0.41278076171875, 0.4494171142578125, 0.486053466796875, 0.5226898193359375, 0.559326171875, 0.5959625244140625, 0.632598876953125, 0.6692352294921875, 0.70587158203125, 0.7425079345703125, 0.779144287109375, 0.8157806396484375, 0.8524169921875, 0.8890533447265625, 0.925689697265625, 0.9623260498046875, 0.99896240234375, 1.0355987548828125, 1.072235107421875, 1.1088714599609375, 1.1455078125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 8.0, 17.0, 30.0, 49.0, 62.0, 86.0, 166.0, 188.0, 310.0, 452.0, 657.0, 925.0, 1395.0, 2117.0, 3123.0, 4918.0, 7487.0, 12000.0, 19623.0, 32488.0, 56605.0, 101934.0, 185783.0, 1290428.0, 161598.0, 88096.0, 49161.0, 28970.0, 17335.0, 11016.0, 7035.0, 4480.0, 2894.0, 1869.0, 1218.0, 864.0, 555.0, 349.0, 259.0, 187.0, 90.0, 102.0, 59.0, 37.0, 24.0, 21.0, 16.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1943359375, -0.1881427764892578, -0.18194961547851562, -0.17575645446777344, -0.16956329345703125, -0.16337013244628906, -0.15717697143554688, -0.1509838104248047, -0.1447906494140625, -0.1385974884033203, -0.13240432739257812, -0.12621116638183594, -0.12001800537109375, -0.11382484436035156, -0.10763168334960938, -0.10143852233886719, -0.095245361328125, -0.08905220031738281, -0.08285903930664062, -0.07666587829589844, -0.07047271728515625, -0.06427955627441406, -0.058086395263671875, -0.05189323425292969, -0.0457000732421875, -0.03950691223144531, -0.033313751220703125, -0.027120590209960938, -0.02092742919921875, -0.014734268188476562, -0.008541107177734375, -0.0023479461669921875, 0.00384521484375, 0.010038375854492188, 0.016231536865234375, 0.022424697875976562, 0.02861785888671875, 0.03481101989746094, 0.041004180908203125, 0.04719734191894531, 0.0533905029296875, 0.05958366394042969, 0.06577682495117188, 0.07196998596191406, 0.07816314697265625, 0.08435630798339844, 0.09054946899414062, 0.09674263000488281, 0.102935791015625, 0.10912895202636719, 0.11532211303710938, 0.12151527404785156, 0.12770843505859375, 0.13390159606933594, 0.14009475708007812, 0.1462879180908203, 0.1524810791015625, 0.1586742401123047, 0.16486740112304688, 0.17106056213378906, 0.17725372314453125, 0.18344688415527344, 0.18964004516601562, 0.1958332061767578, 0.2020263671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 5.0, 8.0, 13.0, 9.0, 16.0, 22.0, 18.0, 15.0, 27.0, 39.0, 49.0, 48.0, 54.0, 68.0, 55.0, 71.0, 64.0, 61.0, 49.0, 58.0, 51.0, 41.0, 21.0, 20.0, 20.0, 12.0, 20.0, 11.0, 13.0, 5.0, 3.0, 5.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009546279907226562, -0.0009261369705200195, -0.0008976459503173828, -0.0008691549301147461, -0.0008406639099121094, -0.0008121728897094727, -0.0007836818695068359, -0.0007551908493041992, -0.0007266998291015625, -0.0006982088088989258, -0.0006697177886962891, -0.0006412267684936523, -0.0006127357482910156, -0.0005842447280883789, -0.0005557537078857422, -0.0005272626876831055, -0.0004987716674804688, -0.00047028064727783203, -0.0004417896270751953, -0.0004132986068725586, -0.0003848075866699219, -0.00035631656646728516, -0.00032782554626464844, -0.0002993345260620117, -0.000270843505859375, -0.00024235248565673828, -0.00021386146545410156, -0.00018537044525146484, -0.00015687942504882812, -0.0001283884048461914, -9.989738464355469e-05, -7.140636444091797e-05, -4.291534423828125e-05, -1.4424324035644531e-05, 1.4066696166992188e-05, 4.2557716369628906e-05, 7.104873657226562e-05, 9.953975677490234e-05, 0.00012803077697753906, 0.00015652179718017578, 0.0001850128173828125, 0.00021350383758544922, 0.00024199485778808594, 0.00027048587799072266, 0.0002989768981933594, 0.0003274679183959961, 0.0003559589385986328, 0.00038444995880126953, 0.00041294097900390625, 0.00044143199920654297, 0.0004699230194091797, 0.0004984140396118164, 0.0005269050598144531, 0.0005553960800170898, 0.0005838871002197266, 0.0006123781204223633, 0.000640869140625, 0.0006693601608276367, 0.0006978511810302734, 0.0007263422012329102, 0.0007548332214355469, 0.0007833242416381836, 0.0008118152618408203, 0.000840306282043457, 0.0008687973022460938]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 12.0, 12.0, 15.0, 16.0, 31.0, 30.0, 46.0, 72.0, 121.0, 177.0, 384.0, 917.0, 44090.0, 997996.0, 3301.0, 554.0, 292.0, 157.0, 93.0, 56.0, 38.0, 18.0, 26.0, 15.0, 15.0, 18.0, 4.0, 8.0, 10.0, 4.0, 1.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0197601318359375, -0.019107580184936523, -0.018455028533935547, -0.01780247688293457, -0.017149925231933594, -0.016497373580932617, -0.01584482192993164, -0.015192270278930664, -0.014539718627929688, -0.013887166976928711, -0.013234615325927734, -0.012582063674926758, -0.011929512023925781, -0.011276960372924805, -0.010624408721923828, -0.009971857070922852, -0.009319305419921875, -0.008666753768920898, -0.008014202117919922, -0.007361650466918945, -0.006709098815917969, -0.006056547164916992, -0.005403995513916016, -0.004751443862915039, -0.0040988922119140625, -0.003446340560913086, -0.0027937889099121094, -0.002141237258911133, -0.0014886856079101562, -0.0008361339569091797, -0.00018358230590820312, 0.00046896934509277344, 0.00112152099609375, 0.0017740726470947266, 0.002426624298095703, 0.0030791759490966797, 0.0037317276000976562, 0.004384279251098633, 0.005036830902099609, 0.005689382553100586, 0.0063419342041015625, 0.006994485855102539, 0.007647037506103516, 0.008299589157104492, 0.008952140808105469, 0.009604692459106445, 0.010257244110107422, 0.010909795761108398, 0.011562347412109375, 0.012214899063110352, 0.012867450714111328, 0.013520002365112305, 0.014172554016113281, 0.014825105667114258, 0.015477657318115234, 0.01613020896911621, 0.016782760620117188, 0.017435312271118164, 0.01808786392211914, 0.018740415573120117, 0.019392967224121094, 0.02004551887512207, 0.020698070526123047, 0.021350622177124023, 0.022003173828125]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 72.0, 304.0, 390.0, 195.0, 38.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043118110625073314, -0.00036270642885938287, -0.00029423178057186306, -0.00022575711773242801, -0.00015728245489299297, -8.88077775016427e-05, -2.033312921412289e-05, 4.814151907339692e-05, 0.00011661619646474719, 0.00018509085930418223, 0.00025356552214361727, 0.0003220401704311371, 0.00039051484782248735, 0.0004589895252138376, 0.0005274642026051879, 0.0005959388217888772, 0.0006644134991802275, 0.0007328881765715778, 0.0008013627957552671, 0.0008698374731466174, 0.0009383121505379677, 0.001006786827929318, 0.0010752615053206682, 0.0011437360662966967, 0.0012122108601033688, 0.001280685537494719, 0.0013491602148860693, 0.0014176348922774196, 0.0014861095696687698, 0.0015545841306447983, 0.0016230588080361485, 0.0016915334854274988, 0.001760008279234171, 0.0018284829566255212, 0.0018969576340168715, 0.0019654321949929, 0.002033906988799572, 0.0021023815497756004, 0.0021708563435822725, 0.002239330904558301, 0.002307805698364973, 0.0023762802593410015, 0.0024447550531476736, 0.002513229614123702, 0.002581704407930374, 0.0026501789689064026, 0.0027186537627130747, 0.002787128323689103, 0.0028556028846651316, 0.00292407744564116, 0.002992552239447832, 0.0030610268004238605, 0.0031295015942305326, 0.003197976155206561, 0.003266450949013233, 0.0033349255099892616, 0.00340340007096529, 0.0034718746319413185, 0.0035403494257479906, 0.003608823986724019, 0.003677298780530691, 0.0037457733415067196, 0.0038142481353133917, 0.00388272269628942, 0.003951197490096092]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 8.0, 8.0, 10.0, 13.0, 11.0, 17.0, 16.0, 19.0, 30.0, 25.0, 29.0, 18.0, 35.0, 36.0, 30.0, 40.0, 49.0, 43.0, 37.0, 48.0, 40.0, 51.0, 43.0, 39.0, 34.0, 42.0, 28.0, 28.0, 37.0, 22.0, 9.0, 14.0, 16.0, 17.0, 10.0, 3.0, 9.0, 7.0, 5.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004521012306213379, -0.0004372112452983856, -0.00042232125997543335, -0.0004074312746524811, -0.0003925412893295288, -0.00037765130400657654, -0.00036276131868362427, -0.000347871333360672, -0.0003329813480377197, -0.00031809136271476746, -0.0003032013773918152, -0.0002883113920688629, -0.00027342140674591064, -0.0002585314214229584, -0.0002436414361000061, -0.00022875145077705383, -0.00021386146545410156, -0.0001989714801311493, -0.00018408149480819702, -0.00016919150948524475, -0.00015430152416229248, -0.0001394115388393402, -0.00012452155351638794, -0.00010963156819343567, -9.47415828704834e-05, -7.985159754753113e-05, -6.496161222457886e-05, -5.007162690162659e-05, -3.5181641578674316e-05, -2.0291656255722046e-05, -5.401670932769775e-06, 9.488314390182495e-06, 2.4378299713134766e-05, 3.9268285036087036e-05, 5.415827035903931e-05, 6.904825568199158e-05, 8.393824100494385e-05, 9.882822632789612e-05, 0.00011371821165084839, 0.00012860819697380066, 0.00014349818229675293, 0.0001583881676197052, 0.00017327815294265747, 0.00018816813826560974, 0.000203058123588562, 0.00021794810891151428, 0.00023283809423446655, 0.0002477280795574188, 0.0002626180648803711, 0.00027750805020332336, 0.00029239803552627563, 0.0003072880208492279, 0.0003221780061721802, 0.00033706799149513245, 0.0003519579768180847, 0.000366847962141037, 0.00038173794746398926, 0.00039662793278694153, 0.0004115179181098938, 0.00042640790343284607, 0.00044129788875579834, 0.0004561878740787506, 0.0004710778594017029, 0.00048596784472465515, 0.0005008578300476074]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 0.0, 6.0, 6.0, 7.0, 8.0, 12.0, 10.0, 13.0, 13.0, 19.0, 17.0, 22.0, 19.0, 23.0, 25.0, 29.0, 30.0, 37.0, 50.0, 37.0, 38.0, 50.0, 42.0, 31.0, 39.0, 44.0, 47.0, 30.0, 39.0, 36.0, 20.0, 27.0, 24.0, 26.0, 21.0, 16.0, 16.0, 13.0, 10.0, 6.0, 8.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.654296875, -1.596221923828125, -1.53814697265625, -1.480072021484375, -1.4219970703125, -1.363922119140625, -1.30584716796875, -1.247772216796875, -1.189697265625, -1.131622314453125, -1.07354736328125, -1.015472412109375, -0.9573974609375, -0.899322509765625, -0.84124755859375, -0.783172607421875, -0.72509765625, -0.667022705078125, -0.60894775390625, -0.550872802734375, -0.4927978515625, -0.434722900390625, -0.37664794921875, -0.318572998046875, -0.260498046875, -0.202423095703125, -0.14434814453125, -0.086273193359375, -0.0281982421875, 0.029876708984375, 0.08795166015625, 0.146026611328125, 0.2041015625, 0.262176513671875, 0.32025146484375, 0.378326416015625, 0.4364013671875, 0.494476318359375, 0.55255126953125, 0.610626220703125, 0.668701171875, 0.726776123046875, 0.78485107421875, 0.842926025390625, 0.9010009765625, 0.959075927734375, 1.01715087890625, 1.075225830078125, 1.13330078125, 1.191375732421875, 1.24945068359375, 1.307525634765625, 1.3656005859375, 1.423675537109375, 1.48175048828125, 1.539825439453125, 1.597900390625, 1.655975341796875, 1.71405029296875, 1.772125244140625, 1.8302001953125, 1.888275146484375, 1.94635009765625, 2.004425048828125, 2.0625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 6.0, 6.0, 14.0, 15.0, 22.0, 26.0, 45.0, 73.0, 100.0, 197.0, 312.0, 514.0, 996.0, 1812.0, 3534.0, 6667.0, 12217.0, 22818.0, 43328.0, 90691.0, 219645.0, 325898.0, 170288.0, 72083.0, 35679.0, 19255.0, 10399.0, 5458.0, 2883.0, 1521.0, 811.0, 477.0, 246.0, 160.0, 108.0, 52.0, 52.0, 31.0, 21.0, 20.0, 12.0, 15.0, 8.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.779296875, -1.7259521484375, -1.672607421875, -1.6192626953125, -1.56591796875, -1.5125732421875, -1.459228515625, -1.4058837890625, -1.3525390625, -1.2991943359375, -1.245849609375, -1.1925048828125, -1.13916015625, -1.0858154296875, -1.032470703125, -0.9791259765625, -0.92578125, -0.8724365234375, -0.819091796875, -0.7657470703125, -0.71240234375, -0.6590576171875, -0.605712890625, -0.5523681640625, -0.4990234375, -0.4456787109375, -0.392333984375, -0.3389892578125, -0.28564453125, -0.2322998046875, -0.178955078125, -0.1256103515625, -0.072265625, -0.0189208984375, 0.034423828125, 0.0877685546875, 0.14111328125, 0.1944580078125, 0.247802734375, 0.3011474609375, 0.3544921875, 0.4078369140625, 0.461181640625, 0.5145263671875, 0.56787109375, 0.6212158203125, 0.674560546875, 0.7279052734375, 0.78125, 0.8345947265625, 0.887939453125, 0.9412841796875, 0.99462890625, 1.0479736328125, 1.101318359375, 1.1546630859375, 1.2080078125, 1.2613525390625, 1.314697265625, 1.3680419921875, 1.42138671875, 1.4747314453125, 1.528076171875, 1.5814208984375, 1.634765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 9.0, 9.0, 14.0, 14.0, 14.0, 10.0, 18.0, 19.0, 32.0, 31.0, 34.0, 40.0, 24.0, 44.0, 45.0, 69.0, 96.0, 195.0, 1428.0, 273.0, 144.0, 73.0, 59.0, 41.0, 27.0, 28.0, 24.0, 31.0, 25.0, 21.0, 28.0, 18.0, 18.0, 13.0, 11.0, 5.0, 12.0, 7.0, 6.0, 5.0, 8.0, 3.0, 1.0, 0.0, 4.0, 4.0, 0.0, 3.0, 1.0], "bins": [-7.39453125, -7.1751708984375, -6.955810546875, -6.7364501953125, -6.51708984375, -6.2977294921875, -6.078369140625, -5.8590087890625, -5.6396484375, -5.4202880859375, -5.200927734375, -4.9815673828125, -4.76220703125, -4.5428466796875, -4.323486328125, -4.1041259765625, -3.884765625, -3.6654052734375, -3.446044921875, -3.2266845703125, -3.00732421875, -2.7879638671875, -2.568603515625, -2.3492431640625, -2.1298828125, -1.9105224609375, -1.691162109375, -1.4718017578125, -1.25244140625, -1.0330810546875, -0.813720703125, -0.5943603515625, -0.375, -0.1556396484375, 0.063720703125, 0.2830810546875, 0.50244140625, 0.7218017578125, 0.941162109375, 1.1605224609375, 1.3798828125, 1.5992431640625, 1.818603515625, 2.0379638671875, 2.25732421875, 2.4766845703125, 2.696044921875, 2.9154052734375, 3.134765625, 3.3541259765625, 3.573486328125, 3.7928466796875, 4.01220703125, 4.2315673828125, 4.450927734375, 4.6702880859375, 4.8896484375, 5.1090087890625, 5.328369140625, 5.5477294921875, 5.76708984375, 5.9864501953125, 6.205810546875, 6.4251708984375, 6.64453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 2.0, 15.0, 18.0, 20.0, 27.0, 31.0, 55.0, 83.0, 146.0, 211.0, 370.0, 979.0, 14682.0, 3114621.0, 12549.0, 922.0, 352.0, 208.0, 103.0, 80.0, 62.0, 29.0, 26.0, 23.0, 16.0, 11.0, 10.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.6708984375, -26.732421875, -25.7939453125, -24.85546875, -23.9169921875, -22.978515625, -22.0400390625, -21.1015625, -20.1630859375, -19.224609375, -18.2861328125, -17.34765625, -16.4091796875, -15.470703125, -14.5322265625, -13.59375, -12.6552734375, -11.716796875, -10.7783203125, -9.83984375, -8.9013671875, -7.962890625, -7.0244140625, -6.0859375, -5.1474609375, -4.208984375, -3.2705078125, -2.33203125, -1.3935546875, -0.455078125, 0.4833984375, 1.421875, 2.3603515625, 3.298828125, 4.2373046875, 5.17578125, 6.1142578125, 7.052734375, 7.9912109375, 8.9296875, 9.8681640625, 10.806640625, 11.7451171875, 12.68359375, 13.6220703125, 14.560546875, 15.4990234375, 16.4375, 17.3759765625, 18.314453125, 19.2529296875, 20.19140625, 21.1298828125, 22.068359375, 23.0068359375, 23.9453125, 24.8837890625, 25.822265625, 26.7607421875, 27.69921875, 28.6376953125, 29.576171875, 30.5146484375, 31.453125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 96.0, 681.0, 233.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.49155330657959, -13.164342880249023, -10.83713150024414, -8.509920120239258, -6.182709693908691, -3.8554983139038086, -1.5282878875732422, 0.7989225387573242, 3.126133918762207, 5.453344821929932, 7.780555725097656, 10.107767105102539, 12.434977531433105, 14.762188911437988, 17.089399337768555, 19.416610717773438, 21.743820190429688, 24.07103157043457, 26.398242950439453, 28.725452423095703, 31.052663803100586, 33.37987518310547, 35.70708465576172, 38.03429412841797, 40.361507415771484, 42.688716888427734, 45.01593017578125, 47.3431396484375, 49.67034912109375, 51.997562408447266, 54.324771881103516, 56.65198516845703, 58.97920227050781, 61.30641174316406, 63.63362503051758, 65.9608383178711, 68.28804779052734, 70.6152572631836, 72.94246673583984, 75.2696762084961, 77.59689331054688, 79.92410278320312, 82.25131225585938, 84.57852935791016, 86.9057388305664, 89.23294830322266, 91.5601577758789, 93.88736724853516, 96.2145767211914, 98.54178619384766, 100.8689956665039, 103.19621276855469, 105.52342224121094, 107.85063171386719, 110.17784118652344, 112.50505065917969, 114.83226013183594, 117.15946960449219, 119.48667907714844, 121.81389617919922, 124.14110565185547, 126.46831512451172, 128.7955322265625, 131.12274169921875, 133.449951171875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 9.0, 12.0, 15.0, 9.0, 22.0, 17.0, 19.0, 16.0, 18.0, 27.0, 26.0, 27.0, 33.0, 37.0, 37.0, 33.0, 31.0, 50.0, 26.0, 37.0, 35.0, 38.0, 32.0, 33.0, 32.0, 28.0, 23.0, 27.0, 36.0, 34.0, 24.0, 18.0, 25.0, 22.0, 16.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0], "bins": [-21.65027618408203, -21.046649932861328, -20.443025588989258, -19.839399337768555, -19.235774993896484, -18.63214874267578, -18.02852439880371, -17.424898147583008, -16.821273803710938, -16.217647552490234, -15.614023208618164, -15.010397911071777, -14.40677261352539, -13.803146362304688, -13.1995210647583, -12.595895767211914, -11.992269515991211, -11.388644218444824, -10.785018920898438, -10.18139362335205, -9.577768325805664, -8.974142074584961, -8.370516777038574, -7.7668914794921875, -7.163266181945801, -6.559640884399414, -5.956015586853027, -5.352389812469482, -4.748764514923096, -4.145139217376709, -3.541513681411743, -2.9378881454467773, -2.3342628479003906, -1.7306374311447144, -1.127012014389038, -0.5233865976333618, 0.08023881912231445, 0.6838641166687012, 1.287489652633667, 1.8911151885986328, 2.4947404861450195, 3.0983657836914062, 3.701991319656372, 4.305616855621338, 4.909242153167725, 5.512867450714111, 6.116493225097656, 6.720118522644043, 7.32374382019043, 7.927369117736816, 8.530994415283203, 9.13461971282959, 9.738245010375977, 10.34187126159668, 10.945496559143066, 11.549121856689453, 12.15274715423584, 12.756372451782227, 13.359997749328613, 13.963623046875, 14.567249298095703, 15.170873641967773, 15.774499893188477, 16.378124237060547, 16.98175048828125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 2.0, 5.0, 8.0, 7.0, 7.0, 5.0, 12.0, 15.0, 12.0, 14.0, 19.0, 32.0, 19.0, 27.0, 27.0, 37.0, 23.0, 31.0, 41.0, 47.0, 39.0, 38.0, 53.0, 49.0, 36.0, 39.0, 27.0, 44.0, 50.0, 29.0, 29.0, 19.0, 26.0, 19.0, 14.0, 17.0, 12.0, 11.0, 15.0, 6.0, 5.0, 4.0, 4.0, 2.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9814453125, -1.9159698486328125, -1.850494384765625, -1.7850189208984375, -1.71954345703125, -1.6540679931640625, -1.588592529296875, -1.5231170654296875, -1.4576416015625, -1.3921661376953125, -1.326690673828125, -1.2612152099609375, -1.19573974609375, -1.1302642822265625, -1.064788818359375, -0.9993133544921875, -0.933837890625, -0.8683624267578125, -0.802886962890625, -0.7374114990234375, -0.67193603515625, -0.6064605712890625, -0.540985107421875, -0.4755096435546875, -0.4100341796875, -0.3445587158203125, -0.279083251953125, -0.2136077880859375, -0.14813232421875, -0.0826568603515625, -0.017181396484375, 0.0482940673828125, 0.11376953125, 0.1792449951171875, 0.244720458984375, 0.3101959228515625, 0.37567138671875, 0.4411468505859375, 0.506622314453125, 0.5720977783203125, 0.6375732421875, 0.7030487060546875, 0.768524169921875, 0.8339996337890625, 0.89947509765625, 0.9649505615234375, 1.030426025390625, 1.0959014892578125, 1.161376953125, 1.2268524169921875, 1.292327880859375, 1.3578033447265625, 1.42327880859375, 1.4887542724609375, 1.554229736328125, 1.6197052001953125, 1.6851806640625, 1.7506561279296875, 1.816131591796875, 1.8816070556640625, 1.94708251953125, 2.0125579833984375, 2.078033447265625, 2.1435089111328125, 2.208984375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 7.0, 12.0, 8.0, 12.0, 9.0, 15.0, 23.0, 26.0, 53.0, 64.0, 103.0, 179.0, 304.0, 768.0, 2298.0, 10786.0, 75396.0, 616280.0, 2169328.0, 1132248.0, 159843.0, 20477.0, 3820.0, 1115.0, 445.0, 228.0, 136.0, 88.0, 64.0, 35.0, 29.0, 17.0, 5.0, 9.0, 9.0, 14.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.24444580078125, -4.1060791015625, -3.96771240234375, -3.829345703125, -3.69097900390625, -3.5526123046875, -3.41424560546875, -3.27587890625, -3.13751220703125, -2.9991455078125, -2.86077880859375, -2.722412109375, -2.58404541015625, -2.4456787109375, -2.30731201171875, -2.1689453125, -2.03057861328125, -1.8922119140625, -1.75384521484375, -1.615478515625, -1.47711181640625, -1.3387451171875, -1.20037841796875, -1.06201171875, -0.92364501953125, -0.7852783203125, -0.64691162109375, -0.508544921875, -0.37017822265625, -0.2318115234375, -0.09344482421875, 0.044921875, 0.18328857421875, 0.3216552734375, 0.46002197265625, 0.598388671875, 0.73675537109375, 0.8751220703125, 1.01348876953125, 1.15185546875, 1.29022216796875, 1.4285888671875, 1.56695556640625, 1.705322265625, 1.84368896484375, 1.9820556640625, 2.12042236328125, 2.2587890625, 2.39715576171875, 2.5355224609375, 2.67388916015625, 2.812255859375, 2.95062255859375, 3.0889892578125, 3.22735595703125, 3.36572265625, 3.50408935546875, 3.6424560546875, 3.78082275390625, 3.919189453125, 4.05755615234375, 4.1959228515625, 4.33428955078125, 4.47265625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 8.0, 10.0, 22.0, 31.0, 56.0, 69.0, 97.0, 172.0, 216.0, 281.0, 384.0, 461.0, 486.0, 459.0, 379.0, 304.0, 195.0, 129.0, 98.0, 73.0, 40.0, 28.0, 12.0, 23.0, 12.0, 7.0, 6.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.32403564453125, -5.1363525390625, -4.94866943359375, -4.760986328125, -4.57330322265625, -4.3856201171875, -4.19793701171875, -4.01025390625, -3.82257080078125, -3.6348876953125, -3.44720458984375, -3.259521484375, -3.07183837890625, -2.8841552734375, -2.69647216796875, -2.5087890625, -2.32110595703125, -2.1334228515625, -1.94573974609375, -1.758056640625, -1.57037353515625, -1.3826904296875, -1.19500732421875, -1.00732421875, -0.81964111328125, -0.6319580078125, -0.44427490234375, -0.256591796875, -0.06890869140625, 0.1187744140625, 0.30645751953125, 0.494140625, 0.68182373046875, 0.8695068359375, 1.05718994140625, 1.244873046875, 1.43255615234375, 1.6202392578125, 1.80792236328125, 1.99560546875, 2.18328857421875, 2.3709716796875, 2.55865478515625, 2.746337890625, 2.93402099609375, 3.1217041015625, 3.30938720703125, 3.4970703125, 3.68475341796875, 3.8724365234375, 4.06011962890625, 4.247802734375, 4.43548583984375, 4.6231689453125, 4.81085205078125, 4.99853515625, 5.18621826171875, 5.3739013671875, 5.56158447265625, 5.749267578125, 5.93695068359375, 6.1246337890625, 6.31231689453125, 6.5]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 4.0, 6.0, 9.0, 12.0, 11.0, 25.0, 40.0, 47.0, 92.0, 115.0, 188.0, 266.0, 558.0, 1612.0, 12970.0, 397612.0, 3414644.0, 351602.0, 11605.0, 1512.0, 509.0, 295.0, 180.0, 115.0, 81.0, 74.0, 34.0, 15.0, 16.0, 16.0, 9.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.7249755859375, -11.364013671875, -11.0030517578125, -10.64208984375, -10.2811279296875, -9.920166015625, -9.5592041015625, -9.1982421875, -8.8372802734375, -8.476318359375, -8.1153564453125, -7.75439453125, -7.3934326171875, -7.032470703125, -6.6715087890625, -6.310546875, -5.9495849609375, -5.588623046875, -5.2276611328125, -4.86669921875, -4.5057373046875, -4.144775390625, -3.7838134765625, -3.4228515625, -3.0618896484375, -2.700927734375, -2.3399658203125, -1.97900390625, -1.6180419921875, -1.257080078125, -0.8961181640625, -0.53515625, -0.1741943359375, 0.186767578125, 0.5477294921875, 0.90869140625, 1.2696533203125, 1.630615234375, 1.9915771484375, 2.3525390625, 2.7135009765625, 3.074462890625, 3.4354248046875, 3.79638671875, 4.1573486328125, 4.518310546875, 4.8792724609375, 5.240234375, 5.6011962890625, 5.962158203125, 6.3231201171875, 6.68408203125, 7.0450439453125, 7.406005859375, 7.7669677734375, 8.1279296875, 8.4888916015625, 8.849853515625, 9.2108154296875, 9.57177734375, 9.9327392578125, 10.293701171875, 10.6546630859375, 11.015625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 12.0, 24.0, 58.0, 107.0, 172.0, 194.0, 185.0, 127.0, 77.0, 35.0, 14.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.13328552246094, -35.83259582519531, -34.53190231323242, -33.2312126159668, -31.93052101135254, -30.62982940673828, -29.329137802124023, -28.028446197509766, -26.72775650024414, -25.427064895629883, -24.126373291015625, -22.82568359375, -21.524991989135742, -20.224300384521484, -18.923608779907227, -17.62291717529297, -16.32222557067871, -15.021533966064453, -13.720843315124512, -12.420151710510254, -11.119461059570312, -9.818769454956055, -8.518077850341797, -7.2173871994018555, -5.916695594787598, -4.616004467010498, -3.3153131008148193, -2.0146217346191406, -0.713930606842041, 0.5867605209350586, 1.8874521255493164, 3.188142776489258, 4.488834381103516, 5.789525508880615, 7.090216636657715, 8.390908241271973, 9.691598892211914, 10.992290496826172, 12.29298210144043, 13.593672752380371, 14.894364356994629, 16.19505500793457, 17.495746612548828, 18.796438217163086, 20.097129821777344, 21.39781951904297, 22.69851303100586, 23.999202728271484, 25.299894332885742, 26.6005859375, 27.901277542114258, 29.201969146728516, 30.50265884399414, 31.8033504486084, 33.104042053222656, 34.40473175048828, 35.70542526245117, 37.0061149597168, 38.30680847167969, 39.60749816894531, 40.9081916809082, 42.20888137817383, 43.50957489013672, 44.810264587402344, 46.11095428466797]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 15.0, 20.0, 18.0, 21.0, 22.0, 26.0, 19.0, 29.0, 29.0, 33.0, 25.0, 48.0, 40.0, 42.0, 32.0, 37.0, 55.0, 41.0, 32.0, 44.0, 34.0, 35.0, 31.0, 31.0, 22.0, 24.0, 25.0, 26.0, 19.0, 19.0, 17.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 9.0, 1.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.19491195678711, -15.685200691223145, -15.17548942565918, -14.665778160095215, -14.15606689453125, -13.646355628967285, -13.13664436340332, -12.626934051513672, -12.11722183227539, -11.607510566711426, -11.097799301147461, -10.588088035583496, -10.078376770019531, -9.568665504455566, -9.058954238891602, -8.549243927001953, -8.039532661437988, -7.529821395874023, -7.020110130310059, -6.510398864746094, -6.000687599182129, -5.490976333618164, -4.981265544891357, -4.471554279327393, -3.9618430137634277, -3.452131748199463, -2.942420482635498, -2.4327094554901123, -1.9229981899261475, -1.4132869243621826, -0.9035758972167969, -0.39386463165283203, 0.11584663391113281, 0.6255578398704529, 1.135269045829773, 1.6449801921844482, 2.154691457748413, 2.664402723312378, 3.1741137504577637, 3.6838250160217285, 4.193536281585693, 4.703247547149658, 5.212958812713623, 5.72266960144043, 6.2323808670043945, 6.742092132568359, 7.251803398132324, 7.761514663696289, 8.271225929260254, 8.780937194824219, 9.290648460388184, 9.800359725952148, 10.310070991516113, 10.819782257080078, 11.329492568969727, 11.839204788208008, 12.348915100097656, 12.858626365661621, 13.368337631225586, 13.87804889678955, 14.387760162353516, 14.89747142791748, 15.407182693481445, 15.916893005371094, 16.426605224609375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 12.0, 13.0, 19.0, 22.0, 13.0, 18.0, 22.0, 36.0, 23.0, 34.0, 31.0, 46.0, 43.0, 46.0, 36.0, 53.0, 56.0, 44.0, 53.0, 34.0, 35.0, 33.0, 32.0, 22.0, 28.0, 30.0, 19.0, 23.0, 19.0, 11.0, 12.0, 14.0, 5.0, 3.0, 8.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.9627685546875, -1.894287109375, -1.8258056640625, -1.75732421875, -1.6888427734375, -1.620361328125, -1.5518798828125, -1.4833984375, -1.4149169921875, -1.346435546875, -1.2779541015625, -1.20947265625, -1.1409912109375, -1.072509765625, -1.0040283203125, -0.935546875, -0.8670654296875, -0.798583984375, -0.7301025390625, -0.66162109375, -0.5931396484375, -0.524658203125, -0.4561767578125, -0.3876953125, -0.3192138671875, -0.250732421875, -0.1822509765625, -0.11376953125, -0.0452880859375, 0.023193359375, 0.0916748046875, 0.16015625, 0.2286376953125, 0.297119140625, 0.3656005859375, 0.43408203125, 0.5025634765625, 0.571044921875, 0.6395263671875, 0.7080078125, 0.7764892578125, 0.844970703125, 0.9134521484375, 0.98193359375, 1.0504150390625, 1.118896484375, 1.1873779296875, 1.255859375, 1.3243408203125, 1.392822265625, 1.4613037109375, 1.52978515625, 1.5982666015625, 1.666748046875, 1.7352294921875, 1.8037109375, 1.8721923828125, 1.940673828125, 2.0091552734375, 2.07763671875, 2.1461181640625, 2.214599609375, 2.2830810546875, 2.3515625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 6.0, 12.0, 7.0, 24.0, 26.0, 43.0, 52.0, 86.0, 121.0, 176.0, 272.0, 351.0, 531.0, 707.0, 920.0, 1200.0, 1723.0, 2340.0, 3199.0, 4396.0, 5937.0, 8251.0, 11825.0, 17268.0, 25045.0, 37923.0, 58458.0, 93772.0, 151606.0, 197186.0, 151366.0, 93065.0, 57825.0, 38042.0, 25449.0, 17096.0, 11863.0, 8216.0, 5936.0, 4360.0, 3289.0, 2283.0, 1784.0, 1266.0, 919.0, 684.0, 533.0, 340.0, 259.0, 163.0, 110.0, 93.0, 64.0, 34.0, 23.0, 20.0, 6.0, 6.0, 7.0, 4.0, 4.0], "bins": [-0.2230224609375, -0.21615982055664062, -0.20929718017578125, -0.20243453979492188, -0.1955718994140625, -0.18870925903320312, -0.18184661865234375, -0.17498397827148438, -0.168121337890625, -0.16125869750976562, -0.15439605712890625, -0.14753341674804688, -0.1406707763671875, -0.13380813598632812, -0.12694549560546875, -0.12008285522460938, -0.11322021484375, -0.10635757446289062, -0.09949493408203125, -0.09263229370117188, -0.0857696533203125, -0.07890701293945312, -0.07204437255859375, -0.06518173217773438, -0.058319091796875, -0.051456451416015625, -0.04459381103515625, -0.037731170654296875, -0.0308685302734375, -0.024005889892578125, -0.01714324951171875, -0.010280609130859375, -0.00341796875, 0.003444671630859375, 0.01030731201171875, 0.017169952392578125, 0.0240325927734375, 0.030895233154296875, 0.03775787353515625, 0.044620513916015625, 0.051483154296875, 0.058345794677734375, 0.06520843505859375, 0.07207107543945312, 0.0789337158203125, 0.08579635620117188, 0.09265899658203125, 0.09952163696289062, 0.10638427734375, 0.11324691772460938, 0.12010955810546875, 0.12697219848632812, 0.1338348388671875, 0.14069747924804688, 0.14756011962890625, 0.15442276000976562, 0.161285400390625, 0.16814804077148438, 0.17501068115234375, 0.18187332153320312, 0.1887359619140625, 0.19559860229492188, 0.20246124267578125, 0.20932388305664062, 0.2161865234375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 4.0, 10.0, 8.0, 17.0, 13.0, 21.0, 22.0, 30.0, 22.0, 26.0, 39.0, 37.0, 29.0, 45.0, 43.0, 42.0, 37.0, 41.0, 1064.0, 33.0, 41.0, 33.0, 44.0, 40.0, 28.0, 26.0, 31.0, 27.0, 20.0, 17.0, 20.0, 12.0, 17.0, 13.0, 8.0, 9.0, 6.0, 9.0, 9.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-1.4765625, -1.43438720703125, -1.3922119140625, -1.35003662109375, -1.307861328125, -1.26568603515625, -1.2235107421875, -1.18133544921875, -1.13916015625, -1.09698486328125, -1.0548095703125, -1.01263427734375, -0.970458984375, -0.92828369140625, -0.8861083984375, -0.84393310546875, -0.8017578125, -0.75958251953125, -0.7174072265625, -0.67523193359375, -0.633056640625, -0.59088134765625, -0.5487060546875, -0.50653076171875, -0.46435546875, -0.42218017578125, -0.3800048828125, -0.33782958984375, -0.295654296875, -0.25347900390625, -0.2113037109375, -0.16912841796875, -0.126953125, -0.08477783203125, -0.0426025390625, -0.00042724609375, 0.041748046875, 0.08392333984375, 0.1260986328125, 0.16827392578125, 0.21044921875, 0.25262451171875, 0.2947998046875, 0.33697509765625, 0.379150390625, 0.42132568359375, 0.4635009765625, 0.50567626953125, 0.5478515625, 0.59002685546875, 0.6322021484375, 0.67437744140625, 0.716552734375, 0.75872802734375, 0.8009033203125, 0.84307861328125, 0.88525390625, 0.92742919921875, 0.9696044921875, 1.01177978515625, 1.053955078125, 1.09613037109375, 1.1383056640625, 1.18048095703125, 1.22265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 8.0, 8.0, 15.0, 24.0, 27.0, 43.0, 61.0, 81.0, 113.0, 177.0, 225.0, 364.0, 430.0, 617.0, 915.0, 1299.0, 1775.0, 2525.0, 3736.0, 5452.0, 7891.0, 11719.0, 17535.0, 26914.0, 42264.0, 66631.0, 108256.0, 168829.0, 1244070.0, 140097.0, 86953.0, 54551.0, 34594.0, 22237.0, 14992.0, 9844.0, 6634.0, 4579.0, 3250.0, 2206.0, 1569.0, 1063.0, 750.0, 544.0, 376.0, 266.0, 207.0, 135.0, 92.0, 70.0, 43.0, 24.0, 26.0, 13.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1856689453125, -0.1799163818359375, -0.174163818359375, -0.1684112548828125, -0.16265869140625, -0.1569061279296875, -0.151153564453125, -0.1454010009765625, -0.1396484375, -0.1338958740234375, -0.128143310546875, -0.1223907470703125, -0.11663818359375, -0.1108856201171875, -0.105133056640625, -0.0993804931640625, -0.0936279296875, -0.0878753662109375, -0.082122802734375, -0.0763702392578125, -0.07061767578125, -0.0648651123046875, -0.059112548828125, -0.0533599853515625, -0.047607421875, -0.0418548583984375, -0.036102294921875, -0.0303497314453125, -0.02459716796875, -0.0188446044921875, -0.013092041015625, -0.0073394775390625, -0.0015869140625, 0.0041656494140625, 0.009918212890625, 0.0156707763671875, 0.02142333984375, 0.0271759033203125, 0.032928466796875, 0.0386810302734375, 0.04443359375, 0.0501861572265625, 0.055938720703125, 0.0616912841796875, 0.06744384765625, 0.0731964111328125, 0.078948974609375, 0.0847015380859375, 0.0904541015625, 0.0962066650390625, 0.101959228515625, 0.1077117919921875, 0.11346435546875, 0.1192169189453125, 0.124969482421875, 0.1307220458984375, 0.136474609375, 0.1422271728515625, 0.147979736328125, 0.1537322998046875, 0.15948486328125, 0.1652374267578125, 0.170989990234375, 0.1767425537109375, 0.1824951171875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 6.0, 5.0, 4.0, 11.0, 18.0, 13.0, 15.0, 28.0, 23.0, 30.0, 48.0, 65.0, 87.0, 104.0, 109.0, 85.0, 68.0, 65.0, 47.0, 36.0, 25.0, 20.0, 19.0, 21.0, 15.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010929107666015625, -0.0010569244623184204, -0.0010209381580352783, -0.0009849518537521362, -0.0009489655494689941, -0.000912979245185852, -0.00087699294090271, -0.0008410066366195679, -0.0008050203323364258, -0.0007690340280532837, -0.0007330477237701416, -0.0006970614194869995, -0.0006610751152038574, -0.0006250888109207153, -0.0005891025066375732, -0.0005531162023544312, -0.0005171298980712891, -0.00048114359378814697, -0.0004451572895050049, -0.0004091709852218628, -0.0003731846809387207, -0.0003371983766555786, -0.0003012120723724365, -0.00026522576808929443, -0.00022923946380615234, -0.00019325315952301025, -0.00015726685523986816, -0.00012128055095672607, -8.529424667358398e-05, -4.9307942390441895e-05, -1.3321638107299805e-05, 2.2664666175842285e-05, 5.8650970458984375e-05, 9.463727474212646e-05, 0.00013062357902526855, 0.00016660988330841064, 0.00020259618759155273, 0.00023858249187469482, 0.0002745687961578369, 0.000310555100440979, 0.0003465414047241211, 0.0003825277090072632, 0.0004185140132904053, 0.00045450031757354736, 0.0004904866218566895, 0.0005264729261398315, 0.0005624592304229736, 0.0005984455347061157, 0.0006344318389892578, 0.0006704181432723999, 0.000706404447555542, 0.0007423907518386841, 0.0007783770561218262, 0.0008143633604049683, 0.0008503496646881104, 0.0008863359689712524, 0.0009223222732543945, 0.0009583085775375366, 0.0009942948818206787, 0.0010302811861038208, 0.0010662674903869629, 0.001102253794670105, 0.001138240098953247, 0.0011742264032363892, 0.0012102127075195312]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 5.0, 15.0, 13.0, 27.0, 31.0, 40.0, 53.0, 91.0, 178.0, 281.0, 709.0, 15805.0, 1026283.0, 3773.0, 587.0, 245.0, 141.0, 61.0, 50.0, 40.0, 33.0, 17.0, 16.0, 12.0, 10.0, 5.0, 3.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0250701904296875, -0.024319171905517578, -0.023568153381347656, -0.022817134857177734, -0.022066116333007812, -0.02131509780883789, -0.02056407928466797, -0.019813060760498047, -0.019062042236328125, -0.018311023712158203, -0.01756000518798828, -0.01680898666381836, -0.016057968139648438, -0.015306949615478516, -0.014555931091308594, -0.013804912567138672, -0.01305389404296875, -0.012302875518798828, -0.011551856994628906, -0.010800838470458984, -0.010049819946289062, -0.00929880142211914, -0.008547782897949219, -0.007796764373779297, -0.007045745849609375, -0.006294727325439453, -0.005543708801269531, -0.004792690277099609, -0.0040416717529296875, -0.0032906532287597656, -0.0025396347045898438, -0.0017886161804199219, -0.00103759765625, -0.0002865791320800781, 0.00046443939208984375, 0.0012154579162597656, 0.0019664764404296875, 0.0027174949645996094, 0.0034685134887695312, 0.004219532012939453, 0.004970550537109375, 0.005721569061279297, 0.006472587585449219, 0.007223606109619141, 0.007974624633789062, 0.008725643157958984, 0.009476661682128906, 0.010227680206298828, 0.01097869873046875, 0.011729717254638672, 0.012480735778808594, 0.013231754302978516, 0.013982772827148438, 0.01473379135131836, 0.015484809875488281, 0.016235828399658203, 0.016986846923828125, 0.017737865447998047, 0.01848888397216797, 0.01923990249633789, 0.019990921020507812, 0.020741939544677734, 0.021492958068847656, 0.022243976593017578, 0.0229949951171875]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 14.0, 130.0, 458.0, 361.0, 51.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009727643919177353, -0.0008826218545436859, -0.0007924793171696365, -0.0007023367797955871, -0.0006121943006291986, -0.0005220517050474882, -0.0004319092258810997, -0.0003417666885070503, -0.00025162415113300085, -0.00016148161375895143, -7.133909093681723e-05, 1.8803431885316968e-05, 0.00010894596925936639, 0.00019908850663341582, 0.0002892310149036348, 0.0003793735522776842, 0.00046951608965173364, 0.0005596586270257831, 0.0006498011643998325, 0.0007399437017738819, 0.0008300861809402704, 0.0009202287765219808, 0.0010103712556883693, 0.0011005138512700796, 0.0011906563304364681, 0.0012807988096028566, 0.001370941405184567, 0.0014610838843509555, 0.0015512264799326658, 0.0016413689590990543, 0.0017315114382654428, 0.0018216540338471532, 0.0019117963965982199, 0.0020019388757646084, 0.002092081354930997, 0.002182224066928029, 0.0022723665460944176, 0.002362509025260806, 0.0024526515044271946, 0.0025427942164242268, 0.0026329366955906153, 0.002723079174757004, 0.0028132216539233923, 0.0029033643659204245, 0.002993506845086813, 0.0030836493242532015, 0.00317379180341959, 0.003263934515416622, 0.003354076761752367, 0.0034442192409187555, 0.003534361720085144, 0.003624504432082176, 0.0037146469112485647, 0.0038047893904149532, 0.0038949318695813417, 0.00398507434874773, 0.004075217060744762, 0.004165359772741795, 0.0042555020190775394, 0.004345644731074572, 0.0044357869774103165, 0.004525929689407349, 0.004616072401404381, 0.004706214647740126, 0.004796357359737158]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 10.0, 9.0, 3.0, 18.0, 18.0, 18.0, 20.0, 27.0, 32.0, 39.0, 41.0, 45.0, 27.0, 49.0, 59.0, 49.0, 52.0, 59.0, 60.0, 52.0, 41.0, 53.0, 33.0, 30.0, 36.0, 22.0, 20.0, 18.0, 21.0, 17.0, 10.0, 3.0, 2.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006871223449707031, -0.0006687510758638382, -0.0006503798067569733, -0.0006320085376501083, -0.0006136372685432434, -0.0005952659994363785, -0.0005768947303295135, -0.0005585234612226486, -0.0005401521921157837, -0.0005217809230089188, -0.0005034096539020538, -0.0004850383847951889, -0.000466667115688324, -0.00044829584658145905, -0.0004299245774745941, -0.0004115533083677292, -0.00039318203926086426, -0.00037481077015399933, -0.0003564395010471344, -0.00033806823194026947, -0.00031969696283340454, -0.0003013256937265396, -0.0002829544246196747, -0.00026458315551280975, -0.0002462118864059448, -0.0002278406172990799, -0.00020946934819221497, -0.00019109807908535004, -0.0001727268099784851, -0.00015435554087162018, -0.00013598427176475525, -0.00011761300265789032, -9.924173355102539e-05, -8.087046444416046e-05, -6.249919533729553e-05, -4.41279262304306e-05, -2.5756657123565674e-05, -7.385388016700745e-06, 1.0985881090164185e-05, 2.9357150197029114e-05, 4.772841930389404e-05, 6.609968841075897e-05, 8.44709575176239e-05, 0.00010284222662448883, 0.00012121349573135376, 0.0001395847648382187, 0.00015795603394508362, 0.00017632730305194855, 0.00019469857215881348, 0.0002130698412656784, 0.00023144111037254333, 0.00024981237947940826, 0.0002681836485862732, 0.0002865549176931381, 0.00030492618680000305, 0.000323297455906868, 0.0003416687250137329, 0.00036003999412059784, 0.00037841126322746277, 0.0003967825323343277, 0.0004151538014411926, 0.00043352507054805756, 0.0004518963396549225, 0.0004702676087617874, 0.0004886388778686523]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 9.0, 6.0, 8.0, 7.0, 12.0, 13.0, 19.0, 22.0, 13.0, 18.0, 22.0, 36.0, 23.0, 34.0, 31.0, 46.0, 45.0, 44.0, 36.0, 54.0, 55.0, 44.0, 53.0, 34.0, 35.0, 33.0, 32.0, 23.0, 28.0, 30.0, 18.0, 24.0, 18.0, 11.0, 12.0, 14.0, 5.0, 3.0, 8.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.962738037109375, -1.89422607421875, -1.825714111328125, -1.7572021484375, -1.688690185546875, -1.62017822265625, -1.551666259765625, -1.483154296875, -1.414642333984375, -1.34613037109375, -1.277618408203125, -1.2091064453125, -1.140594482421875, -1.07208251953125, -1.003570556640625, -0.93505859375, -0.866546630859375, -0.79803466796875, -0.729522705078125, -0.6610107421875, -0.592498779296875, -0.52398681640625, -0.455474853515625, -0.386962890625, -0.318450927734375, -0.24993896484375, -0.181427001953125, -0.1129150390625, -0.044403076171875, 0.02410888671875, 0.092620849609375, 0.1611328125, 0.229644775390625, 0.29815673828125, 0.366668701171875, 0.4351806640625, 0.503692626953125, 0.57220458984375, 0.640716552734375, 0.709228515625, 0.777740478515625, 0.84625244140625, 0.914764404296875, 0.9832763671875, 1.051788330078125, 1.12030029296875, 1.188812255859375, 1.25732421875, 1.325836181640625, 1.39434814453125, 1.462860107421875, 1.5313720703125, 1.599884033203125, 1.66839599609375, 1.736907958984375, 1.805419921875, 1.873931884765625, 1.94244384765625, 2.010955810546875, 2.0794677734375, 2.147979736328125, 2.21649169921875, 2.285003662109375, 2.353515625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 22.0, 22.0, 42.0, 60.0, 98.0, 136.0, 241.0, 507.0, 953.0, 2226.0, 5386.0, 12818.0, 29801.0, 69575.0, 166032.0, 315143.0, 250713.0, 112400.0, 46729.0, 20403.0, 8569.0, 3505.0, 1589.0, 717.0, 349.0, 196.0, 127.0, 76.0, 42.0, 29.0, 15.0, 11.0, 9.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.53021240234375, -2.4530029296875, -2.37579345703125, -2.298583984375, -2.22137451171875, -2.1441650390625, -2.06695556640625, -1.98974609375, -1.91253662109375, -1.8353271484375, -1.75811767578125, -1.680908203125, -1.60369873046875, -1.5264892578125, -1.44927978515625, -1.3720703125, -1.29486083984375, -1.2176513671875, -1.14044189453125, -1.063232421875, -0.98602294921875, -0.9088134765625, -0.83160400390625, -0.75439453125, -0.67718505859375, -0.5999755859375, -0.52276611328125, -0.445556640625, -0.36834716796875, -0.2911376953125, -0.21392822265625, -0.13671875, -0.05950927734375, 0.0177001953125, 0.09490966796875, 0.172119140625, 0.24932861328125, 0.3265380859375, 0.40374755859375, 0.48095703125, 0.55816650390625, 0.6353759765625, 0.71258544921875, 0.789794921875, 0.86700439453125, 0.9442138671875, 1.02142333984375, 1.0986328125, 1.17584228515625, 1.2530517578125, 1.33026123046875, 1.407470703125, 1.48468017578125, 1.5618896484375, 1.63909912109375, 1.71630859375, 1.79351806640625, 1.8707275390625, 1.94793701171875, 2.025146484375, 2.10235595703125, 2.1795654296875, 2.25677490234375, 2.333984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 14.0, 17.0, 10.0, 21.0, 18.0, 34.0, 33.0, 31.0, 39.0, 59.0, 52.0, 79.0, 153.0, 392.0, 1466.0, 184.0, 93.0, 50.0, 51.0, 39.0, 46.0, 37.0, 27.0, 24.0, 16.0, 12.0, 8.0, 13.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.0546875, -13.71246337890625, -13.3702392578125, -13.02801513671875, -12.685791015625, -12.34356689453125, -12.0013427734375, -11.65911865234375, -11.31689453125, -10.97467041015625, -10.6324462890625, -10.29022216796875, -9.947998046875, -9.60577392578125, -9.2635498046875, -8.92132568359375, -8.5791015625, -8.23687744140625, -7.8946533203125, -7.55242919921875, -7.210205078125, -6.86798095703125, -6.5257568359375, -6.18353271484375, -5.84130859375, -5.49908447265625, -5.1568603515625, -4.81463623046875, -4.472412109375, -4.13018798828125, -3.7879638671875, -3.44573974609375, -3.103515625, -2.76129150390625, -2.4190673828125, -2.07684326171875, -1.734619140625, -1.39239501953125, -1.0501708984375, -0.70794677734375, -0.36572265625, -0.02349853515625, 0.3187255859375, 0.66094970703125, 1.003173828125, 1.34539794921875, 1.6876220703125, 2.02984619140625, 2.3720703125, 2.71429443359375, 3.0565185546875, 3.39874267578125, 3.740966796875, 4.08319091796875, 4.4254150390625, 4.76763916015625, 5.10986328125, 5.45208740234375, 5.7943115234375, 6.13653564453125, 6.478759765625, 6.82098388671875, 7.1632080078125, 7.50543212890625, 7.84765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 13.0, 6.0, 7.0, 13.0, 16.0, 19.0, 34.0, 41.0, 60.0, 80.0, 103.0, 165.0, 219.0, 427.0, 950.0, 17031.0, 3086127.0, 37811.0, 1225.0, 452.0, 257.0, 168.0, 106.0, 93.0, 58.0, 51.0, 27.0, 27.0, 26.0, 24.0, 19.0, 12.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.484375, -17.665283203125, -16.84619140625, -16.027099609375, -15.2080078125, -14.388916015625, -13.56982421875, -12.750732421875, -11.931640625, -11.112548828125, -10.29345703125, -9.474365234375, -8.6552734375, -7.836181640625, -7.01708984375, -6.197998046875, -5.37890625, -4.559814453125, -3.74072265625, -2.921630859375, -2.1025390625, -1.283447265625, -0.46435546875, 0.354736328125, 1.173828125, 1.992919921875, 2.81201171875, 3.631103515625, 4.4501953125, 5.269287109375, 6.08837890625, 6.907470703125, 7.7265625, 8.545654296875, 9.36474609375, 10.183837890625, 11.0029296875, 11.822021484375, 12.64111328125, 13.460205078125, 14.279296875, 15.098388671875, 15.91748046875, 16.736572265625, 17.5556640625, 18.374755859375, 19.19384765625, 20.012939453125, 20.83203125, 21.651123046875, 22.47021484375, 23.289306640625, 24.1083984375, 24.927490234375, 25.74658203125, 26.565673828125, 27.384765625, 28.203857421875, 29.02294921875, 29.842041015625, 30.6611328125, 31.480224609375, 32.29931640625, 33.118408203125, 33.9375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 25.0, 43.0, 127.0, 242.0, 283.0, 157.0, 92.0, 29.0, 9.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.05703353881836, -29.151933670043945, -28.246835708618164, -27.34173583984375, -26.436635971069336, -25.531536102294922, -24.62643814086914, -23.721338272094727, -22.816238403320312, -21.9111385345459, -21.006040573120117, -20.100940704345703, -19.19584083557129, -18.290740966796875, -17.385643005371094, -16.48054313659668, -15.575444221496582, -14.670345306396484, -13.76524543762207, -12.860146522521973, -11.955046653747559, -11.049947738647461, -10.144847869873047, -9.23974895477295, -8.334650039672852, -7.429550647735596, -6.52445125579834, -5.619352340698242, -4.714252471923828, -3.8091535568237305, -2.9040541648864746, -1.9989547729492188, -1.0938549041748047, -0.1887555718421936, 0.7163437604904175, 1.6214430332183838, 2.5265424251556396, 3.4316415786743164, 4.336740970611572, 5.241840362548828, 6.146939754486084, 7.05203914642334, 7.957138538360596, 8.862237930297852, 9.76733684539795, 10.672435760498047, 11.577535629272461, 12.482635498046875, 13.387734413146973, 14.29283332824707, 15.197933197021484, 16.1030330657959, 17.00813102722168, 17.913230895996094, 18.818330764770508, 19.723430633544922, 20.628528594970703, 21.533628463745117, 22.4387264251709, 23.343826293945312, 24.248926162719727, 25.15402603149414, 26.059123992919922, 26.964223861694336, 27.86932373046875]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 6.0, 15.0, 9.0, 9.0, 15.0, 10.0, 15.0, 14.0, 21.0, 18.0, 27.0, 28.0, 19.0, 38.0, 37.0, 34.0, 31.0, 44.0, 41.0, 45.0, 47.0, 46.0, 52.0, 38.0, 29.0, 36.0, 32.0, 27.0, 23.0, 28.0, 30.0, 26.0, 28.0, 15.0, 12.0, 15.0, 7.0, 9.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.2705135345459, -19.670528411865234, -19.070541381835938, -18.47055435180664, -17.870569229125977, -17.270584106445312, -16.670597076416016, -16.07061004638672, -15.470624923706055, -14.870638847351074, -14.270652770996094, -13.670666694641113, -13.070680618286133, -12.470694541931152, -11.870708465576172, -11.270722389221191, -10.670736312866211, -10.07075023651123, -9.47076416015625, -8.87077808380127, -8.270792007446289, -7.670805931091309, -7.070819854736328, -6.470833778381348, -5.870847702026367, -5.270861625671387, -4.670875549316406, -4.070889472961426, -3.4709033966064453, -2.870917320251465, -2.2709312438964844, -1.670945167541504, -1.0709609985351562, -0.4709749221801758, 0.1290111541748047, 0.7289972305297852, 1.3289833068847656, 1.928969383239746, 2.5289554595947266, 3.128941535949707, 3.7289276123046875, 4.328913688659668, 4.928899765014648, 5.528885841369629, 6.128871917724609, 6.72885799407959, 7.32884407043457, 7.928830146789551, 8.528816223144531, 9.128802299499512, 9.728788375854492, 10.328774452209473, 10.928760528564453, 11.528746604919434, 12.128732681274414, 12.728718757629395, 13.328704833984375, 13.928690910339355, 14.528676986694336, 15.128663063049316, 15.728649139404297, 16.328636169433594, 16.928621292114258, 17.528606414794922, 18.12859344482422]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 3.0, 5.0, 4.0, 12.0, 13.0, 10.0, 21.0, 16.0, 17.0, 25.0, 41.0, 25.0, 19.0, 22.0, 30.0, 33.0, 36.0, 51.0, 35.0, 49.0, 51.0, 40.0, 41.0, 37.0, 39.0, 33.0, 38.0, 21.0, 25.0, 21.0, 26.0, 18.0, 23.0, 22.0, 12.0, 11.0, 11.0, 11.0, 6.0, 6.0, 4.0, 5.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.349609375, -2.2789306640625, -2.208251953125, -2.1375732421875, -2.06689453125, -1.9962158203125, -1.925537109375, -1.8548583984375, -1.7841796875, -1.7135009765625, -1.642822265625, -1.5721435546875, -1.50146484375, -1.4307861328125, -1.360107421875, -1.2894287109375, -1.21875, -1.1480712890625, -1.077392578125, -1.0067138671875, -0.93603515625, -0.8653564453125, -0.794677734375, -0.7239990234375, -0.6533203125, -0.5826416015625, -0.511962890625, -0.4412841796875, -0.37060546875, -0.2999267578125, -0.229248046875, -0.1585693359375, -0.087890625, -0.0172119140625, 0.053466796875, 0.1241455078125, 0.19482421875, 0.2655029296875, 0.336181640625, 0.4068603515625, 0.4775390625, 0.5482177734375, 0.618896484375, 0.6895751953125, 0.76025390625, 0.8309326171875, 0.901611328125, 0.9722900390625, 1.04296875, 1.1136474609375, 1.184326171875, 1.2550048828125, 1.32568359375, 1.3963623046875, 1.467041015625, 1.5377197265625, 1.6083984375, 1.6790771484375, 1.749755859375, 1.8204345703125, 1.89111328125, 1.9617919921875, 2.032470703125, 2.1031494140625, 2.173828125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 10.0, 17.0, 16.0, 24.0, 24.0, 27.0, 28.0, 30.0, 44.0, 74.0, 146.0, 309.0, 830.0, 4011.0, 59946.0, 1382138.0, 2531140.0, 203804.0, 9246.0, 1366.0, 409.0, 198.0, 92.0, 51.0, 32.0, 34.0, 17.0, 28.0, 26.0, 18.0, 15.0, 11.0, 13.0, 7.0, 6.0, 11.0, 8.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0], "bins": [-7.53515625, -7.30804443359375, -7.0809326171875, -6.85382080078125, -6.626708984375, -6.39959716796875, -6.1724853515625, -5.94537353515625, -5.71826171875, -5.49114990234375, -5.2640380859375, -5.03692626953125, -4.809814453125, -4.58270263671875, -4.3555908203125, -4.12847900390625, -3.9013671875, -3.67425537109375, -3.4471435546875, -3.22003173828125, -2.992919921875, -2.76580810546875, -2.5386962890625, -2.31158447265625, -2.08447265625, -1.85736083984375, -1.6302490234375, -1.40313720703125, -1.176025390625, -0.94891357421875, -0.7218017578125, -0.49468994140625, -0.267578125, -0.04046630859375, 0.1866455078125, 0.41375732421875, 0.640869140625, 0.86798095703125, 1.0950927734375, 1.32220458984375, 1.54931640625, 1.77642822265625, 2.0035400390625, 2.23065185546875, 2.457763671875, 2.68487548828125, 2.9119873046875, 3.13909912109375, 3.3662109375, 3.59332275390625, 3.8204345703125, 4.04754638671875, 4.274658203125, 4.50177001953125, 4.7288818359375, 4.95599365234375, 5.18310546875, 5.41021728515625, 5.6373291015625, 5.86444091796875, 6.091552734375, 6.31866455078125, 6.5457763671875, 6.77288818359375, 7.0]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 5.0, 11.0, 16.0, 30.0, 35.0, 40.0, 42.0, 66.0, 91.0, 100.0, 154.0, 170.0, 224.0, 254.0, 317.0, 305.0, 411.0, 329.0, 310.0, 259.0, 197.0, 158.0, 118.0, 88.0, 75.0, 47.0, 55.0, 29.0, 26.0, 21.0, 18.0, 13.0, 14.0, 9.0, 10.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.65234375, -4.516357421875, -4.38037109375, -4.244384765625, -4.1083984375, -3.972412109375, -3.83642578125, -3.700439453125, -3.564453125, -3.428466796875, -3.29248046875, -3.156494140625, -3.0205078125, -2.884521484375, -2.74853515625, -2.612548828125, -2.4765625, -2.340576171875, -2.20458984375, -2.068603515625, -1.9326171875, -1.796630859375, -1.66064453125, -1.524658203125, -1.388671875, -1.252685546875, -1.11669921875, -0.980712890625, -0.8447265625, -0.708740234375, -0.57275390625, -0.436767578125, -0.30078125, -0.164794921875, -0.02880859375, 0.107177734375, 0.2431640625, 0.379150390625, 0.51513671875, 0.651123046875, 0.787109375, 0.923095703125, 1.05908203125, 1.195068359375, 1.3310546875, 1.467041015625, 1.60302734375, 1.739013671875, 1.875, 2.010986328125, 2.14697265625, 2.282958984375, 2.4189453125, 2.554931640625, 2.69091796875, 2.826904296875, 2.962890625, 3.098876953125, 3.23486328125, 3.370849609375, 3.5068359375, 3.642822265625, 3.77880859375, 3.914794921875, 4.05078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 11.0, 15.0, 16.0, 17.0, 24.0, 29.0, 39.0, 55.0, 59.0, 91.0, 98.0, 120.0, 145.0, 246.0, 305.0, 732.0, 3084.0, 36187.0, 758349.0, 3046357.0, 328036.0, 16664.0, 1878.0, 580.0, 287.0, 201.0, 164.0, 118.0, 96.0, 60.0, 53.0, 43.0, 29.0, 29.0, 15.0, 19.0, 6.0, 5.0, 9.0, 6.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.6934814453125, -8.386962890625, -8.0804443359375, -7.77392578125, -7.4674072265625, -7.160888671875, -6.8543701171875, -6.5478515625, -6.2413330078125, -5.934814453125, -5.6282958984375, -5.32177734375, -5.0152587890625, -4.708740234375, -4.4022216796875, -4.095703125, -3.7891845703125, -3.482666015625, -3.1761474609375, -2.86962890625, -2.5631103515625, -2.256591796875, -1.9500732421875, -1.6435546875, -1.3370361328125, -1.030517578125, -0.7239990234375, -0.41748046875, -0.1109619140625, 0.195556640625, 0.5020751953125, 0.80859375, 1.1151123046875, 1.421630859375, 1.7281494140625, 2.03466796875, 2.3411865234375, 2.647705078125, 2.9542236328125, 3.2607421875, 3.5672607421875, 3.873779296875, 4.1802978515625, 4.48681640625, 4.7933349609375, 5.099853515625, 5.4063720703125, 5.712890625, 6.0194091796875, 6.325927734375, 6.6324462890625, 6.93896484375, 7.2454833984375, 7.552001953125, 7.8585205078125, 8.1650390625, 8.4715576171875, 8.778076171875, 9.0845947265625, 9.39111328125, 9.6976318359375, 10.004150390625, 10.3106689453125, 10.6171875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 10.0, 36.0, 49.0, 51.0, 86.0, 104.0, 119.0, 141.0, 119.0, 108.0, 82.0, 40.0, 28.0, 18.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.795066833496094, -28.9697265625, -28.144386291503906, -27.319046020507812, -26.49370574951172, -25.668365478515625, -24.8430233001709, -24.017683029174805, -23.19234275817871, -22.367002487182617, -21.541662216186523, -20.71632194519043, -19.890979766845703, -19.06563949584961, -18.240299224853516, -17.414958953857422, -16.589618682861328, -15.764278411865234, -14.93893814086914, -14.11359691619873, -13.288256645202637, -12.462916374206543, -11.637575149536133, -10.812234878540039, -9.986894607543945, -9.161554336547852, -8.336214065551758, -7.510872840881348, -6.685532569885254, -5.86019229888916, -5.034851551055908, -4.209510803222656, -3.3841705322265625, -2.5588300228118896, -1.7334895133972168, -0.908149003982544, -0.0828084945678711, 0.7425317764282227, 1.5678725242614746, 2.3932132720947266, 3.2185535430908203, 4.043893814086914, 4.869234561920166, 5.694575309753418, 6.519915580749512, 7.3452558517456055, 8.170597076416016, 8.99593734741211, 9.821277618408203, 10.646617889404297, 11.47195816040039, 12.2972993850708, 13.122639656066895, 13.947979927062988, 14.773321151733398, 15.598661422729492, 16.424001693725586, 17.24934196472168, 18.074682235717773, 18.900022506713867, 19.725364685058594, 20.550704956054688, 21.37604522705078, 22.201385498046875, 23.02672576904297]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 13.0, 20.0, 19.0, 19.0, 16.0, 32.0, 23.0, 29.0, 47.0, 35.0, 34.0, 37.0, 47.0, 50.0, 38.0, 50.0, 43.0, 49.0, 47.0, 29.0, 48.0, 34.0, 38.0, 32.0, 24.0, 26.0, 31.0, 10.0, 14.0, 11.0, 12.0, 9.0, 8.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.86268424987793, -18.28342628479004, -17.70416831970215, -17.124910354614258, -16.545652389526367, -15.966394424438477, -15.387136459350586, -14.807878494262695, -14.228620529174805, -13.649362564086914, -13.070104598999023, -12.490846633911133, -11.911588668823242, -11.332330703735352, -10.753072738647461, -10.17381477355957, -9.594555854797363, -9.015297889709473, -8.436039924621582, -7.856781959533691, -7.277523994445801, -6.69826602935791, -6.119007587432861, -5.539749622344971, -4.96049165725708, -4.3812336921691895, -3.801975727081299, -3.222717523574829, -2.6434595584869385, -2.064201593399048, -1.4849433898925781, -0.9056854248046875, -0.3264274597167969, 0.2528305649757385, 0.8320885896682739, 1.411346673965454, 1.9906046390533447, 2.5698626041412354, 3.149120807647705, 3.7283787727355957, 4.307636737823486, 4.886894702911377, 5.466152667999268, 6.045411109924316, 6.624669075012207, 7.203927040100098, 7.783185005187988, 8.362442970275879, 8.94170093536377, 9.52095890045166, 10.10021686553955, 10.679474830627441, 11.258732795715332, 11.837990760803223, 12.41724967956543, 12.99650764465332, 13.575765609741211, 14.155023574829102, 14.734281539916992, 15.313539505004883, 15.892797470092773, 16.472055435180664, 17.051313400268555, 17.630571365356445, 18.209829330444336]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 13.0, 13.0, 12.0, 18.0, 20.0, 23.0, 24.0, 24.0, 16.0, 26.0, 23.0, 25.0, 41.0, 37.0, 51.0, 43.0, 50.0, 36.0, 26.0, 39.0, 32.0, 25.0, 26.0, 36.0, 30.0, 31.0, 21.0, 20.0, 21.0, 19.0, 18.0, 17.0, 17.0, 12.0, 18.0, 10.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-2.005859375, -1.94427490234375, -1.8826904296875, -1.82110595703125, -1.759521484375, -1.69793701171875, -1.6363525390625, -1.57476806640625, -1.51318359375, -1.45159912109375, -1.3900146484375, -1.32843017578125, -1.266845703125, -1.20526123046875, -1.1436767578125, -1.08209228515625, -1.0205078125, -0.95892333984375, -0.8973388671875, -0.83575439453125, -0.774169921875, -0.71258544921875, -0.6510009765625, -0.58941650390625, -0.52783203125, -0.46624755859375, -0.4046630859375, -0.34307861328125, -0.281494140625, -0.21990966796875, -0.1583251953125, -0.09674072265625, -0.03515625, 0.02642822265625, 0.0880126953125, 0.14959716796875, 0.211181640625, 0.27276611328125, 0.3343505859375, 0.39593505859375, 0.45751953125, 0.51910400390625, 0.5806884765625, 0.64227294921875, 0.703857421875, 0.76544189453125, 0.8270263671875, 0.88861083984375, 0.9501953125, 1.01177978515625, 1.0733642578125, 1.13494873046875, 1.196533203125, 1.25811767578125, 1.3197021484375, 1.38128662109375, 1.44287109375, 1.50445556640625, 1.5660400390625, 1.62762451171875, 1.689208984375, 1.75079345703125, 1.8123779296875, 1.87396240234375, 1.935546875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 8.0, 19.0, 28.0, 38.0, 58.0, 111.0, 156.0, 209.0, 338.0, 448.0, 660.0, 1018.0, 1431.0, 1991.0, 2743.0, 4053.0, 5821.0, 8684.0, 12682.0, 19424.0, 30736.0, 50101.0, 86332.0, 159693.0, 241872.0, 173924.0, 94783.0, 54303.0, 33035.0, 20898.0, 13584.0, 9150.0, 6216.0, 4207.0, 2997.0, 2099.0, 1460.0, 1003.0, 717.0, 487.0, 336.0, 228.0, 159.0, 100.0, 74.0, 49.0, 34.0, 19.0, 9.0, 10.0, 6.0, 5.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.290283203125, -0.2813720703125, -0.2724609375, -0.2635498046875, -0.254638671875, -0.2457275390625, -0.23681640625, -0.2279052734375, -0.218994140625, -0.2100830078125, -0.201171875, -0.1922607421875, -0.183349609375, -0.1744384765625, -0.16552734375, -0.1566162109375, -0.147705078125, -0.1387939453125, -0.1298828125, -0.1209716796875, -0.112060546875, -0.1031494140625, -0.09423828125, -0.0853271484375, -0.076416015625, -0.0675048828125, -0.05859375, -0.0496826171875, -0.040771484375, -0.0318603515625, -0.02294921875, -0.0140380859375, -0.005126953125, 0.0037841796875, 0.0126953125, 0.0216064453125, 0.030517578125, 0.0394287109375, 0.04833984375, 0.0572509765625, 0.066162109375, 0.0750732421875, 0.083984375, 0.0928955078125, 0.101806640625, 0.1107177734375, 0.11962890625, 0.1285400390625, 0.137451171875, 0.1463623046875, 0.1552734375, 0.1641845703125, 0.173095703125, 0.1820068359375, 0.19091796875, 0.1998291015625, 0.208740234375, 0.2176513671875, 0.2265625, 0.2354736328125, 0.244384765625, 0.2532958984375, 0.26220703125, 0.2711181640625, 0.280029296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 13.0, 10.0, 14.0, 11.0, 30.0, 19.0, 39.0, 30.0, 36.0, 32.0, 39.0, 33.0, 38.0, 55.0, 60.0, 1078.0, 37.0, 51.0, 50.0, 45.0, 38.0, 34.0, 36.0, 37.0, 22.0, 23.0, 22.0, 23.0, 6.0, 12.0, 7.0, 9.0, 10.0, 2.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.634765625, -1.5842742919921875, -1.533782958984375, -1.4832916259765625, -1.43280029296875, -1.3823089599609375, -1.331817626953125, -1.2813262939453125, -1.2308349609375, -1.1803436279296875, -1.129852294921875, -1.0793609619140625, -1.02886962890625, -0.9783782958984375, -0.927886962890625, -0.8773956298828125, -0.826904296875, -0.7764129638671875, -0.725921630859375, -0.6754302978515625, -0.62493896484375, -0.5744476318359375, -0.523956298828125, -0.4734649658203125, -0.4229736328125, -0.3724822998046875, -0.321990966796875, -0.2714996337890625, -0.22100830078125, -0.1705169677734375, -0.120025634765625, -0.0695343017578125, -0.01904296875, 0.0314483642578125, 0.081939697265625, 0.1324310302734375, 0.18292236328125, 0.2334136962890625, 0.283905029296875, 0.3343963623046875, 0.3848876953125, 0.4353790283203125, 0.485870361328125, 0.5363616943359375, 0.58685302734375, 0.6373443603515625, 0.687835693359375, 0.7383270263671875, 0.788818359375, 0.8393096923828125, 0.889801025390625, 0.9402923583984375, 0.99078369140625, 1.0412750244140625, 1.091766357421875, 1.1422576904296875, 1.1927490234375, 1.2432403564453125, 1.293731689453125, 1.3442230224609375, 1.39471435546875, 1.4452056884765625, 1.495697021484375, 1.5461883544921875, 1.5966796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 20.0, 32.0, 44.0, 52.0, 93.0, 117.0, 153.0, 277.0, 339.0, 532.0, 814.0, 1127.0, 1698.0, 2561.0, 3962.0, 6056.0, 9765.0, 15651.0, 25211.0, 41603.0, 72262.0, 130433.0, 1225153.0, 260528.0, 124095.0, 68784.0, 40169.0, 24068.0, 14710.0, 9196.0, 5926.0, 3782.0, 2614.0, 1662.0, 1160.0, 806.0, 539.0, 343.0, 236.0, 174.0, 109.0, 80.0, 66.0, 38.0, 28.0, 15.0, 14.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.248779296875, -0.2409954071044922, -0.23321151733398438, -0.22542762756347656, -0.21764373779296875, -0.20985984802246094, -0.20207595825195312, -0.1942920684814453, -0.1865081787109375, -0.1787242889404297, -0.17094039916992188, -0.16315650939941406, -0.15537261962890625, -0.14758872985839844, -0.13980484008789062, -0.1320209503173828, -0.124237060546875, -0.11645317077636719, -0.10866928100585938, -0.10088539123535156, -0.09310150146484375, -0.08531761169433594, -0.07753372192382812, -0.06974983215332031, -0.0619659423828125, -0.05418205261230469, -0.046398162841796875, -0.03861427307128906, -0.03083038330078125, -0.023046493530273438, -0.015262603759765625, -0.0074787139892578125, 0.00030517578125, 0.008089065551757812, 0.015872955322265625, 0.023656845092773438, 0.03144073486328125, 0.03922462463378906, 0.047008514404296875, 0.05479240417480469, 0.0625762939453125, 0.07036018371582031, 0.07814407348632812, 0.08592796325683594, 0.09371185302734375, 0.10149574279785156, 0.10927963256835938, 0.11706352233886719, 0.124847412109375, 0.1326313018798828, 0.14041519165039062, 0.14819908142089844, 0.15598297119140625, 0.16376686096191406, 0.17155075073242188, 0.1793346405029297, 0.1871185302734375, 0.1949024200439453, 0.20268630981445312, 0.21047019958496094, 0.21825408935546875, 0.22603797912597656, 0.23382186889648438, 0.2416057586669922, 0.2493896484375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 7.0, 2.0, 6.0, 8.0, 12.0, 7.0, 12.0, 19.0, 18.0, 38.0, 38.0, 50.0, 39.0, 61.0, 57.0, 64.0, 68.0, 74.0, 65.0, 55.0, 57.0, 41.0, 36.0, 25.0, 29.0, 22.0, 13.0, 16.0, 17.0, 11.0, 8.0, 7.0, 8.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007238388061523438, -0.0006979629397392273, -0.0006720870733261108, -0.0006462112069129944, -0.0006203353404998779, -0.0005944594740867615, -0.000568583607673645, -0.0005427077412605286, -0.0005168318748474121, -0.0004909560084342957, -0.0004650801420211792, -0.00043920427560806274, -0.0004133284091949463, -0.00038745254278182983, -0.0003615766763687134, -0.0003357008099555969, -0.00030982494354248047, -0.000283949077129364, -0.00025807321071624756, -0.0002321973443031311, -0.00020632147789001465, -0.0001804456114768982, -0.00015456974506378174, -0.00012869387865066528, -0.00010281801223754883, -7.694214582443237e-05, -5.106627941131592e-05, -2.5190412998199463e-05, 6.854534149169922e-07, 2.6561319828033447e-05, 5.24371862411499e-05, 7.831305265426636e-05, 0.00010418891906738281, 0.00013006478548049927, 0.00015594065189361572, 0.00018181651830673218, 0.00020769238471984863, 0.0002335682511329651, 0.00025944411754608154, 0.000285319983959198, 0.00031119585037231445, 0.0003370717167854309, 0.00036294758319854736, 0.0003888234496116638, 0.0004146993160247803, 0.00044057518243789673, 0.0004664510488510132, 0.0004923269152641296, 0.0005182027816772461, 0.0005440786480903625, 0.000569954514503479, 0.0005958303809165955, 0.0006217062473297119, 0.0006475821137428284, 0.0006734579801559448, 0.0006993338465690613, 0.0007252097129821777, 0.0007510855793952942, 0.0007769614458084106, 0.0008028373122215271, 0.0008287131786346436, 0.00085458904504776, 0.0008804649114608765, 0.0009063407778739929, 0.0009322166442871094]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 11.0, 11.0, 14.0, 13.0, 15.0, 18.0, 19.0, 34.0, 35.0, 57.0, 94.0, 131.0, 224.0, 475.0, 1967.0, 275847.0, 764663.0, 3525.0, 611.0, 272.0, 148.0, 79.0, 61.0, 54.0, 42.0, 25.0, 21.0, 19.0, 8.0, 18.0, 4.0, 4.0, 2.0, 5.0, 8.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01666259765625, -0.0161435604095459, -0.015624523162841797, -0.015105485916137695, -0.014586448669433594, -0.014067411422729492, -0.01354837417602539, -0.013029336929321289, -0.012510299682617188, -0.011991262435913086, -0.011472225189208984, -0.010953187942504883, -0.010434150695800781, -0.00991511344909668, -0.009396076202392578, -0.008877038955688477, -0.008358001708984375, -0.007838964462280273, -0.007319927215576172, -0.00680088996887207, -0.006281852722167969, -0.005762815475463867, -0.005243778228759766, -0.004724740982055664, -0.0042057037353515625, -0.003686666488647461, -0.0031676292419433594, -0.002648591995239258, -0.0021295547485351562, -0.0016105175018310547, -0.0010914802551269531, -0.0005724430084228516, -5.340576171875e-05, 0.00046563148498535156, 0.0009846687316894531, 0.0015037059783935547, 0.0020227432250976562, 0.002541780471801758, 0.0030608177185058594, 0.003579854965209961, 0.0040988922119140625, 0.004617929458618164, 0.005136966705322266, 0.005656003952026367, 0.006175041198730469, 0.00669407844543457, 0.007213115692138672, 0.0077321529388427734, 0.008251190185546875, 0.008770227432250977, 0.009289264678955078, 0.00980830192565918, 0.010327339172363281, 0.010846376419067383, 0.011365413665771484, 0.011884450912475586, 0.012403488159179688, 0.012922525405883789, 0.01344156265258789, 0.013960599899291992, 0.014479637145996094, 0.014998674392700195, 0.015517711639404297, 0.0160367488861084, 0.0165557861328125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 8.0, 29.0, 87.0, 207.0, 318.0, 223.0, 99.0, 29.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00032286858186125755, -0.0002732789143919945, -0.00022368927602656186, -0.000174099623109214, -0.00012450997019186616, -7.492030272260308e-05, -2.5330664357170463e-05, 2.4258974008262157e-05, 7.384864147752523e-05, 0.00012343829439487308, 0.00017302794731222093, 0.00022261760022956878, 0.00027220725314691663, 0.0003217969206161797, 0.0003713865589816123, 0.00042097619734704494, 0.000470565864816308, 0.0005201555322855711, 0.0005697451997548342, 0.0006193348090164363, 0.0006689244764856994, 0.0007185141439549625, 0.0007681037532165647, 0.0008176934206858277, 0.0008672830881550908, 0.0009168727556243539, 0.000966462423093617, 0.00101605209056288, 0.0010656416416168213, 0.0011152313090860844, 0.0011648209765553474, 0.0012144106440246105, 0.0012640003114938736, 0.0013135899789631367, 0.0013631796464323997, 0.0014127693139016628, 0.001462358981370926, 0.001511948648840189, 0.0015615381998941302, 0.0016111278673633933, 0.0016607175348326564, 0.0017103072023019195, 0.0017598968697711825, 0.0018094865372404456, 0.0018590760882943869, 0.00190866575576365, 0.001958255423232913, 0.002007845090702176, 0.002057434758171439, 0.0021070244256407022, 0.0021566140931099653, 0.0022062037605792284, 0.0022557934280484915, 0.0023053830955177546, 0.0023549727629870176, 0.002404562197625637, 0.0024541518650949, 0.002503741532564163, 0.0025533312000334263, 0.0026029208675026894, 0.0026525105349719524, 0.0027021002024412155, 0.0027516898699104786, 0.0028012795373797417, 0.0028508692048490047]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 6.0, 9.0, 4.0, 10.0, 18.0, 16.0, 18.0, 17.0, 23.0, 30.0, 28.0, 32.0, 42.0, 28.0, 35.0, 43.0, 45.0, 46.0, 49.0, 42.0, 40.0, 39.0, 37.0, 30.0, 34.0, 40.0, 30.0, 24.0, 22.0, 29.0, 14.0, 25.0, 16.0, 19.0, 7.0, 9.0, 12.0, 6.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00043070316314697266, -0.00041798409074544907, -0.0004052650183439255, -0.0003925459459424019, -0.0003798268735408783, -0.0003671078011393547, -0.0003543887287378311, -0.0003416696563363075, -0.00032895058393478394, -0.00031623151153326035, -0.00030351243913173676, -0.00029079336673021317, -0.0002780742943286896, -0.000265355221927166, -0.0002526361495256424, -0.0002399170771241188, -0.00022719800472259521, -0.00021447893232107162, -0.00020175985991954803, -0.00018904078751802444, -0.00017632171511650085, -0.00016360264271497726, -0.00015088357031345367, -0.00013816449791193008, -0.0001254454255104065, -0.0001127263531088829, -0.00010000728070735931, -8.728820830583572e-05, -7.456913590431213e-05, -6.185006350278854e-05, -4.9130991101264954e-05, -3.6411918699741364e-05, -2.3692846298217773e-05, -1.0973773896694183e-05, 1.7452985048294067e-06, 1.4464370906352997e-05, 2.7183443307876587e-05, 3.990251570940018e-05, 5.262158811092377e-05, 6.534066051244736e-05, 7.805973291397095e-05, 9.077880531549454e-05, 0.00010349787771701813, 0.00011621695011854172, 0.0001289360225200653, 0.0001416550949215889, 0.0001543741673231125, 0.00016709323972463608, 0.00017981231212615967, 0.00019253138452768326, 0.00020525045692920685, 0.00021796952933073044, 0.00023068860173225403, 0.00024340767413377762, 0.0002561267465353012, 0.0002688458189368248, 0.0002815648913383484, 0.000294283963739872, 0.00030700303614139557, 0.00031972210854291916, 0.00033244118094444275, 0.00034516025334596634, 0.00035787932574748993, 0.0003705983981490135, 0.0003833174705505371]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 13.0, 13.0, 12.0, 19.0, 20.0, 24.0, 22.0, 24.0, 16.0, 27.0, 26.0, 22.0, 40.0, 38.0, 50.0, 44.0, 50.0, 35.0, 29.0, 36.0, 32.0, 25.0, 27.0, 35.0, 30.0, 32.0, 21.0, 19.0, 21.0, 19.0, 18.0, 17.0, 17.0, 12.0, 18.0, 10.0, 15.0, 4.0, 6.0, 4.0, 5.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-2.00390625, -1.942352294921875, -1.88079833984375, -1.819244384765625, -1.7576904296875, -1.696136474609375, -1.63458251953125, -1.573028564453125, -1.511474609375, -1.449920654296875, -1.38836669921875, -1.326812744140625, -1.2652587890625, -1.203704833984375, -1.14215087890625, -1.080596923828125, -1.01904296875, -0.957489013671875, -0.89593505859375, -0.834381103515625, -0.7728271484375, -0.711273193359375, -0.64971923828125, -0.588165283203125, -0.526611328125, -0.465057373046875, -0.40350341796875, -0.341949462890625, -0.2803955078125, -0.218841552734375, -0.15728759765625, -0.095733642578125, -0.0341796875, 0.027374267578125, 0.08892822265625, 0.150482177734375, 0.2120361328125, 0.273590087890625, 0.33514404296875, 0.396697998046875, 0.458251953125, 0.519805908203125, 0.58135986328125, 0.642913818359375, 0.7044677734375, 0.766021728515625, 0.82757568359375, 0.889129638671875, 0.95068359375, 1.012237548828125, 1.07379150390625, 1.135345458984375, 1.1968994140625, 1.258453369140625, 1.32000732421875, 1.381561279296875, 1.443115234375, 1.504669189453125, 1.56622314453125, 1.627777099609375, 1.6893310546875, 1.750885009765625, 1.81243896484375, 1.873992919921875, 1.935546875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 4.0, 12.0, 16.0, 28.0, 50.0, 90.0, 135.0, 231.0, 475.0, 1185.0, 3176.0, 8944.0, 26030.0, 67175.0, 167149.0, 363285.0, 246029.0, 101755.0, 39787.0, 14649.0, 5124.0, 1756.0, 735.0, 319.0, 165.0, 96.0, 46.0, 42.0, 24.0, 8.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.8165283203125, -2.724853515625, -2.6331787109375, -2.54150390625, -2.4498291015625, -2.358154296875, -2.2664794921875, -2.1748046875, -2.0831298828125, -1.991455078125, -1.8997802734375, -1.80810546875, -1.7164306640625, -1.624755859375, -1.5330810546875, -1.44140625, -1.3497314453125, -1.258056640625, -1.1663818359375, -1.07470703125, -0.9830322265625, -0.891357421875, -0.7996826171875, -0.7080078125, -0.6163330078125, -0.524658203125, -0.4329833984375, -0.34130859375, -0.2496337890625, -0.157958984375, -0.0662841796875, 0.025390625, 0.1170654296875, 0.208740234375, 0.3004150390625, 0.39208984375, 0.4837646484375, 0.575439453125, 0.6671142578125, 0.7587890625, 0.8504638671875, 0.942138671875, 1.0338134765625, 1.12548828125, 1.2171630859375, 1.308837890625, 1.4005126953125, 1.4921875, 1.5838623046875, 1.675537109375, 1.7672119140625, 1.85888671875, 1.9505615234375, 2.042236328125, 2.1339111328125, 2.2255859375, 2.3172607421875, 2.408935546875, 2.5006103515625, 2.59228515625, 2.6839599609375, 2.775634765625, 2.8673095703125, 2.958984375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 17.0, 8.0, 15.0, 21.0, 18.0, 15.0, 25.0, 29.0, 47.0, 42.0, 33.0, 57.0, 73.0, 117.0, 349.0, 1450.0, 210.0, 111.0, 55.0, 44.0, 43.0, 37.0, 37.0, 38.0, 27.0, 23.0, 25.0, 13.0, 6.0, 16.0, 11.0, 10.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.49725341796875, -6.2171630859375, -5.93707275390625, -5.656982421875, -5.37689208984375, -5.0968017578125, -4.81671142578125, -4.53662109375, -4.25653076171875, -3.9764404296875, -3.69635009765625, -3.416259765625, -3.13616943359375, -2.8560791015625, -2.57598876953125, -2.2958984375, -2.01580810546875, -1.7357177734375, -1.45562744140625, -1.175537109375, -0.89544677734375, -0.6153564453125, -0.33526611328125, -0.05517578125, 0.22491455078125, 0.5050048828125, 0.78509521484375, 1.065185546875, 1.34527587890625, 1.6253662109375, 1.90545654296875, 2.185546875, 2.46563720703125, 2.7457275390625, 3.02581787109375, 3.305908203125, 3.58599853515625, 3.8660888671875, 4.14617919921875, 4.42626953125, 4.70635986328125, 4.9864501953125, 5.26654052734375, 5.546630859375, 5.82672119140625, 6.1068115234375, 6.38690185546875, 6.6669921875, 6.94708251953125, 7.2271728515625, 7.50726318359375, 7.787353515625, 8.06744384765625, 8.3475341796875, 8.62762451171875, 8.90771484375, 9.18780517578125, 9.4678955078125, 9.74798583984375, 10.028076171875, 10.30816650390625, 10.5882568359375, 10.86834716796875, 11.1484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 11.0, 10.0, 11.0, 11.0, 24.0, 28.0, 27.0, 41.0, 48.0, 63.0, 83.0, 138.0, 153.0, 250.0, 489.0, 1411.0, 84413.0, 3049230.0, 7396.0, 798.0, 337.0, 206.0, 130.0, 96.0, 71.0, 55.0, 40.0, 31.0, 14.0, 21.0, 7.0, 21.0, 7.0, 9.0, 4.0, 4.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.875, -24.05419921875, -23.2333984375, -22.41259765625, -21.591796875, -20.77099609375, -19.9501953125, -19.12939453125, -18.30859375, -17.48779296875, -16.6669921875, -15.84619140625, -15.025390625, -14.20458984375, -13.3837890625, -12.56298828125, -11.7421875, -10.92138671875, -10.1005859375, -9.27978515625, -8.458984375, -7.63818359375, -6.8173828125, -5.99658203125, -5.17578125, -4.35498046875, -3.5341796875, -2.71337890625, -1.892578125, -1.07177734375, -0.2509765625, 0.56982421875, 1.390625, 2.21142578125, 3.0322265625, 3.85302734375, 4.673828125, 5.49462890625, 6.3154296875, 7.13623046875, 7.95703125, 8.77783203125, 9.5986328125, 10.41943359375, 11.240234375, 12.06103515625, 12.8818359375, 13.70263671875, 14.5234375, 15.34423828125, 16.1650390625, 16.98583984375, 17.806640625, 18.62744140625, 19.4482421875, 20.26904296875, 21.08984375, 21.91064453125, 22.7314453125, 23.55224609375, 24.373046875, 25.19384765625, 26.0146484375, 26.83544921875, 27.65625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 74.0, 632.0, 299.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.503320693969727, -18.72210121154785, -15.94088363647461, -13.159664154052734, -10.378445625305176, -7.597227096557617, -4.816007614135742, -2.0347900390625, 0.746429443359375, 3.5276482105255127, 6.30886697769165, 9.090085983276367, 11.871304512023926, 14.652523040771484, 17.43374252319336, 20.2149600982666, 22.996179580688477, 25.77739906311035, 28.558616638183594, 31.33983612060547, 34.121055603027344, 36.90227508544922, 39.683494567871094, 42.4647102355957, 45.24592971801758, 48.02714920043945, 50.80836868286133, 53.58958435058594, 56.37080383300781, 59.15202331542969, 61.93324279785156, 64.71446228027344, 67.49567413330078, 70.27689361572266, 73.05811309814453, 75.8393325805664, 78.62055206298828, 81.40176391601562, 84.1829833984375, 86.96420288085938, 89.74542236328125, 92.52664184570312, 95.307861328125, 98.08908081054688, 100.87030029296875, 103.65151977539062, 106.4327392578125, 109.21395111083984, 111.99517822265625, 114.77639770507812, 117.5576171875, 120.33883666992188, 123.12005615234375, 125.90127563476562, 128.6824951171875, 131.46371459960938, 134.2449188232422, 137.02613830566406, 139.80735778808594, 142.5885772705078, 145.3697967529297, 148.15101623535156, 150.93223571777344, 153.7134552001953, 156.4946746826172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 6.0, 8.0, 10.0, 12.0, 17.0, 15.0, 18.0, 17.0, 13.0, 28.0, 24.0, 35.0, 41.0, 31.0, 40.0, 38.0, 47.0, 38.0, 47.0, 30.0, 42.0, 33.0, 39.0, 37.0, 32.0, 35.0, 35.0, 29.0, 25.0, 22.0, 34.0, 20.0, 18.0, 13.0, 17.0, 11.0, 4.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.69818878173828, -22.0194034576416, -21.340618133544922, -20.66183090209961, -19.98304557800293, -19.30426025390625, -18.62547492980957, -17.94668960571289, -17.267902374267578, -16.5891170501709, -15.910330772399902, -15.231545448303223, -14.552759170532227, -13.873973846435547, -13.195188522338867, -12.516403198242188, -11.837617874145508, -11.158832550048828, -10.480046272277832, -9.801260948181152, -9.122474670410156, -8.443689346313477, -7.764904022216797, -7.086118221282959, -6.407332420349121, -5.728546619415283, -5.049760818481445, -4.370975494384766, -3.6921896934509277, -3.01340389251709, -2.33461856842041, -1.6558327674865723, -0.9770450592041016, -0.2982593774795532, 0.3805263042449951, 1.059311866760254, 1.7380976676940918, 2.4168834686279297, 3.0956687927246094, 3.7744545936584473, 4.453240394592285, 5.132026195526123, 5.810811996459961, 6.489597320556641, 7.1683831214904785, 7.847168922424316, 8.525954246520996, 9.204740524291992, 9.883525848388672, 10.562311172485352, 11.241097450256348, 11.919882774353027, 12.598669052124023, 13.277454376220703, 13.956239700317383, 14.635025024414062, 15.313811302185059, 15.992596626281738, 16.671382904052734, 17.350168228149414, 18.028953552246094, 18.707740783691406, 19.386524200439453, 20.065311431884766, 20.744096755981445]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 9.0, 11.0, 12.0, 22.0, 20.0, 13.0, 18.0, 27.0, 17.0, 27.0, 30.0, 33.0, 35.0, 37.0, 33.0, 45.0, 49.0, 43.0, 27.0, 40.0, 42.0, 35.0, 26.0, 38.0, 34.0, 27.0, 23.0, 24.0, 24.0, 12.0, 22.0, 15.0, 17.0, 19.0, 13.0, 8.0, 13.0, 6.0, 11.0, 3.0, 3.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.271484375, -2.198577880859375, -2.12567138671875, -2.052764892578125, -1.9798583984375, -1.906951904296875, -1.83404541015625, -1.761138916015625, -1.688232421875, -1.615325927734375, -1.54241943359375, -1.469512939453125, -1.3966064453125, -1.323699951171875, -1.25079345703125, -1.177886962890625, -1.10498046875, -1.032073974609375, -0.95916748046875, -0.886260986328125, -0.8133544921875, -0.740447998046875, -0.66754150390625, -0.594635009765625, -0.521728515625, -0.448822021484375, -0.37591552734375, -0.303009033203125, -0.2301025390625, -0.157196044921875, -0.08428955078125, -0.011383056640625, 0.0615234375, 0.134429931640625, 0.20733642578125, 0.280242919921875, 0.3531494140625, 0.426055908203125, 0.49896240234375, 0.571868896484375, 0.644775390625, 0.717681884765625, 0.79058837890625, 0.863494873046875, 0.9364013671875, 1.009307861328125, 1.08221435546875, 1.155120849609375, 1.22802734375, 1.300933837890625, 1.37384033203125, 1.446746826171875, 1.5196533203125, 1.592559814453125, 1.66546630859375, 1.738372802734375, 1.811279296875, 1.884185791015625, 1.95709228515625, 2.029998779296875, 2.1029052734375, 2.175811767578125, 2.24871826171875, 2.321624755859375, 2.39453125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 4.0, 8.0, 14.0, 11.0, 11.0, 8.0, 21.0, 22.0, 26.0, 27.0, 33.0, 48.0, 52.0, 89.0, 157.0, 279.0, 788.0, 3331.0, 35439.0, 697934.0, 2756964.0, 660153.0, 33588.0, 3312.0, 916.0, 379.0, 195.0, 107.0, 65.0, 58.0, 27.0, 33.0, 20.0, 25.0, 11.0, 28.0, 17.0, 10.0, 9.0, 8.0, 8.0, 7.0, 6.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-7.1171875, -6.89813232421875, -6.6790771484375, -6.46002197265625, -6.240966796875, -6.02191162109375, -5.8028564453125, -5.58380126953125, -5.36474609375, -5.14569091796875, -4.9266357421875, -4.70758056640625, -4.488525390625, -4.26947021484375, -4.0504150390625, -3.83135986328125, -3.6123046875, -3.39324951171875, -3.1741943359375, -2.95513916015625, -2.736083984375, -2.51702880859375, -2.2979736328125, -2.07891845703125, -1.85986328125, -1.64080810546875, -1.4217529296875, -1.20269775390625, -0.983642578125, -0.76458740234375, -0.5455322265625, -0.32647705078125, -0.107421875, 0.11163330078125, 0.3306884765625, 0.54974365234375, 0.768798828125, 0.98785400390625, 1.2069091796875, 1.42596435546875, 1.64501953125, 1.86407470703125, 2.0831298828125, 2.30218505859375, 2.521240234375, 2.74029541015625, 2.9593505859375, 3.17840576171875, 3.3974609375, 3.61651611328125, 3.8355712890625, 4.05462646484375, 4.273681640625, 4.49273681640625, 4.7117919921875, 4.93084716796875, 5.14990234375, 5.36895751953125, 5.5880126953125, 5.80706787109375, 6.026123046875, 6.24517822265625, 6.4642333984375, 6.68328857421875, 6.90234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 5.0, 8.0, 11.0, 16.0, 20.0, 27.0, 25.0, 38.0, 41.0, 79.0, 79.0, 121.0, 141.0, 194.0, 253.0, 254.0, 309.0, 346.0, 358.0, 300.0, 285.0, 270.0, 201.0, 136.0, 124.0, 80.0, 102.0, 55.0, 42.0, 31.0, 23.0, 22.0, 14.0, 16.0, 12.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.13671875, -3.9947509765625, -3.852783203125, -3.7108154296875, -3.56884765625, -3.4268798828125, -3.284912109375, -3.1429443359375, -3.0009765625, -2.8590087890625, -2.717041015625, -2.5750732421875, -2.43310546875, -2.2911376953125, -2.149169921875, -2.0072021484375, -1.865234375, -1.7232666015625, -1.581298828125, -1.4393310546875, -1.29736328125, -1.1553955078125, -1.013427734375, -0.8714599609375, -0.7294921875, -0.5875244140625, -0.445556640625, -0.3035888671875, -0.16162109375, -0.0196533203125, 0.122314453125, 0.2642822265625, 0.40625, 0.5482177734375, 0.690185546875, 0.8321533203125, 0.97412109375, 1.1160888671875, 1.258056640625, 1.4000244140625, 1.5419921875, 1.6839599609375, 1.825927734375, 1.9678955078125, 2.10986328125, 2.2518310546875, 2.393798828125, 2.5357666015625, 2.677734375, 2.8197021484375, 2.961669921875, 3.1036376953125, 3.24560546875, 3.3875732421875, 3.529541015625, 3.6715087890625, 3.8134765625, 3.9554443359375, 4.097412109375, 4.2393798828125, 4.38134765625, 4.5233154296875, 4.665283203125, 4.8072509765625, 4.94921875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 9.0, 9.0, 21.0, 18.0, 19.0, 28.0, 54.0, 64.0, 94.0, 117.0, 155.0, 212.0, 340.0, 536.0, 1627.0, 37059.0, 2948143.0, 1191465.0, 11810.0, 1041.0, 426.0, 293.0, 186.0, 149.0, 92.0, 82.0, 52.0, 40.0, 26.0, 26.0, 21.0, 16.0, 12.0, 4.0, 8.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.709716796875, -15.20068359375, -14.691650390625, -14.1826171875, -13.673583984375, -13.16455078125, -12.655517578125, -12.146484375, -11.637451171875, -11.12841796875, -10.619384765625, -10.1103515625, -9.601318359375, -9.09228515625, -8.583251953125, -8.07421875, -7.565185546875, -7.05615234375, -6.547119140625, -6.0380859375, -5.529052734375, -5.02001953125, -4.510986328125, -4.001953125, -3.492919921875, -2.98388671875, -2.474853515625, -1.9658203125, -1.456787109375, -0.94775390625, -0.438720703125, 0.0703125, 0.579345703125, 1.08837890625, 1.597412109375, 2.1064453125, 2.615478515625, 3.12451171875, 3.633544921875, 4.142578125, 4.651611328125, 5.16064453125, 5.669677734375, 6.1787109375, 6.687744140625, 7.19677734375, 7.705810546875, 8.21484375, 8.723876953125, 9.23291015625, 9.741943359375, 10.2509765625, 10.760009765625, 11.26904296875, 11.778076171875, 12.287109375, 12.796142578125, 13.30517578125, 13.814208984375, 14.3232421875, 14.832275390625, 15.34130859375, 15.850341796875, 16.359375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 22.0, 189.0, 453.0, 294.0, 54.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.65222930908203, -100.47725677490234, -97.30227661132812, -94.12730407714844, -90.95233154296875, -87.77735900878906, -84.60238647460938, -81.42740631103516, -78.25243377685547, -75.07746124267578, -71.90248107910156, -68.72750854492188, -65.55253601074219, -62.3775634765625, -59.20258712768555, -56.027610778808594, -52.852638244628906, -49.67766571044922, -46.502689361572266, -43.32771301269531, -40.152740478515625, -36.97776794433594, -33.802791595458984, -30.627817153930664, -27.452842712402344, -24.277868270874023, -21.102893829345703, -17.927919387817383, -14.752944946289062, -11.577970504760742, -8.402996063232422, -5.228021621704102, -2.0530548095703125, 1.1219196319580078, 4.296894073486328, 7.471868515014648, 10.646842956542969, 13.821817398071289, 16.99679183959961, 20.17176628112793, 23.34674072265625, 26.52171516418457, 29.69668960571289, 32.871665954589844, 36.04663848876953, 39.22161102294922, 42.39658737182617, 45.571563720703125, 48.74653625488281, 51.9215087890625, 55.09648513793945, 58.271461486816406, 61.446434020996094, 64.62140655517578, 67.79638671875, 70.97135925292969, 74.14633178710938, 77.32130432128906, 80.49627685546875, 83.67125701904297, 86.84622955322266, 90.02120208740234, 93.19618225097656, 96.37115478515625, 99.54612731933594]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 12.0, 9.0, 16.0, 29.0, 14.0, 16.0, 25.0, 31.0, 33.0, 36.0, 37.0, 36.0, 47.0, 38.0, 35.0, 37.0, 35.0, 34.0, 39.0, 42.0, 40.0, 40.0, 38.0, 31.0, 30.0, 28.0, 29.0, 16.0, 13.0, 14.0, 16.0, 8.0, 12.0, 14.0, 9.0, 7.0, 10.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.75714874267578, -16.243026733398438, -15.728904724121094, -15.214783668518066, -14.700661659240723, -14.186539649963379, -13.672418594360352, -13.158296585083008, -12.644174575805664, -12.13005256652832, -11.615930557250977, -11.10180950164795, -10.587687492370605, -10.073565483093262, -9.559444427490234, -9.04532241821289, -8.531200408935547, -8.017078399658203, -7.502956867218018, -6.988835334777832, -6.474713325500488, -5.9605913162231445, -5.446469783782959, -4.932348251342773, -4.41822624206543, -3.904104471206665, -3.3899827003479004, -2.8758609294891357, -2.361739158630371, -1.8476173877716064, -1.3334956169128418, -0.8193738460540771, -0.3052520751953125, 0.20886969566345215, 0.7229914665222168, 1.2371132373809814, 1.751235008239746, 2.2653567790985107, 2.7794785499572754, 3.29360032081604, 3.8077220916748047, 4.321844100952148, 4.835965633392334, 5.3500871658325195, 5.864209175109863, 6.378331184387207, 6.892452716827393, 7.406574249267578, 7.920696258544922, 8.434818267822266, 8.94894027709961, 9.463061332702637, 9.97718334197998, 10.491305351257324, 11.005426406860352, 11.519548416137695, 12.033670425415039, 12.547792434692383, 13.061914443969727, 13.576035499572754, 14.090157508850098, 14.604279518127441, 15.118400573730469, 15.632522583007812, 16.146644592285156]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 3.0, 20.0, 19.0, 22.0, 19.0, 26.0, 17.0, 29.0, 28.0, 33.0, 42.0, 33.0, 52.0, 51.0, 38.0, 40.0, 29.0, 41.0, 59.0, 33.0, 34.0, 25.0, 32.0, 45.0, 31.0, 27.0, 29.0, 23.0, 16.0, 15.0, 14.0, 12.0, 8.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53125, -2.452484130859375, -2.37371826171875, -2.294952392578125, -2.2161865234375, -2.137420654296875, -2.05865478515625, -1.979888916015625, -1.901123046875, -1.822357177734375, -1.74359130859375, -1.664825439453125, -1.5860595703125, -1.507293701171875, -1.42852783203125, -1.349761962890625, -1.27099609375, -1.192230224609375, -1.11346435546875, -1.034698486328125, -0.9559326171875, -0.877166748046875, -0.79840087890625, -0.719635009765625, -0.640869140625, -0.562103271484375, -0.48333740234375, -0.404571533203125, -0.3258056640625, -0.247039794921875, -0.16827392578125, -0.089508056640625, -0.0107421875, 0.068023681640625, 0.14678955078125, 0.225555419921875, 0.3043212890625, 0.383087158203125, 0.46185302734375, 0.540618896484375, 0.619384765625, 0.698150634765625, 0.77691650390625, 0.855682373046875, 0.9344482421875, 1.013214111328125, 1.09197998046875, 1.170745849609375, 1.24951171875, 1.328277587890625, 1.40704345703125, 1.485809326171875, 1.5645751953125, 1.643341064453125, 1.72210693359375, 1.800872802734375, 1.879638671875, 1.958404541015625, 2.03717041015625, 2.115936279296875, 2.1947021484375, 2.273468017578125, 2.35223388671875, 2.430999755859375, 2.509765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 12.0, 12.0, 13.0, 31.0, 29.0, 55.0, 73.0, 108.0, 160.0, 250.0, 378.0, 539.0, 810.0, 1215.0, 1800.0, 2649.0, 4187.0, 6282.0, 10189.0, 16053.0, 26407.0, 45285.0, 80965.0, 152999.0, 254476.0, 196662.0, 104464.0, 56403.0, 32263.0, 19568.0, 11920.0, 7757.0, 5008.0, 3216.0, 2114.0, 1366.0, 929.0, 585.0, 437.0, 289.0, 178.0, 148.0, 78.0, 70.0, 40.0, 27.0, 22.0, 13.0, 11.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3486328125, -0.3379707336425781, -0.32730865478515625, -0.3166465759277344, -0.3059844970703125, -0.2953224182128906, -0.28466033935546875, -0.2739982604980469, -0.263336181640625, -0.2526741027832031, -0.24201202392578125, -0.23134994506835938, -0.2206878662109375, -0.21002578735351562, -0.19936370849609375, -0.18870162963867188, -0.17803955078125, -0.16737747192382812, -0.15671539306640625, -0.14605331420898438, -0.1353912353515625, -0.12472915649414062, -0.11406707763671875, -0.10340499877929688, -0.092742919921875, -0.08208084106445312, -0.07141876220703125, -0.060756683349609375, -0.0500946044921875, -0.039432525634765625, -0.02877044677734375, -0.018108367919921875, -0.0074462890625, 0.003215789794921875, 0.01387786865234375, 0.024539947509765625, 0.0352020263671875, 0.045864105224609375, 0.05652618408203125, 0.06718826293945312, 0.077850341796875, 0.08851242065429688, 0.09917449951171875, 0.10983657836914062, 0.1204986572265625, 0.13116073608398438, 0.14182281494140625, 0.15248489379882812, 0.16314697265625, 0.17380905151367188, 0.18447113037109375, 0.19513320922851562, 0.2057952880859375, 0.21645736694335938, 0.22711944580078125, 0.23778152465820312, 0.248443603515625, 0.2591056823730469, 0.26976776123046875, 0.2804298400878906, 0.2910919189453125, 0.3017539978027344, 0.31241607666015625, 0.3230781555175781, 0.333740234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 11.0, 7.0, 18.0, 18.0, 13.0, 13.0, 19.0, 23.0, 28.0, 19.0, 36.0, 26.0, 29.0, 32.0, 49.0, 34.0, 37.0, 46.0, 39.0, 1060.0, 34.0, 37.0, 35.0, 35.0, 40.0, 31.0, 35.0, 38.0, 23.0, 23.0, 13.0, 11.0, 16.0, 15.0, 11.0, 12.0, 15.0, 5.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.654296875, -1.6084747314453125, -1.562652587890625, -1.5168304443359375, -1.47100830078125, -1.4251861572265625, -1.379364013671875, -1.3335418701171875, -1.2877197265625, -1.2418975830078125, -1.196075439453125, -1.1502532958984375, -1.10443115234375, -1.0586090087890625, -1.012786865234375, -0.9669647216796875, -0.921142578125, -0.8753204345703125, -0.829498291015625, -0.7836761474609375, -0.73785400390625, -0.6920318603515625, -0.646209716796875, -0.6003875732421875, -0.5545654296875, -0.5087432861328125, -0.462921142578125, -0.4170989990234375, -0.37127685546875, -0.3254547119140625, -0.279632568359375, -0.2338104248046875, -0.18798828125, -0.1421661376953125, -0.096343994140625, -0.0505218505859375, -0.00469970703125, 0.0411224365234375, 0.086944580078125, 0.1327667236328125, 0.1785888671875, 0.2244110107421875, 0.270233154296875, 0.3160552978515625, 0.36187744140625, 0.4076995849609375, 0.453521728515625, 0.4993438720703125, 0.545166015625, 0.5909881591796875, 0.636810302734375, 0.6826324462890625, 0.72845458984375, 0.7742767333984375, 0.820098876953125, 0.8659210205078125, 0.9117431640625, 0.9575653076171875, 1.003387451171875, 1.0492095947265625, 1.09503173828125, 1.1408538818359375, 1.186676025390625, 1.2324981689453125, 1.2783203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 9.0, 18.0, 30.0, 51.0, 59.0, 86.0, 141.0, 203.0, 292.0, 441.0, 610.0, 845.0, 1360.0, 1963.0, 2870.0, 4421.0, 6768.0, 10332.0, 15876.0, 25939.0, 42274.0, 70788.0, 121251.0, 207640.0, 1246425.0, 133525.0, 78430.0, 46582.0, 28083.0, 17512.0, 10855.0, 7127.0, 4622.0, 3114.0, 2064.0, 1396.0, 932.0, 701.0, 464.0, 321.0, 244.0, 144.0, 111.0, 59.0, 48.0, 41.0, 17.0, 17.0, 11.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23499488830566406, -0.22743606567382812, -0.2198772430419922, -0.21231842041015625, -0.2047595977783203, -0.19720077514648438, -0.18964195251464844, -0.1820831298828125, -0.17452430725097656, -0.16696548461914062, -0.1594066619873047, -0.15184783935546875, -0.1442890167236328, -0.13673019409179688, -0.12917137145996094, -0.121612548828125, -0.11405372619628906, -0.10649490356445312, -0.09893608093261719, -0.09137725830078125, -0.08381843566894531, -0.07625961303710938, -0.06870079040527344, -0.0611419677734375, -0.05358314514160156, -0.046024322509765625, -0.03846549987792969, -0.03090667724609375, -0.023347854614257812, -0.015789031982421875, -0.008230209350585938, -0.00067138671875, 0.0068874359130859375, 0.014446258544921875, 0.022005081176757812, 0.02956390380859375, 0.03712272644042969, 0.044681549072265625, 0.05224037170410156, 0.0597991943359375, 0.06735801696777344, 0.07491683959960938, 0.08247566223144531, 0.09003448486328125, 0.09759330749511719, 0.10515213012695312, 0.11271095275878906, 0.120269775390625, 0.12782859802246094, 0.13538742065429688, 0.1429462432861328, 0.15050506591796875, 0.1580638885498047, 0.16562271118164062, 0.17318153381347656, 0.1807403564453125, 0.18829917907714844, 0.19585800170898438, 0.2034168243408203, 0.21097564697265625, 0.2185344696044922, 0.22609329223632812, 0.23365211486816406, 0.2412109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 5.0, 5.0, 7.0, 2.0, 5.0, 21.0, 11.0, 21.0, 27.0, 39.0, 54.0, 65.0, 95.0, 94.0, 101.0, 99.0, 93.0, 78.0, 44.0, 38.0, 23.0, 27.0, 15.0, 7.0, 4.0, 6.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00135040283203125, -0.0013047903776168823, -0.0012591779232025146, -0.001213565468788147, -0.0011679530143737793, -0.0011223405599594116, -0.001076728105545044, -0.0010311156511306763, -0.0009855031967163086, -0.0009398907423019409, -0.0008942782878875732, -0.0008486658334732056, -0.0008030533790588379, -0.0007574409246444702, -0.0007118284702301025, -0.0006662160158157349, -0.0006206035614013672, -0.0005749911069869995, -0.0005293786525726318, -0.00048376619815826416, -0.0004381537437438965, -0.0003925412893295288, -0.00034692883491516113, -0.00030131638050079346, -0.0002557039260864258, -0.0002100914716720581, -0.00016447901725769043, -0.00011886656284332275, -7.325410842895508e-05, -2.7641654014587402e-05, 1.7970800399780273e-05, 6.358325481414795e-05, 0.00010919570922851562, 0.0001548081636428833, 0.00020042061805725098, 0.00024603307247161865, 0.00029164552688598633, 0.000337257981300354, 0.0003828704357147217, 0.00042848289012908936, 0.00047409534454345703, 0.0005197077989578247, 0.0005653202533721924, 0.0006109327077865601, 0.0006565451622009277, 0.0007021576166152954, 0.0007477700710296631, 0.0007933825254440308, 0.0008389949798583984, 0.0008846074342727661, 0.0009302198886871338, 0.0009758323431015015, 0.0010214447975158691, 0.0010670572519302368, 0.0011126697063446045, 0.0011582821607589722, 0.0012038946151733398, 0.0012495070695877075, 0.0012951195240020752, 0.0013407319784164429, 0.0013863444328308105, 0.0014319568872451782, 0.001477569341659546, 0.0015231817960739136, 0.0015687942504882812]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 8.0, 5.0, 5.0, 13.0, 25.0, 38.0, 60.0, 107.0, 191.0, 463.0, 4357.0, 1039744.0, 2642.0, 421.0, 188.0, 81.0, 58.0, 41.0, 23.0, 24.0, 13.0, 11.0, 4.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03558349609375, -0.03455066680908203, -0.03351783752441406, -0.032485008239746094, -0.031452178955078125, -0.030419349670410156, -0.029386520385742188, -0.02835369110107422, -0.02732086181640625, -0.02628803253173828, -0.025255203247070312, -0.024222373962402344, -0.023189544677734375, -0.022156715393066406, -0.021123886108398438, -0.02009105682373047, -0.0190582275390625, -0.01802539825439453, -0.016992568969726562, -0.015959739685058594, -0.014926910400390625, -0.013894081115722656, -0.012861251831054688, -0.011828422546386719, -0.01079559326171875, -0.009762763977050781, -0.008729934692382812, -0.007697105407714844, -0.006664276123046875, -0.005631446838378906, -0.0045986175537109375, -0.0035657882690429688, -0.002532958984375, -0.0015001296997070312, -0.0004673004150390625, 0.0005655288696289062, 0.001598358154296875, 0.0026311874389648438, 0.0036640167236328125, 0.004696846008300781, 0.00572967529296875, 0.006762504577636719, 0.0077953338623046875, 0.008828163146972656, 0.009860992431640625, 0.010893821716308594, 0.011926651000976562, 0.012959480285644531, 0.0139923095703125, 0.015025138854980469, 0.016057968139648438, 0.017090797424316406, 0.018123626708984375, 0.019156455993652344, 0.020189285278320312, 0.02122211456298828, 0.02225494384765625, 0.02328777313232422, 0.024320602416992188, 0.025353431701660156, 0.026386260986328125, 0.027419090270996094, 0.028451919555664062, 0.02948474884033203, 0.030517578125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 31.0, 246.0, 491.0, 220.0, 24.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009341160766780376, -0.0008362005464732647, -0.0007382850162684917, -0.0006403694860637188, -0.0005424539558589458, -0.000444538367446512, -0.00034662283724173903, -0.0002487073070369661, -0.00015079177683219314, -5.287623935146257e-05, 4.503929812926799e-05, 0.00014295484288595617, 0.00024087037309072912, 0.0003387859323993325, 0.00043670146260410547, 0.0005346169928088784, 0.0006325325230136514, 0.0007304480532184243, 0.0008283635834231973, 0.0009262791136279702, 0.0010241946438327432, 0.001122110290452838, 0.001220025820657611, 0.0013179413508623838, 0.0014158568810671568, 0.0015137724112719297, 0.0016116879414767027, 0.0017096034716814756, 0.0018075190018862486, 0.0019054345320910215, 0.0020033500622957945, 0.0021012655925005674, 0.0021991811227053404, 0.0022970966529101133, 0.0023950121831148863, 0.0024929277133196592, 0.002590843243524432, 0.002688758773729205, 0.002786674303933978, 0.002884589834138751, 0.002982505364343524, 0.003080420894548297, 0.00317833642475307, 0.003276251954957843, 0.0033741674851626158, 0.0034720830153673887, 0.0035699985455721617, 0.0036679140757769346, 0.0037658298388123512, 0.003863745369017124, 0.003961660899221897, 0.00405957642942667, 0.004157491959631443, 0.004255407489836216, 0.004353323020040989, 0.004451238550245762, 0.004549154080450535, 0.004647069610655308, 0.004744985140860081, 0.004842900671064854, 0.004940816201269627, 0.0050387317314744, 0.0051366472616791725, 0.0052345627918839455, 0.005332478322088718]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 6.0, 7.0, 8.0, 6.0, 2.0, 12.0, 4.0, 17.0, 21.0, 18.0, 23.0, 16.0, 26.0, 20.0, 29.0, 26.0, 45.0, 34.0, 38.0, 41.0, 35.0, 36.0, 29.0, 41.0, 44.0, 34.0, 32.0, 29.0, 34.0, 37.0, 32.0, 23.0, 21.0, 32.0, 23.0, 16.0, 24.0, 18.0, 11.0, 18.0, 9.0, 5.0, 8.0, 5.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0005388259887695312, -0.0005229907110333443, -0.0005071554332971573, -0.0004913201555609703, -0.0004754848778247833, -0.00045964960008859634, -0.00044381432235240936, -0.0004279790446162224, -0.0004121437668800354, -0.0003963084891438484, -0.00038047321140766144, -0.00036463793367147446, -0.0003488026559352875, -0.0003329673781991005, -0.0003171321004629135, -0.00030129682272672653, -0.00028546154499053955, -0.00026962626725435257, -0.0002537909895181656, -0.0002379557117819786, -0.00022212043404579163, -0.00020628515630960464, -0.00019044987857341766, -0.00017461460083723068, -0.0001587793231010437, -0.00014294404536485672, -0.00012710876762866974, -0.00011127348989248276, -9.543821215629578e-05, -7.96029344201088e-05, -6.376765668392181e-05, -4.793237894773483e-05, -3.209710121154785e-05, -1.626182347536087e-05, -4.2654573917388916e-07, 1.5408731997013092e-05, 3.124400973320007e-05, 4.7079287469387054e-05, 6.291456520557404e-05, 7.874984294176102e-05, 9.4585120677948e-05, 0.00011042039841413498, 0.00012625567615032196, 0.00014209095388650894, 0.00015792623162269592, 0.0001737615093588829, 0.00018959678709506989, 0.00020543206483125687, 0.00022126734256744385, 0.00023710262030363083, 0.0002529378980398178, 0.0002687731757760048, 0.00028460845351219177, 0.00030044373124837875, 0.00031627900898456573, 0.0003321142867207527, 0.0003479495644569397, 0.0003637848421931267, 0.00037962011992931366, 0.00039545539766550064, 0.0004112906754016876, 0.0004271259531378746, 0.0004429612308740616, 0.00045879650861024857, 0.00047463178634643555]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 3.0, 20.0, 19.0, 22.0, 19.0, 26.0, 17.0, 29.0, 28.0, 33.0, 42.0, 33.0, 52.0, 51.0, 38.0, 40.0, 29.0, 41.0, 59.0, 33.0, 34.0, 25.0, 32.0, 45.0, 31.0, 27.0, 29.0, 23.0, 16.0, 15.0, 14.0, 12.0, 8.0, 10.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53125, -2.452484130859375, -2.37371826171875, -2.294952392578125, -2.2161865234375, -2.137420654296875, -2.05865478515625, -1.979888916015625, -1.901123046875, -1.822357177734375, -1.74359130859375, -1.664825439453125, -1.5860595703125, -1.507293701171875, -1.42852783203125, -1.349761962890625, -1.27099609375, -1.192230224609375, -1.11346435546875, -1.034698486328125, -0.9559326171875, -0.877166748046875, -0.79840087890625, -0.719635009765625, -0.640869140625, -0.562103271484375, -0.48333740234375, -0.404571533203125, -0.3258056640625, -0.247039794921875, -0.16827392578125, -0.089508056640625, -0.0107421875, 0.068023681640625, 0.14678955078125, 0.225555419921875, 0.3043212890625, 0.383087158203125, 0.46185302734375, 0.540618896484375, 0.619384765625, 0.698150634765625, 0.77691650390625, 0.855682373046875, 0.9344482421875, 1.013214111328125, 1.09197998046875, 1.170745849609375, 1.24951171875, 1.328277587890625, 1.40704345703125, 1.485809326171875, 1.5645751953125, 1.643341064453125, 1.72210693359375, 1.800872802734375, 1.879638671875, 1.958404541015625, 2.03717041015625, 2.115936279296875, 2.1947021484375, 2.273468017578125, 2.35223388671875, 2.430999755859375, 2.509765625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 7.0, 6.0, 6.0, 11.0, 22.0, 21.0, 26.0, 39.0, 60.0, 87.0, 144.0, 205.0, 331.0, 616.0, 1255.0, 2853.0, 6790.0, 16787.0, 43972.0, 114215.0, 288325.0, 345738.0, 138439.0, 53407.0, 20507.0, 8003.0, 3343.0, 1516.0, 763.0, 379.0, 257.0, 125.0, 75.0, 77.0, 38.0, 30.0, 31.0, 13.0, 11.0, 5.0, 9.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.81536865234375, -2.7186279296875, -2.62188720703125, -2.525146484375, -2.42840576171875, -2.3316650390625, -2.23492431640625, -2.13818359375, -2.04144287109375, -1.9447021484375, -1.84796142578125, -1.751220703125, -1.65447998046875, -1.5577392578125, -1.46099853515625, -1.3642578125, -1.26751708984375, -1.1707763671875, -1.07403564453125, -0.977294921875, -0.88055419921875, -0.7838134765625, -0.68707275390625, -0.59033203125, -0.49359130859375, -0.3968505859375, -0.30010986328125, -0.203369140625, -0.10662841796875, -0.0098876953125, 0.08685302734375, 0.18359375, 0.28033447265625, 0.3770751953125, 0.47381591796875, 0.570556640625, 0.66729736328125, 0.7640380859375, 0.86077880859375, 0.95751953125, 1.05426025390625, 1.1510009765625, 1.24774169921875, 1.344482421875, 1.44122314453125, 1.5379638671875, 1.63470458984375, 1.7314453125, 1.82818603515625, 1.9249267578125, 2.02166748046875, 2.118408203125, 2.21514892578125, 2.3118896484375, 2.40863037109375, 2.50537109375, 2.60211181640625, 2.6988525390625, 2.79559326171875, 2.892333984375, 2.98907470703125, 3.0858154296875, 3.18255615234375, 3.279296875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 6.0, 3.0, 10.0, 7.0, 18.0, 21.0, 24.0, 29.0, 32.0, 36.0, 53.0, 52.0, 67.0, 80.0, 160.0, 338.0, 1468.0, 188.0, 89.0, 75.0, 60.0, 40.0, 34.0, 28.0, 24.0, 24.0, 17.0, 11.0, 12.0, 10.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.9864501953125, -10.644775390625, -10.3031005859375, -9.96142578125, -9.6197509765625, -9.278076171875, -8.9364013671875, -8.5947265625, -8.2530517578125, -7.911376953125, -7.5697021484375, -7.22802734375, -6.8863525390625, -6.544677734375, -6.2030029296875, -5.861328125, -5.5196533203125, -5.177978515625, -4.8363037109375, -4.49462890625, -4.1529541015625, -3.811279296875, -3.4696044921875, -3.1279296875, -2.7862548828125, -2.444580078125, -2.1029052734375, -1.76123046875, -1.4195556640625, -1.077880859375, -0.7362060546875, -0.39453125, -0.0528564453125, 0.288818359375, 0.6304931640625, 0.97216796875, 1.3138427734375, 1.655517578125, 1.9971923828125, 2.3388671875, 2.6805419921875, 3.022216796875, 3.3638916015625, 3.70556640625, 4.0472412109375, 4.388916015625, 4.7305908203125, 5.072265625, 5.4139404296875, 5.755615234375, 6.0972900390625, 6.43896484375, 6.7806396484375, 7.122314453125, 7.4639892578125, 7.8056640625, 8.1473388671875, 8.489013671875, 8.8306884765625, 9.17236328125, 9.5140380859375, 9.855712890625, 10.1973876953125, 10.5390625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 3.0, 10.0, 6.0, 11.0, 13.0, 33.0, 27.0, 48.0, 63.0, 101.0, 158.0, 273.0, 576.0, 3309.0, 3104145.0, 34732.0, 1105.0, 437.0, 214.0, 152.0, 81.0, 57.0, 41.0, 19.0, 16.0, 11.0, 12.0, 15.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-50.6875, -49.22802734375, -47.7685546875, -46.30908203125, -44.849609375, -43.39013671875, -41.9306640625, -40.47119140625, -39.01171875, -37.55224609375, -36.0927734375, -34.63330078125, -33.173828125, -31.71435546875, -30.2548828125, -28.79541015625, -27.3359375, -25.87646484375, -24.4169921875, -22.95751953125, -21.498046875, -20.03857421875, -18.5791015625, -17.11962890625, -15.66015625, -14.20068359375, -12.7412109375, -11.28173828125, -9.822265625, -8.36279296875, -6.9033203125, -5.44384765625, -3.984375, -2.52490234375, -1.0654296875, 0.39404296875, 1.853515625, 3.31298828125, 4.7724609375, 6.23193359375, 7.69140625, 9.15087890625, 10.6103515625, 12.06982421875, 13.529296875, 14.98876953125, 16.4482421875, 17.90771484375, 19.3671875, 20.82666015625, 22.2861328125, 23.74560546875, 25.205078125, 26.66455078125, 28.1240234375, 29.58349609375, 31.04296875, 32.50244140625, 33.9619140625, 35.42138671875, 36.880859375, 38.34033203125, 39.7998046875, 41.25927734375, 42.71875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 85.0, 391.0, 415.0, 107.0, 9.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.1226806640625, -78.42129516601562, -76.71990203857422, -75.01851654052734, -73.31712341308594, -71.61573791503906, -69.91435241699219, -68.21295928955078, -66.5115737915039, -64.81018829345703, -63.108795166015625, -61.40740966796875, -59.70602035522461, -58.00463104248047, -56.303245544433594, -54.60185623168945, -52.90046691894531, -51.19907760620117, -49.49768829345703, -47.796302795410156, -46.094913482666016, -44.393524169921875, -42.692138671875, -40.99074935913086, -39.28936004638672, -37.58797073364258, -35.88658142089844, -34.18519592285156, -32.48380661010742, -30.78241729736328, -29.081029891967773, -27.379642486572266, -25.67825698852539, -23.97686767578125, -22.275480270385742, -20.574092864990234, -18.872703552246094, -17.171314239501953, -15.469926834106445, -13.768538475036621, -12.067150115966797, -10.365761756896973, -8.664373397827148, -6.962985038757324, -5.2615966796875, -3.560208320617676, -1.8588199615478516, -0.15743160247802734, 1.5439567565917969, 3.245345115661621, 4.946733474731445, 6.6481218338012695, 8.349510192871094, 10.050898551940918, 11.752286911010742, 13.453675270080566, 15.15506362915039, 16.85645294189453, 18.55784034729004, 20.259227752685547, 21.960617065429688, 23.662006378173828, 25.363393783569336, 27.064781188964844, 28.766170501708984]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 5.0, 4.0, 13.0, 16.0, 14.0, 15.0, 18.0, 27.0, 27.0, 21.0, 48.0, 43.0, 31.0, 47.0, 28.0, 43.0, 46.0, 53.0, 58.0, 39.0, 40.0, 53.0, 47.0, 45.0, 36.0, 30.0, 23.0, 21.0, 23.0, 15.0, 14.0, 12.0, 8.0, 11.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.709001541137695, -24.9377384185791, -24.166475296020508, -23.395212173461914, -22.62394905090332, -21.852684020996094, -21.0814208984375, -20.310157775878906, -19.538894653320312, -18.76763153076172, -17.996368408203125, -17.22510528564453, -16.453842163085938, -15.682578086853027, -14.911314964294434, -14.140050888061523, -13.368788719177246, -12.597525596618652, -11.826262474060059, -11.054998397827148, -10.283735275268555, -9.512472152709961, -8.741209030151367, -7.969945430755615, -7.1986823081970215, -6.427419185638428, -5.656155586242676, -4.884892463684082, -4.113629341125488, -3.3423657417297363, -2.5711026191711426, -1.7998390197753906, -1.0285758972167969, -0.2573125958442688, 0.5139507055282593, 1.2852139472961426, 2.0564773082733154, 2.8277406692504883, 3.599003791809082, 4.370267391204834, 5.141530513763428, 5.9127936363220215, 6.684057235717773, 7.455320358276367, 8.226583480834961, 8.997846603393555, 9.769109725952148, 10.540373802185059, 11.311636924743652, 12.082900047302246, 12.85416316986084, 13.62542724609375, 14.396690368652344, 15.167953491210938, 15.939216613769531, 16.710479736328125, 17.48174285888672, 18.253005981445312, 19.024269104003906, 19.7955322265625, 20.566795349121094, 21.338058471679688, 22.10932159423828, 22.880586624145508, 23.6518497467041]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 9.0, 8.0, 8.0, 8.0, 11.0, 11.0, 15.0, 26.0, 23.0, 23.0, 36.0, 34.0, 36.0, 34.0, 41.0, 43.0, 41.0, 55.0, 34.0, 50.0, 45.0, 34.0, 35.0, 39.0, 45.0, 33.0, 35.0, 37.0, 28.0, 25.0, 15.0, 13.0, 15.0, 12.0, 8.0, 2.0, 8.0, 11.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.168243408203125, -3.07476806640625, -2.981292724609375, -2.8878173828125, -2.794342041015625, -2.70086669921875, -2.607391357421875, -2.513916015625, -2.420440673828125, -2.32696533203125, -2.233489990234375, -2.1400146484375, -2.046539306640625, -1.95306396484375, -1.859588623046875, -1.76611328125, -1.672637939453125, -1.57916259765625, -1.485687255859375, -1.3922119140625, -1.298736572265625, -1.20526123046875, -1.111785888671875, -1.018310546875, -0.924835205078125, -0.83135986328125, -0.737884521484375, -0.6444091796875, -0.550933837890625, -0.45745849609375, -0.363983154296875, -0.2705078125, -0.177032470703125, -0.08355712890625, 0.009918212890625, 0.1033935546875, 0.196868896484375, 0.29034423828125, 0.383819580078125, 0.477294921875, 0.570770263671875, 0.66424560546875, 0.757720947265625, 0.8511962890625, 0.944671630859375, 1.03814697265625, 1.131622314453125, 1.22509765625, 1.318572998046875, 1.41204833984375, 1.505523681640625, 1.5989990234375, 1.692474365234375, 1.78594970703125, 1.879425048828125, 1.972900390625, 2.066375732421875, 2.15985107421875, 2.253326416015625, 2.3468017578125, 2.440277099609375, 2.53375244140625, 2.627227783203125, 2.720703125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 5.0, 7.0, 9.0, 9.0, 11.0, 16.0, 19.0, 28.0, 30.0, 42.0, 65.0, 104.0, 176.0, 278.0, 574.0, 1880.0, 12743.0, 169219.0, 1567401.0, 2091644.0, 321558.0, 23367.0, 3103.0, 893.0, 416.0, 199.0, 146.0, 107.0, 60.0, 39.0, 32.0, 20.0, 14.0, 16.0, 11.0, 12.0, 3.0, 8.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.26171875, -7.06610107421875, -6.8704833984375, -6.67486572265625, -6.479248046875, -6.28363037109375, -6.0880126953125, -5.89239501953125, -5.69677734375, -5.50115966796875, -5.3055419921875, -5.10992431640625, -4.914306640625, -4.71868896484375, -4.5230712890625, -4.32745361328125, -4.1318359375, -3.93621826171875, -3.7406005859375, -3.54498291015625, -3.349365234375, -3.15374755859375, -2.9581298828125, -2.76251220703125, -2.56689453125, -2.37127685546875, -2.1756591796875, -1.98004150390625, -1.784423828125, -1.58880615234375, -1.3931884765625, -1.19757080078125, -1.001953125, -0.80633544921875, -0.6107177734375, -0.41510009765625, -0.219482421875, -0.02386474609375, 0.1717529296875, 0.36737060546875, 0.56298828125, 0.75860595703125, 0.9542236328125, 1.14984130859375, 1.345458984375, 1.54107666015625, 1.7366943359375, 1.93231201171875, 2.1279296875, 2.32354736328125, 2.5191650390625, 2.71478271484375, 2.910400390625, 3.10601806640625, 3.3016357421875, 3.49725341796875, 3.69287109375, 3.88848876953125, 4.0841064453125, 4.27972412109375, 4.475341796875, 4.67095947265625, 4.8665771484375, 5.06219482421875, 5.2578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 10.0, 16.0, 14.0, 18.0, 25.0, 31.0, 35.0, 60.0, 78.0, 95.0, 119.0, 152.0, 217.0, 262.0, 345.0, 346.0, 355.0, 401.0, 316.0, 279.0, 211.0, 169.0, 126.0, 79.0, 75.0, 52.0, 47.0, 28.0, 28.0, 22.0, 17.0, 7.0, 9.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.40985107421875, -4.2493896484375, -4.08892822265625, -3.928466796875, -3.76800537109375, -3.6075439453125, -3.44708251953125, -3.28662109375, -3.12615966796875, -2.9656982421875, -2.80523681640625, -2.644775390625, -2.48431396484375, -2.3238525390625, -2.16339111328125, -2.0029296875, -1.84246826171875, -1.6820068359375, -1.52154541015625, -1.361083984375, -1.20062255859375, -1.0401611328125, -0.87969970703125, -0.71923828125, -0.55877685546875, -0.3983154296875, -0.23785400390625, -0.077392578125, 0.08306884765625, 0.2435302734375, 0.40399169921875, 0.564453125, 0.72491455078125, 0.8853759765625, 1.04583740234375, 1.206298828125, 1.36676025390625, 1.5272216796875, 1.68768310546875, 1.84814453125, 2.00860595703125, 2.1690673828125, 2.32952880859375, 2.489990234375, 2.65045166015625, 2.8109130859375, 2.97137451171875, 3.1318359375, 3.29229736328125, 3.4527587890625, 3.61322021484375, 3.773681640625, 3.93414306640625, 4.0946044921875, 4.25506591796875, 4.41552734375, 4.57598876953125, 4.7364501953125, 4.89691162109375, 5.057373046875, 5.21783447265625, 5.3782958984375, 5.53875732421875, 5.69921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 11.0, 13.0, 11.0, 25.0, 40.0, 38.0, 45.0, 75.0, 98.0, 122.0, 188.0, 262.0, 370.0, 643.0, 5744.0, 677859.0, 3456165.0, 49792.0, 1229.0, 449.0, 301.0, 202.0, 140.0, 114.0, 90.0, 65.0, 44.0, 32.0, 21.0, 26.0, 15.0, 13.0, 7.0, 8.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-20.125, -19.5697021484375, -19.014404296875, -18.4591064453125, -17.90380859375, -17.3485107421875, -16.793212890625, -16.2379150390625, -15.6826171875, -15.1273193359375, -14.572021484375, -14.0167236328125, -13.46142578125, -12.9061279296875, -12.350830078125, -11.7955322265625, -11.240234375, -10.6849365234375, -10.129638671875, -9.5743408203125, -9.01904296875, -8.4637451171875, -7.908447265625, -7.3531494140625, -6.7978515625, -6.2425537109375, -5.687255859375, -5.1319580078125, -4.57666015625, -4.0213623046875, -3.466064453125, -2.9107666015625, -2.35546875, -1.8001708984375, -1.244873046875, -0.6895751953125, -0.13427734375, 0.4210205078125, 0.976318359375, 1.5316162109375, 2.0869140625, 2.6422119140625, 3.197509765625, 3.7528076171875, 4.30810546875, 4.8634033203125, 5.418701171875, 5.9739990234375, 6.529296875, 7.0845947265625, 7.639892578125, 8.1951904296875, 8.75048828125, 9.3057861328125, 9.861083984375, 10.4163818359375, 10.9716796875, 11.5269775390625, 12.082275390625, 12.6375732421875, 13.19287109375, 13.7481689453125, 14.303466796875, 14.8587646484375, 15.4140625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 21.0, 27.0, 43.0, 74.0, 119.0, 122.0, 125.0, 112.0, 106.0, 85.0, 62.0, 51.0, 27.0, 11.0, 11.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96943664550781, -38.07806396484375, -37.18669509887695, -36.29532241821289, -35.403953552246094, -34.51258087158203, -33.621212005615234, -32.72983932495117, -31.838468551635742, -30.947097778320312, -30.055727005004883, -29.164356231689453, -28.27298355102539, -27.381614685058594, -26.49024200439453, -25.5988712310791, -24.707500457763672, -23.816129684448242, -22.924758911132812, -22.033388137817383, -21.142017364501953, -20.25064468383789, -19.35927391052246, -18.46790313720703, -17.5765323638916, -16.685161590576172, -15.793790817260742, -14.902419090270996, -14.011048316955566, -13.119677543640137, -12.22830581665039, -11.336935043334961, -10.445564270019531, -9.554193496704102, -8.662822723388672, -7.771450996398926, -6.880080223083496, -5.988709449768066, -5.0973381996154785, -4.205966949462891, -3.314596176147461, -2.423225164413452, -1.5318541526794434, -0.6404831409454346, 0.2508878707885742, 1.142258644104004, 2.033629894256592, 2.9250011444091797, 3.8163719177246094, 4.707742691040039, 5.599113941192627, 6.490485191345215, 7.3818559646606445, 8.273226737976074, 9.16459846496582, 10.05596923828125, 10.94734001159668, 11.83871078491211, 12.730081558227539, 13.621453285217285, 14.512824058532715, 15.404194831848145, 16.29556655883789, 17.18693733215332, 18.07830810546875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 8.0, 8.0, 11.0, 6.0, 12.0, 17.0, 16.0, 16.0, 28.0, 17.0, 19.0, 23.0, 31.0, 22.0, 35.0, 34.0, 49.0, 43.0, 49.0, 35.0, 43.0, 44.0, 50.0, 62.0, 31.0, 42.0, 45.0, 31.0, 26.0, 23.0, 35.0, 26.0, 14.0, 16.0, 8.0, 5.0, 6.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.916261672973633, -19.291183471679688, -18.666105270385742, -18.041027069091797, -17.41594886779785, -16.790870666503906, -16.16579246520996, -15.5407133102417, -14.915635108947754, -14.290556907653809, -13.665478706359863, -13.040400505065918, -12.415321350097656, -11.790243148803711, -11.165164947509766, -10.54008674621582, -9.915008544921875, -9.28993034362793, -8.664852142333984, -8.039773941040039, -7.4146952629089355, -6.78961706161499, -6.164538383483887, -5.539460182189941, -4.914381980895996, -4.289303779602051, -3.6642253398895264, -3.039146900177002, -2.4140686988830566, -1.7889904975891113, -1.163912057876587, -0.5388336181640625, 0.08624267578125, 0.7113209962844849, 1.3363993167877197, 1.9614776372909546, 2.5865559577941895, 3.2116341590881348, 3.836712598800659, 4.461791038513184, 5.086869239807129, 5.711947441101074, 6.3370256423950195, 6.962104320526123, 7.587182521820068, 8.212261199951172, 8.837339401245117, 9.462417602539062, 10.087495803833008, 10.712574005126953, 11.337652206420898, 11.962730407714844, 12.587808609008789, 13.212886810302734, 13.837965965270996, 14.463044166564941, 15.088122367858887, 15.713200569152832, 16.338279724121094, 16.96335792541504, 17.588436126708984, 18.21351432800293, 18.838592529296875, 19.46367073059082, 20.088748931884766]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 9.0, 14.0, 17.0, 24.0, 20.0, 23.0, 14.0, 29.0, 30.0, 40.0, 27.0, 43.0, 30.0, 35.0, 59.0, 45.0, 45.0, 47.0, 41.0, 37.0, 33.0, 29.0, 36.0, 38.0, 37.0, 19.0, 29.0, 20.0, 15.0, 23.0, 17.0, 5.0, 10.0, 9.0, 4.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.833221435546875, -2.74847412109375, -2.663726806640625, -2.5789794921875, -2.494232177734375, -2.40948486328125, -2.324737548828125, -2.239990234375, -2.155242919921875, -2.07049560546875, -1.985748291015625, -1.9010009765625, -1.816253662109375, -1.73150634765625, -1.646759033203125, -1.56201171875, -1.477264404296875, -1.39251708984375, -1.307769775390625, -1.2230224609375, -1.138275146484375, -1.05352783203125, -0.968780517578125, -0.884033203125, -0.799285888671875, -0.71453857421875, -0.629791259765625, -0.5450439453125, -0.460296630859375, -0.37554931640625, -0.290802001953125, -0.2060546875, -0.121307373046875, -0.03656005859375, 0.048187255859375, 0.1329345703125, 0.217681884765625, 0.30242919921875, 0.387176513671875, 0.471923828125, 0.556671142578125, 0.64141845703125, 0.726165771484375, 0.8109130859375, 0.895660400390625, 0.98040771484375, 1.065155029296875, 1.14990234375, 1.234649658203125, 1.31939697265625, 1.404144287109375, 1.4888916015625, 1.573638916015625, 1.65838623046875, 1.743133544921875, 1.827880859375, 1.912628173828125, 1.99737548828125, 2.082122802734375, 2.1668701171875, 2.251617431640625, 2.33636474609375, 2.421112060546875, 2.505859375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 8.0, 4.0, 10.0, 7.0, 23.0, 22.0, 48.0, 48.0, 96.0, 156.0, 240.0, 376.0, 583.0, 945.0, 1602.0, 2642.0, 4175.0, 7143.0, 12092.0, 21835.0, 40398.0, 78425.0, 161323.0, 285185.0, 212234.0, 102817.0, 51582.0, 27411.0, 15127.0, 8773.0, 5137.0, 3120.0, 1864.0, 1135.0, 702.0, 450.0, 269.0, 199.0, 104.0, 82.0, 51.0, 43.0, 27.0, 15.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.403564453125, -0.3904151916503906, -0.37726593017578125, -0.3641166687011719, -0.3509674072265625, -0.3378181457519531, -0.32466888427734375, -0.3115196228027344, -0.298370361328125, -0.2852210998535156, -0.27207183837890625, -0.2589225769042969, -0.2457733154296875, -0.23262405395507812, -0.21947479248046875, -0.20632553100585938, -0.19317626953125, -0.18002700805664062, -0.16687774658203125, -0.15372848510742188, -0.1405792236328125, -0.12742996215820312, -0.11428070068359375, -0.10113143920898438, -0.087982177734375, -0.07483291625976562, -0.06168365478515625, -0.048534393310546875, -0.0353851318359375, -0.022235870361328125, -0.00908660888671875, 0.004062652587890625, 0.0172119140625, 0.030361175537109375, 0.04351043701171875, 0.056659698486328125, 0.0698089599609375, 0.08295822143554688, 0.09610748291015625, 0.10925674438476562, 0.122406005859375, 0.13555526733398438, 0.14870452880859375, 0.16185379028320312, 0.1750030517578125, 0.18815231323242188, 0.20130157470703125, 0.21445083618164062, 0.22760009765625, 0.24074935913085938, 0.25389862060546875, 0.2670478820800781, 0.2801971435546875, 0.2933464050292969, 0.30649566650390625, 0.3196449279785156, 0.332794189453125, 0.3459434509277344, 0.35909271240234375, 0.3722419738769531, 0.3853912353515625, 0.3985404968261719, 0.41168975830078125, 0.4248390197753906, 0.43798828125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 6.0, 2.0, 7.0, 2.0, 11.0, 4.0, 7.0, 8.0, 13.0, 19.0, 22.0, 16.0, 24.0, 33.0, 27.0, 30.0, 30.0, 27.0, 29.0, 32.0, 29.0, 30.0, 55.0, 1065.0, 42.0, 36.0, 38.0, 31.0, 32.0, 35.0, 34.0, 30.0, 34.0, 29.0, 26.0, 19.0, 22.0, 22.0, 11.0, 16.0, 9.0, 7.0, 7.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.66015625, -1.6111907958984375, -1.562225341796875, -1.5132598876953125, -1.46429443359375, -1.4153289794921875, -1.366363525390625, -1.3173980712890625, -1.2684326171875, -1.2194671630859375, -1.170501708984375, -1.1215362548828125, -1.07257080078125, -1.0236053466796875, -0.974639892578125, -0.9256744384765625, -0.876708984375, -0.8277435302734375, -0.778778076171875, -0.7298126220703125, -0.68084716796875, -0.6318817138671875, -0.582916259765625, -0.5339508056640625, -0.4849853515625, -0.4360198974609375, -0.387054443359375, -0.3380889892578125, -0.28912353515625, -0.2401580810546875, -0.191192626953125, -0.1422271728515625, -0.09326171875, -0.0442962646484375, 0.004669189453125, 0.0536346435546875, 0.10260009765625, 0.1515655517578125, 0.200531005859375, 0.2494964599609375, 0.2984619140625, 0.3474273681640625, 0.396392822265625, 0.4453582763671875, 0.49432373046875, 0.5432891845703125, 0.592254638671875, 0.6412200927734375, 0.690185546875, 0.7391510009765625, 0.788116455078125, 0.8370819091796875, 0.88604736328125, 0.9350128173828125, 0.983978271484375, 1.0329437255859375, 1.0819091796875, 1.1308746337890625, 1.179840087890625, 1.2288055419921875, 1.27777099609375, 1.3267364501953125, 1.375701904296875, 1.4246673583984375, 1.4736328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 11.0, 9.0, 10.0, 18.0, 13.0, 28.0, 43.0, 43.0, 68.0, 103.0, 140.0, 199.0, 258.0, 361.0, 525.0, 785.0, 1067.0, 1631.0, 2263.0, 3392.0, 5170.0, 7298.0, 11029.0, 16830.0, 25805.0, 40403.0, 64591.0, 106233.0, 169144.0, 1248722.0, 145965.0, 89408.0, 54448.0, 34423.0, 21934.0, 14374.0, 9681.0, 6307.0, 4352.0, 3106.0, 2057.0, 1479.0, 1068.0, 682.0, 517.0, 375.0, 254.0, 171.0, 117.0, 94.0, 51.0, 33.0, 22.0, 8.0, 13.0, 7.0, 1.0, 2.0, 3.0], "bins": [-0.2403564453125, -0.2333545684814453, -0.22635269165039062, -0.21935081481933594, -0.21234893798828125, -0.20534706115722656, -0.19834518432617188, -0.1913433074951172, -0.1843414306640625, -0.1773395538330078, -0.17033767700195312, -0.16333580017089844, -0.15633392333984375, -0.14933204650878906, -0.14233016967773438, -0.1353282928466797, -0.128326416015625, -0.12132453918457031, -0.11432266235351562, -0.10732078552246094, -0.10031890869140625, -0.09331703186035156, -0.08631515502929688, -0.07931327819824219, -0.0723114013671875, -0.06530952453613281, -0.058307647705078125, -0.05130577087402344, -0.04430389404296875, -0.03730201721191406, -0.030300140380859375, -0.023298263549804688, -0.01629638671875, -0.009294509887695312, -0.002292633056640625, 0.0047092437744140625, 0.01171112060546875, 0.018712997436523438, 0.025714874267578125, 0.03271675109863281, 0.0397186279296875, 0.04672050476074219, 0.053722381591796875, 0.06072425842285156, 0.06772613525390625, 0.07472801208496094, 0.08172988891601562, 0.08873176574707031, 0.095733642578125, 0.10273551940917969, 0.10973739624023438, 0.11673927307128906, 0.12374114990234375, 0.13074302673339844, 0.13774490356445312, 0.1447467803955078, 0.1517486572265625, 0.1587505340576172, 0.16575241088867188, 0.17275428771972656, 0.17975616455078125, 0.18675804138183594, 0.19375991821289062, 0.2007617950439453, 0.207763671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 9.0, 24.0, 20.0, 27.0, 30.0, 46.0, 58.0, 58.0, 58.0, 65.0, 73.0, 66.0, 65.0, 59.0, 47.0, 58.0, 43.0, 31.0, 24.0, 31.0, 23.0, 15.0, 13.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009121894836425781, -0.0008810833096504211, -0.0008499771356582642, -0.0008188709616661072, -0.0007877647876739502, -0.0007566586136817932, -0.0007255524396896362, -0.0006944462656974792, -0.0006633400917053223, -0.0006322339177131653, -0.0006011277437210083, -0.0005700215697288513, -0.0005389153957366943, -0.0005078092217445374, -0.00047670304775238037, -0.0004455968737602234, -0.0004144906997680664, -0.0003833845257759094, -0.00035227835178375244, -0.00032117217779159546, -0.0002900660037994385, -0.0002589598298072815, -0.0002278536558151245, -0.00019674748182296753, -0.00016564130783081055, -0.00013453513383865356, -0.00010342895984649658, -7.23227858543396e-05, -4.121661186218262e-05, -1.0110437870025635e-05, 2.0995736122131348e-05, 5.210191011428833e-05, 8.320808410644531e-05, 0.0001143142580986023, 0.00014542043209075928, 0.00017652660608291626, 0.00020763278007507324, 0.00023873895406723022, 0.0002698451280593872, 0.0003009513020515442, 0.00033205747604370117, 0.00036316365003585815, 0.00039426982402801514, 0.0004253759980201721, 0.0004564821720123291, 0.0004875883460044861, 0.0005186945199966431, 0.0005498006939888, 0.000580906867980957, 0.000612013041973114, 0.000643119215965271, 0.000674225389957428, 0.000705331563949585, 0.0007364377379417419, 0.0007675439119338989, 0.0007986500859260559, 0.0008297562599182129, 0.0008608624339103699, 0.0008919686079025269, 0.0009230747818946838, 0.0009541809558868408, 0.0009852871298789978, 0.0010163933038711548, 0.0010474994778633118, 0.0010786056518554688]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 19.0, 16.0, 21.0, 32.0, 31.0, 54.0, 84.0, 112.0, 187.0, 304.0, 967.0, 75129.0, 967083.0, 3248.0, 553.0, 221.0, 141.0, 95.0, 61.0, 51.0, 37.0, 23.0, 17.0, 10.0, 10.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228118896484375, -0.022145509719848633, -0.021479129791259766, -0.0208127498626709, -0.02014636993408203, -0.019479990005493164, -0.018813610076904297, -0.01814723014831543, -0.017480850219726562, -0.016814470291137695, -0.016148090362548828, -0.015481710433959961, -0.014815330505371094, -0.014148950576782227, -0.01348257064819336, -0.012816190719604492, -0.012149810791015625, -0.011483430862426758, -0.01081705093383789, -0.010150671005249023, -0.009484291076660156, -0.008817911148071289, -0.008151531219482422, -0.007485151290893555, -0.0068187713623046875, -0.00615239143371582, -0.005486011505126953, -0.004819631576538086, -0.004153251647949219, -0.0034868717193603516, -0.0028204917907714844, -0.002154111862182617, -0.00148773193359375, -0.0008213520050048828, -0.00015497207641601562, 0.0005114078521728516, 0.0011777877807617188, 0.001844167709350586, 0.002510547637939453, 0.0031769275665283203, 0.0038433074951171875, 0.004509687423706055, 0.005176067352294922, 0.005842447280883789, 0.006508827209472656, 0.0071752071380615234, 0.00784158706665039, 0.008507966995239258, 0.009174346923828125, 0.009840726852416992, 0.01050710678100586, 0.011173486709594727, 0.011839866638183594, 0.012506246566772461, 0.013172626495361328, 0.013839006423950195, 0.014505386352539062, 0.01517176628112793, 0.015838146209716797, 0.016504526138305664, 0.01717090606689453, 0.0178372859954834, 0.018503665924072266, 0.019170045852661133, 0.01983642578125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 35.0, 86.0, 156.0, 219.0, 240.0, 146.0, 62.0, 35.0, 15.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0021842936985194683, -0.0021414197981357574, -0.0020985458977520466, -0.002055671764537692, -0.002012797864153981, -0.0019699239637702703, -0.0019270499469712377, -0.001884175930172205, -0.0018413020297884941, -0.0017984281294047832, -0.0017555541126057506, -0.0017126800958067179, -0.001669806195423007, -0.0016269322950392962, -0.0015840582782402635, -0.0015411842614412308, -0.00149831036105752, -0.001455436460673809, -0.0014125624438747764, -0.0013696884270757437, -0.0013268145266920328, -0.001283940626308322, -0.0012410666095092893, -0.0011981925927102566, -0.0011553186923265457, -0.0011124447919428349, -0.0010695707751438022, -0.0010266967583447695, -0.0009838228579610586, -0.0009409488993696868, -0.0008980749407783151, -0.0008552009821869433, -0.0008123270235955715, -0.0007694530650041997, -0.000726579106412828, -0.0006837051478214562, -0.0006408311892300844, -0.0005979572306387126, -0.0005550832720473409, -0.0005122093134559691, -0.0004693353548645973, -0.00042646139627322555, -0.00038358743768185377, -0.000340713479090482, -0.0002978395204991102, -0.00025496556190773845, -0.00021209160331636667, -0.0001692176447249949, -0.00012634368613362312, -8.346972754225135e-05, -4.0595768950879574e-05, 2.278189640492201e-06, 4.5152148231863976e-05, 8.802610682323575e-05, 0.00013090006541460752, 0.0001737740240059793, 0.00021664798259735107, 0.00025952194118872285, 0.0003023958997800946, 0.0003452698583714664, 0.0003881438169628382, 0.00043101777555420995, 0.0004738917341455817, 0.0005167656927369535, 0.0005596396513283253]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 8.0, 6.0, 9.0, 11.0, 12.0, 15.0, 15.0, 31.0, 20.0, 26.0, 25.0, 29.0, 29.0, 43.0, 45.0, 35.0, 37.0, 45.0, 42.0, 36.0, 39.0, 34.0, 34.0, 42.0, 34.0, 27.0, 54.0, 29.0, 19.0, 20.0, 17.0, 11.0, 22.0, 16.0, 9.0, 13.0, 14.0, 6.0, 8.0, 4.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 4.0], "bins": [-0.0004981160163879395, -0.00048444420099258423, -0.000470772385597229, -0.0004571005702018738, -0.00044342875480651855, -0.00042975693941116333, -0.0004160851240158081, -0.0004024133086204529, -0.00038874149322509766, -0.00037506967782974243, -0.0003613978624343872, -0.000347726047039032, -0.00033405423164367676, -0.00032038241624832153, -0.0003067106008529663, -0.0002930387854576111, -0.00027936697006225586, -0.00026569515466690063, -0.0002520233392715454, -0.00023835152387619019, -0.00022467970848083496, -0.00021100789308547974, -0.0001973360776901245, -0.0001836642622947693, -0.00016999244689941406, -0.00015632063150405884, -0.0001426488161087036, -0.0001289770007133484, -0.00011530518531799316, -0.00010163336992263794, -8.796155452728271e-05, -7.428973913192749e-05, -6.0617923736572266e-05, -4.694610834121704e-05, -3.3274292945861816e-05, -1.9602477550506592e-05, -5.930662155151367e-06, 7.741153240203857e-06, 2.1412968635559082e-05, 3.508478403091431e-05, 4.875659942626953e-05, 6.242841482162476e-05, 7.610023021697998e-05, 8.97720456123352e-05, 0.00010344386100769043, 0.00011711567640304565, 0.00013078749179840088, 0.0001444593071937561, 0.00015813112258911133, 0.00017180293798446655, 0.00018547475337982178, 0.000199146568775177, 0.00021281838417053223, 0.00022649019956588745, 0.00024016201496124268, 0.0002538338303565979, 0.0002675056457519531, 0.00028117746114730835, 0.0002948492765426636, 0.0003085210919380188, 0.000322192907333374, 0.00033586472272872925, 0.00034953653812408447, 0.0003632083535194397, 0.0003768801689147949]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 9.0, 9.0, 14.0, 17.0, 24.0, 20.0, 23.0, 14.0, 29.0, 30.0, 40.0, 27.0, 43.0, 30.0, 35.0, 59.0, 45.0, 45.0, 47.0, 41.0, 37.0, 33.0, 29.0, 36.0, 38.0, 37.0, 19.0, 29.0, 20.0, 15.0, 23.0, 17.0, 5.0, 10.0, 9.0, 4.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.91796875, -2.833221435546875, -2.74847412109375, -2.663726806640625, -2.5789794921875, -2.494232177734375, -2.40948486328125, -2.324737548828125, -2.239990234375, -2.155242919921875, -2.07049560546875, -1.985748291015625, -1.9010009765625, -1.816253662109375, -1.73150634765625, -1.646759033203125, -1.56201171875, -1.477264404296875, -1.39251708984375, -1.307769775390625, -1.2230224609375, -1.138275146484375, -1.05352783203125, -0.968780517578125, -0.884033203125, -0.799285888671875, -0.71453857421875, -0.629791259765625, -0.5450439453125, -0.460296630859375, -0.37554931640625, -0.290802001953125, -0.2060546875, -0.121307373046875, -0.03656005859375, 0.048187255859375, 0.1329345703125, 0.217681884765625, 0.30242919921875, 0.387176513671875, 0.471923828125, 0.556671142578125, 0.64141845703125, 0.726165771484375, 0.8109130859375, 0.895660400390625, 0.98040771484375, 1.065155029296875, 1.14990234375, 1.234649658203125, 1.31939697265625, 1.404144287109375, 1.4888916015625, 1.573638916015625, 1.65838623046875, 1.743133544921875, 1.827880859375, 1.912628173828125, 1.99737548828125, 2.082122802734375, 2.1668701171875, 2.251617431640625, 2.33636474609375, 2.421112060546875, 2.505859375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 13.0, 10.0, 27.0, 30.0, 36.0, 45.0, 57.0, 92.0, 146.0, 226.0, 287.0, 516.0, 859.0, 1723.0, 3544.0, 7670.0, 17826.0, 43080.0, 100576.0, 223185.0, 359306.0, 162182.0, 72278.0, 30401.0, 12850.0, 5663.0, 2611.0, 1343.0, 711.0, 431.0, 238.0, 172.0, 107.0, 76.0, 53.0, 47.0, 38.0, 32.0, 19.0, 12.0, 9.0, 8.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8203125, -2.735626220703125, -2.65093994140625, -2.566253662109375, -2.4815673828125, -2.396881103515625, -2.31219482421875, -2.227508544921875, -2.142822265625, -2.058135986328125, -1.97344970703125, -1.888763427734375, -1.8040771484375, -1.719390869140625, -1.63470458984375, -1.550018310546875, -1.46533203125, -1.380645751953125, -1.29595947265625, -1.211273193359375, -1.1265869140625, -1.041900634765625, -0.95721435546875, -0.872528076171875, -0.787841796875, -0.703155517578125, -0.61846923828125, -0.533782958984375, -0.4490966796875, -0.364410400390625, -0.27972412109375, -0.195037841796875, -0.1103515625, -0.025665283203125, 0.05902099609375, 0.143707275390625, 0.2283935546875, 0.313079833984375, 0.39776611328125, 0.482452392578125, 0.567138671875, 0.651824951171875, 0.73651123046875, 0.821197509765625, 0.9058837890625, 0.990570068359375, 1.07525634765625, 1.159942626953125, 1.24462890625, 1.329315185546875, 1.41400146484375, 1.498687744140625, 1.5833740234375, 1.668060302734375, 1.75274658203125, 1.837432861328125, 1.922119140625, 2.006805419921875, 2.09149169921875, 2.176177978515625, 2.2608642578125, 2.345550537109375, 2.43023681640625, 2.514923095703125, 2.599609375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 10.0, 10.0, 11.0, 6.0, 16.0, 21.0, 11.0, 13.0, 27.0, 28.0, 29.0, 31.0, 45.0, 33.0, 69.0, 76.0, 109.0, 244.0, 1452.0, 238.0, 109.0, 59.0, 53.0, 39.0, 54.0, 30.0, 23.0, 32.0, 29.0, 24.0, 20.0, 20.0, 14.0, 8.0, 7.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.109375, -8.820556640625, -8.53173828125, -8.242919921875, -7.9541015625, -7.665283203125, -7.37646484375, -7.087646484375, -6.798828125, -6.510009765625, -6.22119140625, -5.932373046875, -5.6435546875, -5.354736328125, -5.06591796875, -4.777099609375, -4.48828125, -4.199462890625, -3.91064453125, -3.621826171875, -3.3330078125, -3.044189453125, -2.75537109375, -2.466552734375, -2.177734375, -1.888916015625, -1.60009765625, -1.311279296875, -1.0224609375, -0.733642578125, -0.44482421875, -0.156005859375, 0.1328125, 0.421630859375, 0.71044921875, 0.999267578125, 1.2880859375, 1.576904296875, 1.86572265625, 2.154541015625, 2.443359375, 2.732177734375, 3.02099609375, 3.309814453125, 3.5986328125, 3.887451171875, 4.17626953125, 4.465087890625, 4.75390625, 5.042724609375, 5.33154296875, 5.620361328125, 5.9091796875, 6.197998046875, 6.48681640625, 6.775634765625, 7.064453125, 7.353271484375, 7.64208984375, 7.930908203125, 8.2197265625, 8.508544921875, 8.79736328125, 9.086181640625, 9.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 6.0, 7.0, 6.0, 14.0, 12.0, 19.0, 23.0, 35.0, 57.0, 82.0, 123.0, 238.0, 557.0, 2886.0, 3120670.0, 19133.0, 978.0, 337.0, 189.0, 98.0, 80.0, 39.0, 40.0, 24.0, 21.0, 14.0, 1.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.953125, -60.21875, -58.484375, -56.75, -55.015625, -53.28125, -51.546875, -49.8125, -48.078125, -46.34375, -44.609375, -42.875, -41.140625, -39.40625, -37.671875, -35.9375, -34.203125, -32.46875, -30.734375, -29.0, -27.265625, -25.53125, -23.796875, -22.0625, -20.328125, -18.59375, -16.859375, -15.125, -13.390625, -11.65625, -9.921875, -8.1875, -6.453125, -4.71875, -2.984375, -1.25, 0.484375, 2.21875, 3.953125, 5.6875, 7.421875, 9.15625, 10.890625, 12.625, 14.359375, 16.09375, 17.828125, 19.5625, 21.296875, 23.03125, 24.765625, 26.5, 28.234375, 29.96875, 31.703125, 33.4375, 35.171875, 36.90625, 38.640625, 40.375, 42.109375, 43.84375, 45.578125, 47.3125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 20.0, 102.0, 234.0, 331.0, 227.0, 79.0, 15.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.53334045410156, -53.475311279296875, -52.41728210449219, -51.359256744384766, -50.30122756958008, -49.24319839477539, -48.18517303466797, -47.12714385986328, -46.069114685058594, -45.011085510253906, -43.95305633544922, -42.8950309753418, -41.83700180053711, -40.77897262573242, -39.720947265625, -38.66291809082031, -37.604888916015625, -36.54685974121094, -35.48883056640625, -34.43080520629883, -33.37277603149414, -32.31474685668945, -31.2567195892334, -30.198692321777344, -29.140663146972656, -28.08263397216797, -27.024606704711914, -25.96657943725586, -24.908550262451172, -23.850521087646484, -22.79249382019043, -21.734466552734375, -20.676433563232422, -19.618404388427734, -18.56037712097168, -17.502349853515625, -16.444320678710938, -15.386292457580566, -14.328264236450195, -13.270236015319824, -12.21220874786377, -11.154180526733398, -10.096152305603027, -9.038124084472656, -7.980095863342285, -6.922067642211914, -5.864039421081543, -4.806011199951172, -3.747982978820801, -2.6899547576904297, -1.6319265365600586, -0.5738983154296875, 0.4841299057006836, 1.5421581268310547, 2.600186347961426, 3.658214569091797, 4.716242790222168, 5.774271011352539, 6.83229923248291, 7.890327453613281, 8.948355674743652, 10.006383895874023, 11.064412117004395, 12.122440338134766, 13.180468559265137]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 6.0, 5.0, 13.0, 6.0, 13.0, 11.0, 10.0, 12.0, 13.0, 19.0, 19.0, 22.0, 29.0, 28.0, 27.0, 31.0, 33.0, 34.0, 47.0, 33.0, 43.0, 31.0, 39.0, 34.0, 31.0, 34.0, 40.0, 40.0, 25.0, 26.0, 31.0, 31.0, 24.0, 32.0, 20.0, 17.0, 17.0, 15.0, 14.0, 12.0, 9.0, 5.0, 5.0, 7.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.148656845092773, -17.512428283691406, -16.876201629638672, -16.239973068237305, -15.60374641418457, -14.967517852783203, -14.331290245056152, -13.695062637329102, -13.05883502960205, -12.422607421875, -11.78637981414795, -11.150152206420898, -10.513923645019531, -9.877696990966797, -9.24146842956543, -8.605240821838379, -7.969013214111328, -7.332785606384277, -6.696557998657227, -6.060329914093018, -5.424102306365967, -4.787874698638916, -4.151646614074707, -3.5154190063476562, -2.8791913986206055, -2.2429637908935547, -1.6067359447479248, -0.9705082178115845, -0.33428049087524414, 0.30194711685180664, 0.9381749629974365, 1.5744028091430664, 2.2106285095214844, 2.846856117248535, 3.483083963394165, 4.119311809539795, 4.755539417266846, 5.3917670249938965, 6.0279951095581055, 6.664222717285156, 7.300450325012207, 7.936677932739258, 8.572905540466309, 9.20913314819336, 9.845361709594727, 10.481588363647461, 11.117816925048828, 11.754044532775879, 12.39027214050293, 13.02649974822998, 13.662727355957031, 14.298954963684082, 14.935182571411133, 15.5714111328125, 16.207637786865234, 16.8438663482666, 17.48009490966797, 18.116323471069336, 18.75255012512207, 19.388778686523438, 20.025005340576172, 20.66123390197754, 21.297460556030273, 21.93368911743164, 22.569915771484375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 12.0, 17.0, 8.0, 15.0, 17.0, 29.0, 25.0, 22.0, 26.0, 32.0, 34.0, 30.0, 22.0, 42.0, 37.0, 43.0, 42.0, 36.0, 37.0, 44.0, 47.0, 36.0, 36.0, 25.0, 26.0, 29.0, 30.0, 31.0, 20.0, 21.0, 17.0, 16.0, 17.0, 9.0, 13.0, 5.0, 12.0, 7.0, 5.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.021484375, -2.93450927734375, -2.8475341796875, -2.76055908203125, -2.673583984375, -2.58660888671875, -2.4996337890625, -2.41265869140625, -2.32568359375, -2.23870849609375, -2.1517333984375, -2.06475830078125, -1.977783203125, -1.89080810546875, -1.8038330078125, -1.71685791015625, -1.6298828125, -1.54290771484375, -1.4559326171875, -1.36895751953125, -1.281982421875, -1.19500732421875, -1.1080322265625, -1.02105712890625, -0.93408203125, -0.84710693359375, -0.7601318359375, -0.67315673828125, -0.586181640625, -0.49920654296875, -0.4122314453125, -0.32525634765625, -0.23828125, -0.15130615234375, -0.0643310546875, 0.02264404296875, 0.109619140625, 0.19659423828125, 0.2835693359375, 0.37054443359375, 0.45751953125, 0.54449462890625, 0.6314697265625, 0.71844482421875, 0.805419921875, 0.89239501953125, 0.9793701171875, 1.06634521484375, 1.1533203125, 1.24029541015625, 1.3272705078125, 1.41424560546875, 1.501220703125, 1.58819580078125, 1.6751708984375, 1.76214599609375, 1.84912109375, 1.93609619140625, 2.0230712890625, 2.11004638671875, 2.197021484375, 2.28399658203125, 2.3709716796875, 2.45794677734375, 2.544921875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 20.0, 15.0, 16.0, 38.0, 22.0, 36.0, 41.0, 50.0, 76.0, 79.0, 108.0, 159.0, 247.0, 465.0, 1298.0, 6214.0, 50612.0, 516483.0, 2097913.0, 1316783.0, 180541.0, 18091.0, 3013.0, 802.0, 364.0, 185.0, 121.0, 77.0, 64.0, 67.0, 42.0, 38.0, 39.0, 25.0, 29.0, 16.0, 14.0, 19.0, 9.0, 7.0, 4.0, 5.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.05078125, -5.87158203125, -5.6923828125, -5.51318359375, -5.333984375, -5.15478515625, -4.9755859375, -4.79638671875, -4.6171875, -4.43798828125, -4.2587890625, -4.07958984375, -3.900390625, -3.72119140625, -3.5419921875, -3.36279296875, -3.18359375, -3.00439453125, -2.8251953125, -2.64599609375, -2.466796875, -2.28759765625, -2.1083984375, -1.92919921875, -1.75, -1.57080078125, -1.3916015625, -1.21240234375, -1.033203125, -0.85400390625, -0.6748046875, -0.49560546875, -0.31640625, -0.13720703125, 0.0419921875, 0.22119140625, 0.400390625, 0.57958984375, 0.7587890625, 0.93798828125, 1.1171875, 1.29638671875, 1.4755859375, 1.65478515625, 1.833984375, 2.01318359375, 2.1923828125, 2.37158203125, 2.55078125, 2.72998046875, 2.9091796875, 3.08837890625, 3.267578125, 3.44677734375, 3.6259765625, 3.80517578125, 3.984375, 4.16357421875, 4.3427734375, 4.52197265625, 4.701171875, 4.88037109375, 5.0595703125, 5.23876953125, 5.41796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 7.0, 11.0, 11.0, 24.0, 22.0, 30.0, 55.0, 75.0, 101.0, 114.0, 164.0, 201.0, 246.0, 346.0, 389.0, 393.0, 375.0, 333.0, 273.0, 216.0, 166.0, 118.0, 88.0, 77.0, 54.0, 50.0, 41.0, 20.0, 9.0, 11.0, 11.0, 6.0, 10.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -6.01031494140625, -5.8370361328125, -5.66375732421875, -5.490478515625, -5.31719970703125, -5.1439208984375, -4.97064208984375, -4.79736328125, -4.62408447265625, -4.4508056640625, -4.27752685546875, -4.104248046875, -3.93096923828125, -3.7576904296875, -3.58441162109375, -3.4111328125, -3.23785400390625, -3.0645751953125, -2.89129638671875, -2.718017578125, -2.54473876953125, -2.3714599609375, -2.19818115234375, -2.02490234375, -1.85162353515625, -1.6783447265625, -1.50506591796875, -1.331787109375, -1.15850830078125, -0.9852294921875, -0.81195068359375, -0.638671875, -0.46539306640625, -0.2921142578125, -0.11883544921875, 0.054443359375, 0.22772216796875, 0.4010009765625, 0.57427978515625, 0.74755859375, 0.92083740234375, 1.0941162109375, 1.26739501953125, 1.440673828125, 1.61395263671875, 1.7872314453125, 1.96051025390625, 2.1337890625, 2.30706787109375, 2.4803466796875, 2.65362548828125, 2.826904296875, 3.00018310546875, 3.1734619140625, 3.34674072265625, 3.52001953125, 3.69329833984375, 3.8665771484375, 4.03985595703125, 4.213134765625, 4.38641357421875, 4.5596923828125, 4.73297119140625, 4.90625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 10.0, 8.0, 13.0, 10.0, 13.0, 32.0, 47.0, 46.0, 74.0, 84.0, 107.0, 208.0, 260.0, 415.0, 907.0, 46598.0, 4069328.0, 73743.0, 989.0, 403.0, 254.0, 204.0, 156.0, 111.0, 76.0, 50.0, 32.0, 26.0, 18.0, 16.0, 10.0, 9.0, 7.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.265625, -22.4501953125, -21.634765625, -20.8193359375, -20.00390625, -19.1884765625, -18.373046875, -17.5576171875, -16.7421875, -15.9267578125, -15.111328125, -14.2958984375, -13.48046875, -12.6650390625, -11.849609375, -11.0341796875, -10.21875, -9.4033203125, -8.587890625, -7.7724609375, -6.95703125, -6.1416015625, -5.326171875, -4.5107421875, -3.6953125, -2.8798828125, -2.064453125, -1.2490234375, -0.43359375, 0.3818359375, 1.197265625, 2.0126953125, 2.828125, 3.6435546875, 4.458984375, 5.2744140625, 6.08984375, 6.9052734375, 7.720703125, 8.5361328125, 9.3515625, 10.1669921875, 10.982421875, 11.7978515625, 12.61328125, 13.4287109375, 14.244140625, 15.0595703125, 15.875, 16.6904296875, 17.505859375, 18.3212890625, 19.13671875, 19.9521484375, 20.767578125, 21.5830078125, 22.3984375, 23.2138671875, 24.029296875, 24.8447265625, 25.66015625, 26.4755859375, 27.291015625, 28.1064453125, 28.921875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 19.0, 134.0, 324.0, 352.0, 157.0, 24.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.35829162597656, -31.74428939819336, -29.130285263061523, -26.516281127929688, -23.902278900146484, -21.28827667236328, -18.674272537231445, -16.06026840209961, -13.446266174316406, -10.832262992858887, -8.218259811401367, -5.604256629943848, -2.990253448486328, -0.3762502670288086, 2.237752914428711, 4.851757049560547, 7.46575927734375, 10.07976245880127, 12.693765640258789, 15.307768821716309, 17.921772003173828, 20.53577423095703, 23.149778366088867, 25.763782501220703, 28.377784729003906, 30.99178695678711, 33.60578918457031, 36.21979522705078, 38.833797454833984, 41.44779968261719, 44.061805725097656, 46.67580795288086, 49.28981018066406, 51.903812408447266, 54.51781463623047, 57.13182067871094, 59.74582290649414, 62.359825134277344, 64.97383117675781, 67.58782958984375, 70.20183563232422, 72.81584167480469, 75.42984008789062, 78.0438461303711, 80.65785217285156, 83.2718505859375, 85.88585662841797, 88.49986267089844, 91.11386108398438, 93.72786712646484, 96.34186553955078, 98.95587158203125, 101.56986999511719, 104.18387603759766, 106.79788208007812, 109.41188049316406, 112.02588653564453, 114.639892578125, 117.25389099121094, 119.8678970336914, 122.48190307617188, 125.09590148925781, 127.70990753173828, 130.32391357421875, 132.9379119873047]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 6.0, 8.0, 3.0, 8.0, 11.0, 16.0, 17.0, 16.0, 16.0, 17.0, 20.0, 19.0, 26.0, 32.0, 32.0, 40.0, 37.0, 35.0, 39.0, 41.0, 35.0, 51.0, 32.0, 38.0, 40.0, 33.0, 40.0, 34.0, 36.0, 33.0, 27.0, 22.0, 21.0, 20.0, 13.0, 21.0, 14.0, 5.0, 10.0, 6.0, 8.0, 7.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.020042419433594, -16.443592071533203, -15.867141723632812, -15.290691375732422, -14.714241027832031, -14.13779067993164, -13.561339378356934, -12.984889030456543, -12.408438682556152, -11.831988334655762, -11.255537986755371, -10.67908763885498, -10.102636337280273, -9.526185989379883, -8.949735641479492, -8.373285293579102, -7.796834945678711, -7.22038459777832, -6.64393424987793, -6.067483425140381, -5.49103307723999, -4.9145827293396, -4.338131904602051, -3.76168155670166, -3.1852312088012695, -2.608780860900879, -2.032330274581909, -1.455879807472229, -0.8794293403625488, -0.3029789924621582, 0.2734715938568115, 0.8499221801757812, 1.4263725280761719, 2.0028228759765625, 2.5792734622955322, 3.155724048614502, 3.7321743965148926, 4.308624744415283, 4.885075569152832, 5.461525917053223, 6.037976264953613, 6.614426612854004, 7.1908769607543945, 7.767327785491943, 8.343778610229492, 8.920228958129883, 9.496679306030273, 10.073129653930664, 10.649580001831055, 11.226030349731445, 11.802480697631836, 12.378931045532227, 12.955381393432617, 13.531831741333008, 14.108283042907715, 14.684733390808105, 15.261183738708496, 15.837634086608887, 16.414085388183594, 16.990535736083984, 17.566986083984375, 18.143436431884766, 18.719886779785156, 19.296337127685547, 19.872787475585938]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 4.0, 10.0, 15.0, 26.0, 15.0, 11.0, 22.0, 19.0, 24.0, 25.0, 30.0, 35.0, 42.0, 22.0, 39.0, 38.0, 45.0, 46.0, 28.0, 33.0, 42.0, 38.0, 41.0, 31.0, 40.0, 40.0, 22.0, 23.0, 32.0, 21.0, 19.0, 17.0, 10.0, 16.0, 13.0, 15.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.833984375, -2.75152587890625, -2.6690673828125, -2.58660888671875, -2.504150390625, -2.42169189453125, -2.3392333984375, -2.25677490234375, -2.17431640625, -2.09185791015625, -2.0093994140625, -1.92694091796875, -1.844482421875, -1.76202392578125, -1.6795654296875, -1.59710693359375, -1.5146484375, -1.43218994140625, -1.3497314453125, -1.26727294921875, -1.184814453125, -1.10235595703125, -1.0198974609375, -0.93743896484375, -0.85498046875, -0.77252197265625, -0.6900634765625, -0.60760498046875, -0.525146484375, -0.44268798828125, -0.3602294921875, -0.27777099609375, -0.1953125, -0.11285400390625, -0.0303955078125, 0.05206298828125, 0.134521484375, 0.21697998046875, 0.2994384765625, 0.38189697265625, 0.46435546875, 0.54681396484375, 0.6292724609375, 0.71173095703125, 0.794189453125, 0.87664794921875, 0.9591064453125, 1.04156494140625, 1.1240234375, 1.20648193359375, 1.2889404296875, 1.37139892578125, 1.453857421875, 1.53631591796875, 1.6187744140625, 1.70123291015625, 1.78369140625, 1.86614990234375, 1.9486083984375, 2.03106689453125, 2.113525390625, 2.19598388671875, 2.2784423828125, 2.36090087890625, 2.443359375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 22.0, 20.0, 26.0, 37.0, 57.0, 92.0, 124.0, 184.0, 252.0, 387.0, 592.0, 884.0, 1289.0, 1925.0, 2863.0, 4443.0, 6885.0, 10743.0, 16792.0, 27475.0, 45970.0, 79915.0, 143819.0, 227885.0, 196974.0, 114408.0, 63987.0, 37382.0, 22788.0, 14172.0, 8959.0, 5974.0, 3828.0, 2449.0, 1568.0, 1084.0, 738.0, 447.0, 330.0, 242.0, 183.0, 136.0, 68.0, 40.0, 30.0, 21.0, 28.0, 8.0, 5.0, 5.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.31884765625, -0.3088226318359375, -0.298797607421875, -0.2887725830078125, -0.27874755859375, -0.2687225341796875, -0.258697509765625, -0.2486724853515625, -0.2386474609375, -0.2286224365234375, -0.218597412109375, -0.2085723876953125, -0.19854736328125, -0.1885223388671875, -0.178497314453125, -0.1684722900390625, -0.158447265625, -0.1484222412109375, -0.138397216796875, -0.1283721923828125, -0.11834716796875, -0.1083221435546875, -0.098297119140625, -0.0882720947265625, -0.0782470703125, -0.0682220458984375, -0.058197021484375, -0.0481719970703125, -0.03814697265625, -0.0281219482421875, -0.018096923828125, -0.0080718994140625, 0.001953125, 0.0119781494140625, 0.022003173828125, 0.0320281982421875, 0.04205322265625, 0.0520782470703125, 0.062103271484375, 0.0721282958984375, 0.0821533203125, 0.0921783447265625, 0.102203369140625, 0.1122283935546875, 0.12225341796875, 0.1322784423828125, 0.142303466796875, 0.1523284912109375, 0.162353515625, 0.1723785400390625, 0.182403564453125, 0.1924285888671875, 0.20245361328125, 0.2124786376953125, 0.222503662109375, 0.2325286865234375, 0.2425537109375, 0.2525787353515625, 0.262603759765625, 0.2726287841796875, 0.28265380859375, 0.2926788330078125, 0.302703857421875, 0.3127288818359375, 0.32275390625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 9.0, 4.0, 5.0, 3.0, 8.0, 3.0, 9.0, 12.0, 6.0, 17.0, 16.0, 20.0, 24.0, 28.0, 25.0, 38.0, 28.0, 39.0, 36.0, 25.0, 36.0, 42.0, 36.0, 1066.0, 42.0, 44.0, 36.0, 33.0, 38.0, 36.0, 34.0, 33.0, 29.0, 32.0, 25.0, 13.0, 16.0, 16.0, 8.0, 13.0, 15.0, 6.0, 9.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6328125, -1.579132080078125, -1.52545166015625, -1.471771240234375, -1.4180908203125, -1.364410400390625, -1.31072998046875, -1.257049560546875, -1.203369140625, -1.149688720703125, -1.09600830078125, -1.042327880859375, -0.9886474609375, -0.934967041015625, -0.88128662109375, -0.827606201171875, -0.77392578125, -0.720245361328125, -0.66656494140625, -0.612884521484375, -0.5592041015625, -0.505523681640625, -0.45184326171875, -0.398162841796875, -0.344482421875, -0.290802001953125, -0.23712158203125, -0.183441162109375, -0.1297607421875, -0.076080322265625, -0.02239990234375, 0.031280517578125, 0.0849609375, 0.138641357421875, 0.19232177734375, 0.246002197265625, 0.2996826171875, 0.353363037109375, 0.40704345703125, 0.460723876953125, 0.514404296875, 0.568084716796875, 0.62176513671875, 0.675445556640625, 0.7291259765625, 0.782806396484375, 0.83648681640625, 0.890167236328125, 0.94384765625, 0.997528076171875, 1.05120849609375, 1.104888916015625, 1.1585693359375, 1.212249755859375, 1.26593017578125, 1.319610595703125, 1.373291015625, 1.426971435546875, 1.48065185546875, 1.534332275390625, 1.5880126953125, 1.641693115234375, 1.69537353515625, 1.749053955078125, 1.802734375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 11.0, 15.0, 17.0, 30.0, 40.0, 56.0, 78.0, 109.0, 193.0, 216.0, 364.0, 487.0, 671.0, 951.0, 1406.0, 2045.0, 3070.0, 4458.0, 6407.0, 9639.0, 14495.0, 21632.0, 33349.0, 52822.0, 86331.0, 141654.0, 1253132.0, 172750.0, 107142.0, 64629.0, 40288.0, 26121.0, 17019.0, 11353.0, 7640.0, 5096.0, 3433.0, 2444.0, 1663.0, 1147.0, 809.0, 564.0, 423.0, 274.0, 193.0, 150.0, 113.0, 71.0, 39.0, 21.0, 28.0, 19.0, 11.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.235595703125, -0.22792434692382812, -0.22025299072265625, -0.21258163452148438, -0.2049102783203125, -0.19723892211914062, -0.18956756591796875, -0.18189620971679688, -0.174224853515625, -0.16655349731445312, -0.15888214111328125, -0.15121078491210938, -0.1435394287109375, -0.13586807250976562, -0.12819671630859375, -0.12052536010742188, -0.11285400390625, -0.10518264770507812, -0.09751129150390625, -0.08983993530273438, -0.0821685791015625, -0.07449722290039062, -0.06682586669921875, -0.059154510498046875, -0.051483154296875, -0.043811798095703125, -0.03614044189453125, -0.028469085693359375, -0.0207977294921875, -0.013126373291015625, -0.00545501708984375, 0.002216339111328125, 0.0098876953125, 0.017559051513671875, 0.02523040771484375, 0.032901763916015625, 0.0405731201171875, 0.048244476318359375, 0.05591583251953125, 0.06358718872070312, 0.071258544921875, 0.07892990112304688, 0.08660125732421875, 0.09427261352539062, 0.1019439697265625, 0.10961532592773438, 0.11728668212890625, 0.12495803833007812, 0.13262939453125, 0.14030075073242188, 0.14797210693359375, 0.15564346313476562, 0.1633148193359375, 0.17098617553710938, 0.17865753173828125, 0.18632888793945312, 0.194000244140625, 0.20167160034179688, 0.20934295654296875, 0.21701431274414062, 0.2246856689453125, 0.23235702514648438, 0.24002838134765625, 0.24769973754882812, 0.25537109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 8.0, 8.0, 10.0, 6.0, 12.0, 20.0, 18.0, 20.0, 46.0, 44.0, 49.0, 58.0, 54.0, 56.0, 83.0, 79.0, 67.0, 52.0, 60.0, 52.0, 41.0, 37.0, 19.0, 15.0, 17.0, 11.0, 11.0, 5.0, 7.0, 9.0, 7.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001087188720703125, -0.0010554268956184387, -0.0010236650705337524, -0.0009919032454490662, -0.0009601414203643799, -0.0009283795952796936, -0.0008966177701950073, -0.000864855945110321, -0.0008330941200256348, -0.0008013322949409485, -0.0007695704698562622, -0.0007378086447715759, -0.0007060468196868896, -0.0006742849946022034, -0.0006425231695175171, -0.0006107613444328308, -0.0005789995193481445, -0.0005472376942634583, -0.000515475869178772, -0.0004837140440940857, -0.0004519522190093994, -0.00042019039392471313, -0.00038842856884002686, -0.0003566667437553406, -0.0003249049186706543, -0.000293143093585968, -0.00026138126850128174, -0.00022961944341659546, -0.00019785761833190918, -0.0001660957932472229, -0.00013433396816253662, -0.00010257214307785034, -7.081031799316406e-05, -3.904849290847778e-05, -7.286667823791504e-06, 2.4475157260894775e-05, 5.6236982345581055e-05, 8.799880743026733e-05, 0.00011976063251495361, 0.0001515224575996399, 0.00018328428268432617, 0.00021504610776901245, 0.00024680793285369873, 0.000278569757938385, 0.0003103315830230713, 0.00034209340810775757, 0.00037385523319244385, 0.0004056170582771301, 0.0004373788833618164, 0.0004691407084465027, 0.000500902533531189, 0.0005326643586158752, 0.0005644261837005615, 0.0005961880087852478, 0.0006279498338699341, 0.0006597116589546204, 0.0006914734840393066, 0.0007232353091239929, 0.0007549971342086792, 0.0007867589592933655, 0.0008185207843780518, 0.000850282609462738, 0.0008820444345474243, 0.0009138062596321106, 0.0009455680847167969]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 10.0, 12.0, 11.0, 17.0, 32.0, 31.0, 36.0, 62.0, 81.0, 153.0, 265.0, 536.0, 4799.0, 1021433.0, 19499.0, 676.0, 332.0, 148.0, 102.0, 79.0, 71.0, 27.0, 30.0, 16.0, 19.0, 16.0, 8.0, 13.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020721435546875, -0.020021677017211914, -0.019321918487548828, -0.018622159957885742, -0.017922401428222656, -0.01722264289855957, -0.016522884368896484, -0.0158231258392334, -0.015123367309570312, -0.014423608779907227, -0.01372385025024414, -0.013024091720581055, -0.012324333190917969, -0.011624574661254883, -0.010924816131591797, -0.010225057601928711, -0.009525299072265625, -0.008825540542602539, -0.008125782012939453, -0.007426023483276367, -0.006726264953613281, -0.006026506423950195, -0.005326747894287109, -0.0046269893646240234, -0.0039272308349609375, -0.0032274723052978516, -0.0025277137756347656, -0.0018279552459716797, -0.0011281967163085938, -0.0004284381866455078, 0.0002713203430175781, 0.0009710788726806641, 0.00167083740234375, 0.002370595932006836, 0.003070354461669922, 0.003770112991333008, 0.004469871520996094, 0.00516963005065918, 0.005869388580322266, 0.0065691471099853516, 0.0072689056396484375, 0.007968664169311523, 0.00866842269897461, 0.009368181228637695, 0.010067939758300781, 0.010767698287963867, 0.011467456817626953, 0.012167215347290039, 0.012866973876953125, 0.013566732406616211, 0.014266490936279297, 0.014966249465942383, 0.01566600799560547, 0.016365766525268555, 0.01706552505493164, 0.017765283584594727, 0.018465042114257812, 0.0191648006439209, 0.019864559173583984, 0.02056431770324707, 0.021264076232910156, 0.021963834762573242, 0.022663593292236328, 0.023363351821899414, 0.0240631103515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 27.0, 93.0, 206.0, 281.0, 229.0, 114.0, 42.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026760930195450783, -0.0026253708638250828, -0.002574648940935731, -0.002523927018046379, -0.0024732048623263836, -0.002422482706606388, -0.0023717607837170362, -0.0023210388608276844, -0.002270316705107689, -0.0022195945493876934, -0.0021688726264983416, -0.0021181507036089897, -0.0020674285478889942, -0.0020167063921689987, -0.001965984469279647, -0.0019152624299749732, -0.0018645403906702995, -0.0018138183513656259, -0.0017630963120609522, -0.0017123742727562785, -0.0016616522334516048, -0.0016109301941469312, -0.0015602081548422575, -0.0015094861155375838, -0.0014587640762329102, -0.0014080420369282365, -0.0013573199976235628, -0.0013065979583188891, -0.0012558759190142155, -0.0012051538797095418, -0.0011544318404048681, -0.0011037098011001945, -0.0010529878782108426, -0.001002265838906169, -0.0009515437996014953, -0.0009008217602968216, -0.0008500997209921479, -0.0007993776816874743, -0.0007486556423828006, -0.0006979336030781269, -0.0006472115637734532, -0.0005964895244687796, -0.0005457674851641059, -0.0004950454458594322, -0.00044432340655475855, -0.0003936013672500849, -0.0003428793279454112, -0.00029215728864073753, -0.00024143524933606386, -0.0001907132100313902, -0.00013999117072671652, -8.926913142204285e-05, -3.8547092117369175e-05, 1.2174947187304497e-05, 6.289698649197817e-05, 0.00011361902579665184, 0.0001643410651013255, 0.00021506310440599918, 0.00026578514371067286, 0.0003165071830153465, 0.0003672292223200202, 0.00041795126162469387, 0.00046867330092936754, 0.0005193953402340412, 0.0005701173795387149]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 14.0, 6.0, 16.0, 16.0, 18.0, 18.0, 24.0, 23.0, 28.0, 28.0, 27.0, 27.0, 33.0, 30.0, 28.0, 39.0, 41.0, 38.0, 34.0, 35.0, 37.0, 38.0, 30.0, 38.0, 31.0, 36.0, 22.0, 33.0, 25.0, 20.0, 20.0, 26.0, 20.0, 9.0, 14.0, 17.0, 8.0, 7.0, 7.0, 3.0, 1.0, 6.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0004534125328063965, -0.00043966155499219894, -0.0004259105771780014, -0.00041215959936380386, -0.0003984086215496063, -0.0003846576437354088, -0.00037090666592121124, -0.0003571556881070137, -0.00034340471029281616, -0.0003296537324786186, -0.0003159027546644211, -0.00030215177685022354, -0.000288400799036026, -0.00027464982122182846, -0.0002608988434076309, -0.0002471478655934334, -0.00023339688777923584, -0.0002196459099650383, -0.00020589493215084076, -0.00019214395433664322, -0.00017839297652244568, -0.00016464199870824814, -0.0001508910208940506, -0.00013714004307985306, -0.00012338906526565552, -0.00010963808745145798, -9.588710963726044e-05, -8.21361318230629e-05, -6.838515400886536e-05, -5.4634176194667816e-05, -4.0883198380470276e-05, -2.7132220566272736e-05, -1.3381242752075195e-05, 3.6973506212234497e-07, 1.4120712876319885e-05, 2.7871690690517426e-05, 4.1622668504714966e-05, 5.5373646318912506e-05, 6.912462413311005e-05, 8.287560194730759e-05, 9.662657976150513e-05, 0.00011037755757570267, 0.0001241285353899002, 0.00013787951320409775, 0.0001516304910182953, 0.00016538146883249283, 0.00017913244664669037, 0.0001928834244608879, 0.00020663440227508545, 0.000220385380089283, 0.00023413635790348053, 0.00024788733571767807, 0.0002616383135318756, 0.00027538929134607315, 0.0002891402691602707, 0.00030289124697446823, 0.00031664222478866577, 0.0003303932026028633, 0.00034414418041706085, 0.0003578951582312584, 0.00037164613604545593, 0.0003853971138596535, 0.000399148091673851, 0.00041289906948804855, 0.0004266500473022461]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 3.0, 4.0, 10.0, 15.0, 26.0, 15.0, 11.0, 22.0, 19.0, 24.0, 25.0, 30.0, 35.0, 42.0, 22.0, 39.0, 38.0, 45.0, 46.0, 28.0, 33.0, 42.0, 38.0, 41.0, 31.0, 40.0, 40.0, 22.0, 23.0, 32.0, 21.0, 19.0, 17.0, 10.0, 16.0, 13.0, 15.0, 6.0, 7.0, 6.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.833984375, -2.75152587890625, -2.6690673828125, -2.58660888671875, -2.504150390625, -2.42169189453125, -2.3392333984375, -2.25677490234375, -2.17431640625, -2.09185791015625, -2.0093994140625, -1.92694091796875, -1.844482421875, -1.76202392578125, -1.6795654296875, -1.59710693359375, -1.5146484375, -1.43218994140625, -1.3497314453125, -1.26727294921875, -1.184814453125, -1.10235595703125, -1.0198974609375, -0.93743896484375, -0.85498046875, -0.77252197265625, -0.6900634765625, -0.60760498046875, -0.525146484375, -0.44268798828125, -0.3602294921875, -0.27777099609375, -0.1953125, -0.11285400390625, -0.0303955078125, 0.05206298828125, 0.134521484375, 0.21697998046875, 0.2994384765625, 0.38189697265625, 0.46435546875, 0.54681396484375, 0.6292724609375, 0.71173095703125, 0.794189453125, 0.87664794921875, 0.9591064453125, 1.04156494140625, 1.1240234375, 1.20648193359375, 1.2889404296875, 1.37139892578125, 1.453857421875, 1.53631591796875, 1.6187744140625, 1.70123291015625, 1.78369140625, 1.86614990234375, 1.9486083984375, 2.03106689453125, 2.113525390625, 2.19598388671875, 2.2784423828125, 2.36090087890625, 2.443359375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 6.0, 10.0, 10.0, 10.0, 21.0, 24.0, 35.0, 44.0, 79.0, 156.0, 293.0, 597.0, 1229.0, 2636.0, 5509.0, 11063.0, 23081.0, 53299.0, 138717.0, 345721.0, 282609.0, 104967.0, 41867.0, 18889.0, 8974.0, 4486.0, 2056.0, 1050.0, 483.0, 232.0, 147.0, 79.0, 42.0, 42.0, 24.0, 13.0, 12.0, 12.0, 8.0, 2.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.810546875, -2.713165283203125, -2.61578369140625, -2.518402099609375, -2.4210205078125, -2.323638916015625, -2.22625732421875, -2.128875732421875, -2.031494140625, -1.934112548828125, -1.83673095703125, -1.739349365234375, -1.6419677734375, -1.544586181640625, -1.44720458984375, -1.349822998046875, -1.25244140625, -1.155059814453125, -1.05767822265625, -0.960296630859375, -0.8629150390625, -0.765533447265625, -0.66815185546875, -0.570770263671875, -0.473388671875, -0.376007080078125, -0.27862548828125, -0.181243896484375, -0.0838623046875, 0.013519287109375, 0.11090087890625, 0.208282470703125, 0.3056640625, 0.403045654296875, 0.50042724609375, 0.597808837890625, 0.6951904296875, 0.792572021484375, 0.88995361328125, 0.987335205078125, 1.084716796875, 1.182098388671875, 1.27947998046875, 1.376861572265625, 1.4742431640625, 1.571624755859375, 1.66900634765625, 1.766387939453125, 1.86376953125, 1.961151123046875, 2.05853271484375, 2.155914306640625, 2.2532958984375, 2.350677490234375, 2.44805908203125, 2.545440673828125, 2.642822265625, 2.740203857421875, 2.83758544921875, 2.934967041015625, 3.0323486328125, 3.129730224609375, 3.22711181640625, 3.324493408203125, 3.421875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 9.0, 3.0, 7.0, 10.0, 12.0, 15.0, 11.0, 12.0, 14.0, 25.0, 26.0, 38.0, 35.0, 39.0, 36.0, 58.0, 59.0, 89.0, 170.0, 1421.0, 374.0, 146.0, 78.0, 43.0, 37.0, 43.0, 38.0, 25.0, 27.0, 29.0, 14.0, 20.0, 16.0, 18.0, 10.0, 5.0, 9.0, 10.0, 11.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.09375, -11.747802734375, -11.40185546875, -11.055908203125, -10.7099609375, -10.364013671875, -10.01806640625, -9.672119140625, -9.326171875, -8.980224609375, -8.63427734375, -8.288330078125, -7.9423828125, -7.596435546875, -7.25048828125, -6.904541015625, -6.55859375, -6.212646484375, -5.86669921875, -5.520751953125, -5.1748046875, -4.828857421875, -4.48291015625, -4.136962890625, -3.791015625, -3.445068359375, -3.09912109375, -2.753173828125, -2.4072265625, -2.061279296875, -1.71533203125, -1.369384765625, -1.0234375, -0.677490234375, -0.33154296875, 0.014404296875, 0.3603515625, 0.706298828125, 1.05224609375, 1.398193359375, 1.744140625, 2.090087890625, 2.43603515625, 2.781982421875, 3.1279296875, 3.473876953125, 3.81982421875, 4.165771484375, 4.51171875, 4.857666015625, 5.20361328125, 5.549560546875, 5.8955078125, 6.241455078125, 6.58740234375, 6.933349609375, 7.279296875, 7.625244140625, 7.97119140625, 8.317138671875, 8.6630859375, 9.009033203125, 9.35498046875, 9.700927734375, 10.046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 11.0, 9.0, 8.0, 18.0, 23.0, 26.0, 37.0, 44.0, 64.0, 85.0, 116.0, 242.0, 394.0, 807.0, 18580.0, 3116954.0, 6564.0, 700.0, 322.0, 208.0, 157.0, 84.0, 65.0, 48.0, 47.0, 22.0, 21.0, 19.0, 4.0, 5.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.6875, -40.43994140625, -39.1923828125, -37.94482421875, -36.697265625, -35.44970703125, -34.2021484375, -32.95458984375, -31.70703125, -30.45947265625, -29.2119140625, -27.96435546875, -26.716796875, -25.46923828125, -24.2216796875, -22.97412109375, -21.7265625, -20.47900390625, -19.2314453125, -17.98388671875, -16.736328125, -15.48876953125, -14.2412109375, -12.99365234375, -11.74609375, -10.49853515625, -9.2509765625, -8.00341796875, -6.755859375, -5.50830078125, -4.2607421875, -3.01318359375, -1.765625, -0.51806640625, 0.7294921875, 1.97705078125, 3.224609375, 4.47216796875, 5.7197265625, 6.96728515625, 8.21484375, 9.46240234375, 10.7099609375, 11.95751953125, 13.205078125, 14.45263671875, 15.7001953125, 16.94775390625, 18.1953125, 19.44287109375, 20.6904296875, 21.93798828125, 23.185546875, 24.43310546875, 25.6806640625, 26.92822265625, 28.17578125, 29.42333984375, 30.6708984375, 31.91845703125, 33.166015625, 34.41357421875, 35.6611328125, 36.90869140625, 38.15625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 34.0, 307.0, 502.0, 153.0, 14.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.717714309692383, -29.986541748046875, -28.255369186401367, -26.52419662475586, -24.793025970458984, -23.061851501464844, -21.33068084716797, -19.59950828552246, -17.868335723876953, -16.137163162231445, -14.405990600585938, -12.674818992614746, -10.943646430969238, -9.21247386932373, -7.481302261352539, -5.750129699707031, -4.018957138061523, -2.2877848148345947, -0.556612491607666, 1.1745595932006836, 2.9057321548461914, 4.636904716491699, 6.368076324462891, 8.099248886108398, 9.830421447753906, 11.561594009399414, 13.292766571044922, 15.023938179016113, 16.755111694335938, 18.486282348632812, 20.21745491027832, 21.948627471923828, 23.67980194091797, 25.410974502563477, 27.142147064208984, 28.87331771850586, 30.6044921875, 32.335662841796875, 34.06683349609375, 35.79800796508789, 37.52918243408203, 39.260353088378906, 40.99152755737305, 42.72269821166992, 44.45387268066406, 46.18504333496094, 47.91621398925781, 49.64738845825195, 51.37855911254883, 53.1097297668457, 54.840904235839844, 56.57207489013672, 58.30324935913086, 60.034420013427734, 61.765594482421875, 63.49676513671875, 65.22793579101562, 66.9591064453125, 68.69027709960938, 70.42145538330078, 72.15262603759766, 73.88379669189453, 75.6149673461914, 77.34614562988281, 79.07731628417969]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 7.0, 5.0, 6.0, 3.0, 9.0, 9.0, 10.0, 14.0, 17.0, 19.0, 21.0, 26.0, 20.0, 23.0, 22.0, 22.0, 23.0, 33.0, 36.0, 36.0, 46.0, 30.0, 42.0, 31.0, 39.0, 51.0, 46.0, 34.0, 53.0, 33.0, 35.0, 36.0, 30.0, 22.0, 21.0, 11.0, 16.0, 17.0, 8.0, 11.0, 5.0, 4.0, 9.0, 6.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.147106170654297, -22.370359420776367, -21.593612670898438, -20.816865921020508, -20.040119171142578, -19.263370513916016, -18.486623764038086, -17.709877014160156, -16.933130264282227, -16.156383514404297, -15.379636764526367, -14.602889060974121, -13.826142311096191, -13.049395561218262, -12.272647857666016, -11.495901107788086, -10.719154357910156, -9.942407608032227, -9.165660858154297, -8.38891315460205, -7.612166404724121, -6.835419654846191, -6.0586724281311035, -5.281925201416016, -4.505178451538086, -3.728431463241577, -2.9516844749450684, -2.1749374866485596, -1.3981904983520508, -0.621443510055542, 0.1553034782409668, 0.9320507049560547, 1.7087955474853516, 2.4855425357818604, 3.262289524078369, 4.039036750793457, 4.815783500671387, 5.592530250549316, 6.369277477264404, 7.146024703979492, 7.922771453857422, 8.699518203735352, 9.476264953613281, 10.253012657165527, 11.029759407043457, 11.806506156921387, 12.583253860473633, 13.360000610351562, 14.136747360229492, 14.913494110107422, 15.690240859985352, 16.46698760986328, 17.243736267089844, 18.020483016967773, 18.797229766845703, 19.573976516723633, 20.350723266601562, 21.127470016479492, 21.904216766357422, 22.68096351623535, 23.45771026611328, 24.234458923339844, 25.011205673217773, 25.787952423095703, 26.564699172973633]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 4.0, 3.0, 6.0, 7.0, 15.0, 8.0, 10.0, 26.0, 18.0, 19.0, 16.0, 27.0, 35.0, 25.0, 28.0, 39.0, 42.0, 30.0, 38.0, 33.0, 40.0, 46.0, 45.0, 32.0, 41.0, 44.0, 39.0, 40.0, 34.0, 28.0, 26.0, 23.0, 19.0, 20.0, 12.0, 13.0, 15.0, 14.0, 6.0, 3.0, 8.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.123046875, -3.028045654296875, -2.93304443359375, -2.838043212890625, -2.7430419921875, -2.648040771484375, -2.55303955078125, -2.458038330078125, -2.363037109375, -2.268035888671875, -2.17303466796875, -2.078033447265625, -1.9830322265625, -1.888031005859375, -1.79302978515625, -1.698028564453125, -1.60302734375, -1.508026123046875, -1.41302490234375, -1.318023681640625, -1.2230224609375, -1.128021240234375, -1.03302001953125, -0.938018798828125, -0.843017578125, -0.748016357421875, -0.65301513671875, -0.558013916015625, -0.4630126953125, -0.368011474609375, -0.27301025390625, -0.178009033203125, -0.0830078125, 0.011993408203125, 0.10699462890625, 0.201995849609375, 0.2969970703125, 0.391998291015625, 0.48699951171875, 0.582000732421875, 0.677001953125, 0.772003173828125, 0.86700439453125, 0.962005615234375, 1.0570068359375, 1.152008056640625, 1.24700927734375, 1.342010498046875, 1.43701171875, 1.532012939453125, 1.62701416015625, 1.722015380859375, 1.8170166015625, 1.912017822265625, 2.00701904296875, 2.102020263671875, 2.197021484375, 2.292022705078125, 2.38702392578125, 2.482025146484375, 2.5770263671875, 2.672027587890625, 2.76702880859375, 2.862030029296875, 2.95703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 7.0, 8.0, 7.0, 13.0, 22.0, 26.0, 22.0, 29.0, 44.0, 56.0, 55.0, 66.0, 122.0, 148.0, 278.0, 700.0, 2958.0, 33146.0, 696111.0, 2847844.0, 580774.0, 27539.0, 2674.0, 705.0, 269.0, 156.0, 101.0, 82.0, 69.0, 42.0, 45.0, 27.0, 31.0, 23.0, 14.0, 16.0, 6.0, 11.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.046875, -7.7911376953125, -7.535400390625, -7.2796630859375, -7.02392578125, -6.7681884765625, -6.512451171875, -6.2567138671875, -6.0009765625, -5.7452392578125, -5.489501953125, -5.2337646484375, -4.97802734375, -4.7222900390625, -4.466552734375, -4.2108154296875, -3.955078125, -3.6993408203125, -3.443603515625, -3.1878662109375, -2.93212890625, -2.6763916015625, -2.420654296875, -2.1649169921875, -1.9091796875, -1.6534423828125, -1.397705078125, -1.1419677734375, -0.88623046875, -0.6304931640625, -0.374755859375, -0.1190185546875, 0.13671875, 0.3924560546875, 0.648193359375, 0.9039306640625, 1.15966796875, 1.4154052734375, 1.671142578125, 1.9268798828125, 2.1826171875, 2.4383544921875, 2.694091796875, 2.9498291015625, 3.20556640625, 3.4613037109375, 3.717041015625, 3.9727783203125, 4.228515625, 4.4842529296875, 4.739990234375, 4.9957275390625, 5.25146484375, 5.5072021484375, 5.762939453125, 6.0186767578125, 6.2744140625, 6.5301513671875, 6.785888671875, 7.0416259765625, 7.29736328125, 7.5531005859375, 7.808837890625, 8.0645751953125, 8.3203125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 4.0, 11.0, 9.0, 16.0, 22.0, 34.0, 58.0, 75.0, 99.0, 141.0, 182.0, 278.0, 335.0, 463.0, 460.0, 446.0, 376.0, 316.0, 184.0, 162.0, 113.0, 77.0, 48.0, 49.0, 34.0, 21.0, 14.0, 14.0, 8.0, 8.0, 9.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.7786865234375, -5.576904296875, -5.3751220703125, -5.17333984375, -4.9715576171875, -4.769775390625, -4.5679931640625, -4.3662109375, -4.1644287109375, -3.962646484375, -3.7608642578125, -3.55908203125, -3.3572998046875, -3.155517578125, -2.9537353515625, -2.751953125, -2.5501708984375, -2.348388671875, -2.1466064453125, -1.94482421875, -1.7430419921875, -1.541259765625, -1.3394775390625, -1.1376953125, -0.9359130859375, -0.734130859375, -0.5323486328125, -0.33056640625, -0.1287841796875, 0.072998046875, 0.2747802734375, 0.4765625, 0.6783447265625, 0.880126953125, 1.0819091796875, 1.28369140625, 1.4854736328125, 1.687255859375, 1.8890380859375, 2.0908203125, 2.2926025390625, 2.494384765625, 2.6961669921875, 2.89794921875, 3.0997314453125, 3.301513671875, 3.5032958984375, 3.705078125, 3.9068603515625, 4.108642578125, 4.3104248046875, 4.51220703125, 4.7139892578125, 4.915771484375, 5.1175537109375, 5.3193359375, 5.5211181640625, 5.722900390625, 5.9246826171875, 6.12646484375, 6.3282470703125, 6.530029296875, 6.7318115234375, 6.93359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 8.0, 6.0, 15.0, 14.0, 20.0, 34.0, 49.0, 54.0, 70.0, 132.0, 174.0, 249.0, 394.0, 781.0, 31086.0, 4094991.0, 64070.0, 875.0, 435.0, 255.0, 172.0, 132.0, 76.0, 61.0, 40.0, 26.0, 21.0, 14.0, 7.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.646484375, -30.73046875, -29.814453125, -28.8984375, -27.982421875, -27.06640625, -26.150390625, -25.234375, -24.318359375, -23.40234375, -22.486328125, -21.5703125, -20.654296875, -19.73828125, -18.822265625, -17.90625, -16.990234375, -16.07421875, -15.158203125, -14.2421875, -13.326171875, -12.41015625, -11.494140625, -10.578125, -9.662109375, -8.74609375, -7.830078125, -6.9140625, -5.998046875, -5.08203125, -4.166015625, -3.25, -2.333984375, -1.41796875, -0.501953125, 0.4140625, 1.330078125, 2.24609375, 3.162109375, 4.078125, 4.994140625, 5.91015625, 6.826171875, 7.7421875, 8.658203125, 9.57421875, 10.490234375, 11.40625, 12.322265625, 13.23828125, 14.154296875, 15.0703125, 15.986328125, 16.90234375, 17.818359375, 18.734375, 19.650390625, 20.56640625, 21.482421875, 22.3984375, 23.314453125, 24.23046875, 25.146484375, 26.0625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 55.0, 224.0, 390.0, 271.0, 57.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.12668228149414, -26.58468246459961, -24.04268455505371, -21.50068473815918, -18.95868682861328, -16.41668701171875, -13.874687194824219, -11.33268928527832, -8.790689468383789, -6.248690605163574, -3.706691265106201, -1.1646919250488281, 1.3773069381713867, 3.9193058013916016, 6.461305618286133, 9.003303527832031, 11.545303344726562, 14.087302207946777, 16.629301071166992, 19.171300888061523, 21.713298797607422, 24.255298614501953, 26.797298431396484, 29.339296340942383, 31.881296157836914, 34.42329406738281, 36.965293884277344, 39.507293701171875, 42.049293518066406, 44.59129333496094, 47.13329315185547, 49.675289154052734, 52.21729278564453, 54.75929260253906, 57.301292419433594, 59.843292236328125, 62.38528823852539, 64.92729187011719, 67.46928405761719, 70.01128387451172, 72.55328369140625, 75.09528350830078, 77.63728332519531, 80.17928314208984, 82.72128295898438, 85.26327514648438, 87.80528259277344, 90.34727478027344, 92.8892822265625, 95.43128204345703, 97.97328186035156, 100.5152816772461, 103.05728149414062, 105.59927368164062, 108.14128112792969, 110.68327331542969, 113.22527313232422, 115.76727294921875, 118.30927276611328, 120.85127258300781, 123.39327239990234, 125.93527221679688, 128.47726440429688, 131.01927185058594, 133.56126403808594]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 9.0, 10.0, 9.0, 17.0, 12.0, 6.0, 19.0, 30.0, 33.0, 38.0, 36.0, 34.0, 33.0, 48.0, 38.0, 42.0, 40.0, 49.0, 48.0, 41.0, 51.0, 31.0, 42.0, 31.0, 24.0, 40.0, 19.0, 24.0, 25.0, 18.0, 12.0, 15.0, 11.0, 12.0, 8.0, 9.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.853904724121094, -18.2478084564209, -17.641714096069336, -17.03561782836914, -16.429523468017578, -15.823427200317383, -15.217331886291504, -14.611236572265625, -14.00514030456543, -13.39904499053955, -12.792949676513672, -12.186853408813477, -11.580758094787598, -10.974662780761719, -10.36856746673584, -9.762472152709961, -9.156376838684082, -8.550281524658203, -7.944185733795166, -7.338090419769287, -6.73199462890625, -6.125899314880371, -5.519804000854492, -4.913708209991455, -4.307612895965576, -3.701517343521118, -3.09542179107666, -2.4893264770507812, -1.8832309246063232, -1.2771353721618652, -0.6710400581359863, -0.06494426727294922, 0.5411510467529297, 1.1472465991973877, 1.7533420324325562, 2.3594374656677246, 2.9655330181121826, 3.5716285705566406, 4.1777238845825195, 4.783819675445557, 5.3899149894714355, 5.9960103034973145, 6.602106094360352, 7.2082014083862305, 7.814296722412109, 8.420392990112305, 9.026487350463867, 9.632583618164062, 10.238678932189941, 10.84477424621582, 11.4508695602417, 12.056964874267578, 12.663061141967773, 13.269156455993652, 13.875251770019531, 14.481348037719727, 15.087442398071289, 15.693537712097168, 16.299633026123047, 16.905729293823242, 17.511823654174805, 18.117919921875, 18.724014282226562, 19.330110549926758, 19.936206817626953]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 22.0, 14.0, 29.0, 25.0, 26.0, 32.0, 33.0, 33.0, 45.0, 44.0, 41.0, 44.0, 39.0, 39.0, 47.0, 34.0, 45.0, 28.0, 31.0, 36.0, 35.0, 29.0, 40.0, 34.0, 19.0, 14.0, 14.0, 15.0, 10.0, 13.0, 9.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.236297607421875, -3.14447021484375, -3.052642822265625, -2.9608154296875, -2.868988037109375, -2.77716064453125, -2.685333251953125, -2.593505859375, -2.501678466796875, -2.40985107421875, -2.318023681640625, -2.2261962890625, -2.134368896484375, -2.04254150390625, -1.950714111328125, -1.85888671875, -1.767059326171875, -1.67523193359375, -1.583404541015625, -1.4915771484375, -1.399749755859375, -1.30792236328125, -1.216094970703125, -1.124267578125, -1.032440185546875, -0.94061279296875, -0.848785400390625, -0.7569580078125, -0.665130615234375, -0.57330322265625, -0.481475830078125, -0.3896484375, -0.297821044921875, -0.20599365234375, -0.114166259765625, -0.0223388671875, 0.069488525390625, 0.16131591796875, 0.253143310546875, 0.344970703125, 0.436798095703125, 0.52862548828125, 0.620452880859375, 0.7122802734375, 0.804107666015625, 0.89593505859375, 0.987762451171875, 1.07958984375, 1.171417236328125, 1.26324462890625, 1.355072021484375, 1.4468994140625, 1.538726806640625, 1.63055419921875, 1.722381591796875, 1.814208984375, 1.906036376953125, 1.99786376953125, 2.089691162109375, 2.1815185546875, 2.273345947265625, 2.36517333984375, 2.457000732421875, 2.548828125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 0.0, 6.0, 5.0, 5.0, 16.0, 14.0, 33.0, 46.0, 50.0, 104.0, 140.0, 173.0, 279.0, 405.0, 568.0, 916.0, 1438.0, 2182.0, 3184.0, 4859.0, 7624.0, 11832.0, 18857.0, 30888.0, 50218.0, 85151.0, 145657.0, 223175.0, 184707.0, 108962.0, 63364.0, 38649.0, 23642.0, 14626.0, 9249.0, 5920.0, 3981.0, 2586.0, 1657.0, 1128.0, 751.0, 487.0, 345.0, 219.0, 144.0, 112.0, 60.0, 46.0, 36.0, 32.0, 8.0, 6.0, 12.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.309814453125, -0.2997322082519531, -0.28964996337890625, -0.2795677185058594, -0.2694854736328125, -0.2594032287597656, -0.24932098388671875, -0.23923873901367188, -0.229156494140625, -0.21907424926757812, -0.20899200439453125, -0.19890975952148438, -0.1888275146484375, -0.17874526977539062, -0.16866302490234375, -0.15858078002929688, -0.14849853515625, -0.13841629028320312, -0.12833404541015625, -0.11825180053710938, -0.1081695556640625, -0.09808731079101562, -0.08800506591796875, -0.07792282104492188, -0.067840576171875, -0.057758331298828125, -0.04767608642578125, -0.037593841552734375, -0.0275115966796875, -0.017429351806640625, -0.00734710693359375, 0.002735137939453125, 0.0128173828125, 0.022899627685546875, 0.03298187255859375, 0.043064117431640625, 0.0531463623046875, 0.06322860717773438, 0.07331085205078125, 0.08339309692382812, 0.093475341796875, 0.10355758666992188, 0.11363983154296875, 0.12372207641601562, 0.1338043212890625, 0.14388656616210938, 0.15396881103515625, 0.16405105590820312, 0.17413330078125, 0.18421554565429688, 0.19429779052734375, 0.20438003540039062, 0.2144622802734375, 0.22454452514648438, 0.23462677001953125, 0.24470901489257812, 0.254791259765625, 0.2648735046386719, 0.27495574951171875, 0.2850379943847656, 0.2951202392578125, 0.3052024841308594, 0.31528472900390625, 0.3253669738769531, 0.33544921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 7.0, 11.0, 15.0, 4.0, 12.0, 16.0, 21.0, 16.0, 25.0, 32.0, 24.0, 27.0, 31.0, 33.0, 38.0, 38.0, 39.0, 52.0, 1060.0, 51.0, 50.0, 32.0, 35.0, 30.0, 35.0, 32.0, 32.0, 31.0, 30.0, 20.0, 13.0, 24.0, 17.0, 14.0, 14.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.560546875, -1.505767822265625, -1.45098876953125, -1.396209716796875, -1.3414306640625, -1.286651611328125, -1.23187255859375, -1.177093505859375, -1.122314453125, -1.067535400390625, -1.01275634765625, -0.957977294921875, -0.9031982421875, -0.848419189453125, -0.79364013671875, -0.738861083984375, -0.68408203125, -0.629302978515625, -0.57452392578125, -0.519744873046875, -0.4649658203125, -0.410186767578125, -0.35540771484375, -0.300628662109375, -0.245849609375, -0.191070556640625, -0.13629150390625, -0.081512451171875, -0.0267333984375, 0.028045654296875, 0.08282470703125, 0.137603759765625, 0.1923828125, 0.247161865234375, 0.30194091796875, 0.356719970703125, 0.4114990234375, 0.466278076171875, 0.52105712890625, 0.575836181640625, 0.630615234375, 0.685394287109375, 0.74017333984375, 0.794952392578125, 0.8497314453125, 0.904510498046875, 0.95928955078125, 1.014068603515625, 1.06884765625, 1.123626708984375, 1.17840576171875, 1.233184814453125, 1.2879638671875, 1.342742919921875, 1.39752197265625, 1.452301025390625, 1.507080078125, 1.561859130859375, 1.61663818359375, 1.671417236328125, 1.7261962890625, 1.780975341796875, 1.83575439453125, 1.890533447265625, 1.9453125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 5.0, 10.0, 16.0, 21.0, 23.0, 35.0, 56.0, 83.0, 146.0, 188.0, 272.0, 468.0, 659.0, 972.0, 1508.0, 2353.0, 3640.0, 5671.0, 8999.0, 14453.0, 23474.0, 39214.0, 66121.0, 115581.0, 199311.0, 1273222.0, 140118.0, 79842.0, 46663.0, 27699.0, 16856.0, 10501.0, 6723.0, 4253.0, 2718.0, 1809.0, 1200.0, 790.0, 489.0, 343.0, 225.0, 151.0, 90.0, 57.0, 38.0, 27.0, 20.0, 14.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.305908203125, -0.2969551086425781, -0.28800201416015625, -0.2790489196777344, -0.2700958251953125, -0.2611427307128906, -0.25218963623046875, -0.24323654174804688, -0.234283447265625, -0.22533035278320312, -0.21637725830078125, -0.20742416381835938, -0.1984710693359375, -0.18951797485351562, -0.18056488037109375, -0.17161178588867188, -0.16265869140625, -0.15370559692382812, -0.14475250244140625, -0.13579940795898438, -0.1268463134765625, -0.11789321899414062, -0.10894012451171875, -0.09998703002929688, -0.091033935546875, -0.08208084106445312, -0.07312774658203125, -0.06417465209960938, -0.0552215576171875, -0.046268463134765625, -0.03731536865234375, -0.028362274169921875, -0.0194091796875, -0.010456085205078125, -0.00150299072265625, 0.007450103759765625, 0.0164031982421875, 0.025356292724609375, 0.03430938720703125, 0.043262481689453125, 0.052215576171875, 0.061168670654296875, 0.07012176513671875, 0.07907485961914062, 0.0880279541015625, 0.09698104858398438, 0.10593414306640625, 0.11488723754882812, 0.12384033203125, 0.13279342651367188, 0.14174652099609375, 0.15069961547851562, 0.1596527099609375, 0.16860580444335938, 0.17755889892578125, 0.18651199340820312, 0.195465087890625, 0.20441818237304688, 0.21337127685546875, 0.22232437133789062, 0.2312774658203125, 0.24023056030273438, 0.24918365478515625, 0.2581367492675781, 0.26708984375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 9.0, 13.0, 23.0, 30.0, 38.0, 20.0, 35.0, 45.0, 44.0, 44.0, 66.0, 55.0, 60.0, 51.0, 57.0, 67.0, 45.0, 50.0, 37.0, 29.0, 36.0, 30.0, 20.0, 13.0, 15.0, 10.0, 14.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008945465087890625, -0.000864759087562561, -0.0008349716663360596, -0.0008051842451095581, -0.0007753968238830566, -0.0007456094026565552, -0.0007158219814300537, -0.0006860345602035522, -0.0006562471389770508, -0.0006264597177505493, -0.0005966722965240479, -0.0005668848752975464, -0.0005370974540710449, -0.0005073100328445435, -0.000477522611618042, -0.00044773519039154053, -0.00041794776916503906, -0.0003881603479385376, -0.00035837292671203613, -0.00032858550548553467, -0.0002987980842590332, -0.00026901066303253174, -0.00023922324180603027, -0.0002094358205795288, -0.00017964839935302734, -0.00014986097812652588, -0.00012007355690002441, -9.028613567352295e-05, -6.0498714447021484e-05, -3.071129322052002e-05, -9.238719940185547e-07, 2.886354923248291e-05, 5.8650970458984375e-05, 8.843839168548584e-05, 0.0001182258129119873, 0.00014801323413848877, 0.00017780065536499023, 0.0002075880765914917, 0.00023737549781799316, 0.00026716291904449463, 0.0002969503402709961, 0.00032673776149749756, 0.000356525182723999, 0.0003863126039505005, 0.00041610002517700195, 0.0004458874464035034, 0.0004756748676300049, 0.0005054622888565063, 0.0005352497100830078, 0.0005650371313095093, 0.0005948245525360107, 0.0006246119737625122, 0.0006543993949890137, 0.0006841868162155151, 0.0007139742374420166, 0.0007437616586685181, 0.0007735490798950195, 0.000803336501121521, 0.0008331239223480225, 0.0008629113435745239, 0.0008926987648010254, 0.0009224861860275269, 0.0009522736072540283, 0.0009820610284805298, 0.0010118484497070312]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 6.0, 4.0, 8.0, 13.0, 13.0, 16.0, 13.0, 26.0, 36.0, 45.0, 61.0, 71.0, 96.0, 146.0, 291.0, 746.0, 10334.0, 1016861.0, 18014.0, 844.0, 299.0, 150.0, 115.0, 88.0, 65.0, 51.0, 47.0, 25.0, 19.0, 12.0, 9.0, 10.0, 9.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0223541259765625, -0.02170705795288086, -0.02105998992919922, -0.020412921905517578, -0.019765853881835938, -0.019118785858154297, -0.018471717834472656, -0.017824649810791016, -0.017177581787109375, -0.016530513763427734, -0.015883445739746094, -0.015236377716064453, -0.014589309692382812, -0.013942241668701172, -0.013295173645019531, -0.01264810562133789, -0.01200103759765625, -0.01135396957397461, -0.010706901550292969, -0.010059833526611328, -0.009412765502929688, -0.008765697479248047, -0.008118629455566406, -0.007471561431884766, -0.006824493408203125, -0.006177425384521484, -0.005530357360839844, -0.004883289337158203, -0.0042362213134765625, -0.003589153289794922, -0.0029420852661132812, -0.0022950172424316406, -0.00164794921875, -0.0010008811950683594, -0.00035381317138671875, 0.0002932548522949219, 0.0009403228759765625, 0.0015873908996582031, 0.0022344589233398438, 0.0028815269470214844, 0.003528594970703125, 0.004175662994384766, 0.004822731018066406, 0.005469799041748047, 0.0061168670654296875, 0.006763935089111328, 0.007411003112792969, 0.00805807113647461, 0.00870513916015625, 0.00935220718383789, 0.009999275207519531, 0.010646343231201172, 0.011293411254882812, 0.011940479278564453, 0.012587547302246094, 0.013234615325927734, 0.013881683349609375, 0.014528751373291016, 0.015175819396972656, 0.015822887420654297, 0.016469955444335938, 0.017117023468017578, 0.01776409149169922, 0.01841115951538086, 0.0190582275390625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 51.0, 178.0, 325.0, 273.0, 135.0, 32.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036826252471655607, -0.0003052189131267369, -0.00024217528698500246, -0.00017913166084326804, -0.00011608804925344884, -5.304443766362965e-05, 9.999203030019999e-06, 7.304281461983919e-05, 0.00013608642620965838, 0.00019913003779947758, 0.00026217364938929677, 0.0003252172900829464, 0.0003882609016727656, 0.0004513045132625848, 0.0005143481539562345, 0.0005773917655460536, 0.0006404353771358728, 0.000703478988725692, 0.0007665226003155112, 0.0008295662701129913, 0.0008926098234951496, 0.0009556534932926297, 0.0010186971630901098, 0.001081740716472268, 0.0011447842698544264, 0.0012078279396519065, 0.0012708714930340648, 0.0013339151628315449, 0.0013969587162137032, 0.0014600023860111833, 0.0015230460558086634, 0.0015860896091908216, 0.0016491333954036236, 0.0017121770652011037, 0.001775220618583262, 0.001838264288380742, 0.0019013078417629004, 0.0019643513951450586, 0.0020273951813578606, 0.002090438734740019, 0.002153482288122177, 0.0022165258415043354, 0.0022795696277171373, 0.0023426131810992956, 0.002405656734481454, 0.002468700287863612, 0.002531744074076414, 0.0025947876274585724, 0.0026578311808407307, 0.002720874734222889, 0.002783918520435691, 0.002846962073817849, 0.0029100056272000074, 0.0029730491805821657, 0.0030360929667949677, 0.003099136520177126, 0.003162180306389928, 0.003225223859772086, 0.003288267645984888, 0.0033513111993670464, 0.0034143547527492046, 0.003477398306131363, 0.003540442092344165, 0.003603485645726323, 0.0036665291991084814]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 4.0, 7.0, 16.0, 15.0, 12.0, 20.0, 19.0, 28.0, 27.0, 30.0, 25.0, 35.0, 38.0, 41.0, 38.0, 33.0, 39.0, 33.0, 33.0, 45.0, 43.0, 46.0, 32.0, 48.0, 29.0, 34.0, 33.0, 32.0, 24.0, 22.0, 16.0, 25.0, 10.0, 13.0, 7.0, 9.0, 6.0, 4.0, 3.0, 9.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0004811286926269531, -0.0004660738632082939, -0.0004510190337896347, -0.0004359642043709755, -0.0004209093749523163, -0.0004058545455336571, -0.00039079971611499786, -0.00037574488669633865, -0.00036069005727767944, -0.00034563522785902023, -0.000330580398440361, -0.0003155255690217018, -0.0003004707396030426, -0.0002854159101843834, -0.0002703610807657242, -0.00025530625134706497, -0.00024025142192840576, -0.00022519659250974655, -0.00021014176309108734, -0.00019508693367242813, -0.00018003210425376892, -0.0001649772748351097, -0.0001499224454164505, -0.0001348676159977913, -0.00011981278657913208, -0.00010475795716047287, -8.970312774181366e-05, -7.464829832315445e-05, -5.959346890449524e-05, -4.453863948583603e-05, -2.948381006717682e-05, -1.4428980648517609e-05, 6.258487701416016e-07, 1.5680678188800812e-05, 3.073550760746002e-05, 4.579033702611923e-05, 6.084516644477844e-05, 7.589999586343765e-05, 9.095482528209686e-05, 0.00010600965470075607, 0.00012106448411941528, 0.0001361193135380745, 0.0001511741429567337, 0.00016622897237539291, 0.00018128380179405212, 0.00019633863121271133, 0.00021139346063137054, 0.00022644829005002975, 0.00024150311946868896, 0.0002565579488873482, 0.0002716127783060074, 0.0002866676077246666, 0.0003017224371433258, 0.000316777266561985, 0.0003318320959806442, 0.00034688692539930344, 0.00036194175481796265, 0.00037699658423662186, 0.00039205141365528107, 0.0004071062430739403, 0.0004221610724925995, 0.0004372159019112587, 0.0004522707313299179, 0.0004673255607485771, 0.00048238039016723633]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 22.0, 14.0, 29.0, 25.0, 26.0, 32.0, 33.0, 33.0, 45.0, 44.0, 41.0, 44.0, 39.0, 39.0, 47.0, 34.0, 45.0, 28.0, 31.0, 36.0, 35.0, 29.0, 41.0, 33.0, 19.0, 14.0, 14.0, 15.0, 10.0, 13.0, 9.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.328125, -3.236297607421875, -3.14447021484375, -3.052642822265625, -2.9608154296875, -2.868988037109375, -2.77716064453125, -2.685333251953125, -2.593505859375, -2.501678466796875, -2.40985107421875, -2.318023681640625, -2.2261962890625, -2.134368896484375, -2.04254150390625, -1.950714111328125, -1.85888671875, -1.767059326171875, -1.67523193359375, -1.583404541015625, -1.4915771484375, -1.399749755859375, -1.30792236328125, -1.216094970703125, -1.124267578125, -1.032440185546875, -0.94061279296875, -0.848785400390625, -0.7569580078125, -0.665130615234375, -0.57330322265625, -0.481475830078125, -0.3896484375, -0.297821044921875, -0.20599365234375, -0.114166259765625, -0.0223388671875, 0.069488525390625, 0.16131591796875, 0.253143310546875, 0.344970703125, 0.436798095703125, 0.52862548828125, 0.620452880859375, 0.7122802734375, 0.804107666015625, 0.89593505859375, 0.987762451171875, 1.07958984375, 1.171417236328125, 1.26324462890625, 1.355072021484375, 1.4468994140625, 1.538726806640625, 1.63055419921875, 1.722381591796875, 1.814208984375, 1.906036376953125, 1.99786376953125, 2.089691162109375, 2.1815185546875, 2.273345947265625, 2.36517333984375, 2.457000732421875, 2.548828125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 8.0, 11.0, 16.0, 15.0, 16.0, 22.0, 27.0, 30.0, 53.0, 66.0, 68.0, 120.0, 191.0, 376.0, 743.0, 1672.0, 3992.0, 9455.0, 22631.0, 52859.0, 120691.0, 278313.0, 313941.0, 137597.0, 60436.0, 25803.0, 11000.0, 4521.0, 1922.0, 817.0, 394.0, 211.0, 146.0, 80.0, 72.0, 56.0, 41.0, 27.0, 26.0, 25.0, 12.0, 14.0, 12.0, 5.0, 7.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-3.48046875, -3.384002685546875, -3.28753662109375, -3.191070556640625, -3.0946044921875, -2.998138427734375, -2.90167236328125, -2.805206298828125, -2.708740234375, -2.612274169921875, -2.51580810546875, -2.419342041015625, -2.3228759765625, -2.226409912109375, -2.12994384765625, -2.033477783203125, -1.93701171875, -1.840545654296875, -1.74407958984375, -1.647613525390625, -1.5511474609375, -1.454681396484375, -1.35821533203125, -1.261749267578125, -1.165283203125, -1.068817138671875, -0.97235107421875, -0.875885009765625, -0.7794189453125, -0.682952880859375, -0.58648681640625, -0.490020751953125, -0.3935546875, -0.297088623046875, -0.20062255859375, -0.104156494140625, -0.0076904296875, 0.088775634765625, 0.18524169921875, 0.281707763671875, 0.378173828125, 0.474639892578125, 0.57110595703125, 0.667572021484375, 0.7640380859375, 0.860504150390625, 0.95697021484375, 1.053436279296875, 1.14990234375, 1.246368408203125, 1.34283447265625, 1.439300537109375, 1.5357666015625, 1.632232666015625, 1.72869873046875, 1.825164794921875, 1.921630859375, 2.018096923828125, 2.11456298828125, 2.211029052734375, 2.3074951171875, 2.403961181640625, 2.50042724609375, 2.596893310546875, 2.693359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 11.0, 8.0, 8.0, 5.0, 12.0, 23.0, 16.0, 14.0, 23.0, 32.0, 37.0, 30.0, 34.0, 39.0, 36.0, 46.0, 58.0, 88.0, 187.0, 1442.0, 306.0, 132.0, 66.0, 43.0, 41.0, 40.0, 35.0, 25.0, 27.0, 24.0, 30.0, 21.0, 18.0, 12.0, 13.0, 10.0, 7.0, 11.0, 11.0, 10.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.796875, -8.520263671875, -8.24365234375, -7.967041015625, -7.6904296875, -7.413818359375, -7.13720703125, -6.860595703125, -6.583984375, -6.307373046875, -6.03076171875, -5.754150390625, -5.4775390625, -5.200927734375, -4.92431640625, -4.647705078125, -4.37109375, -4.094482421875, -3.81787109375, -3.541259765625, -3.2646484375, -2.988037109375, -2.71142578125, -2.434814453125, -2.158203125, -1.881591796875, -1.60498046875, -1.328369140625, -1.0517578125, -0.775146484375, -0.49853515625, -0.221923828125, 0.0546875, 0.331298828125, 0.60791015625, 0.884521484375, 1.1611328125, 1.437744140625, 1.71435546875, 1.990966796875, 2.267578125, 2.544189453125, 2.82080078125, 3.097412109375, 3.3740234375, 3.650634765625, 3.92724609375, 4.203857421875, 4.48046875, 4.757080078125, 5.03369140625, 5.310302734375, 5.5869140625, 5.863525390625, 6.14013671875, 6.416748046875, 6.693359375, 6.969970703125, 7.24658203125, 7.523193359375, 7.7998046875, 8.076416015625, 8.35302734375, 8.629638671875, 8.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 9.0, 8.0, 10.0, 16.0, 15.0, 16.0, 27.0, 33.0, 51.0, 56.0, 93.0, 135.0, 238.0, 514.0, 1176.0, 17447.0, 3116982.0, 6715.0, 1004.0, 434.0, 220.0, 139.0, 90.0, 62.0, 43.0, 32.0, 31.0, 17.0, 24.0, 13.0, 10.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.09375, -38.85693359375, -37.6201171875, -36.38330078125, -35.146484375, -33.90966796875, -32.6728515625, -31.43603515625, -30.19921875, -28.96240234375, -27.7255859375, -26.48876953125, -25.251953125, -24.01513671875, -22.7783203125, -21.54150390625, -20.3046875, -19.06787109375, -17.8310546875, -16.59423828125, -15.357421875, -14.12060546875, -12.8837890625, -11.64697265625, -10.41015625, -9.17333984375, -7.9365234375, -6.69970703125, -5.462890625, -4.22607421875, -2.9892578125, -1.75244140625, -0.515625, 0.72119140625, 1.9580078125, 3.19482421875, 4.431640625, 5.66845703125, 6.9052734375, 8.14208984375, 9.37890625, 10.61572265625, 11.8525390625, 13.08935546875, 14.326171875, 15.56298828125, 16.7998046875, 18.03662109375, 19.2734375, 20.51025390625, 21.7470703125, 22.98388671875, 24.220703125, 25.45751953125, 26.6943359375, 27.93115234375, 29.16796875, 30.40478515625, 31.6416015625, 32.87841796875, 34.115234375, 35.35205078125, 36.5888671875, 37.82568359375, 39.0625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 67.0, 357.0, 404.0, 165.0, 18.0, 3.0], "bins": [-90.95111083984375, -89.43952941894531, -87.92794036865234, -86.4163589477539, -84.90476989746094, -83.3931884765625, -81.88160705566406, -80.3700180053711, -78.85843658447266, -77.34685516357422, -75.83526611328125, -74.32368469238281, -72.81209564208984, -71.3005142211914, -69.78892517089844, -68.27734375, -66.76575469970703, -65.2541732788086, -63.742584228515625, -62.23100280761719, -60.719417572021484, -59.20783233642578, -57.69624710083008, -56.184661865234375, -54.67308044433594, -53.161495208740234, -51.64990997314453, -50.138328552246094, -48.62674331665039, -47.11515808105469, -45.603572845458984, -44.09198760986328, -42.58039855957031, -41.06881332397461, -39.557228088378906, -38.04564666748047, -36.534061431884766, -35.02247619628906, -33.51089096069336, -31.999305725097656, -30.487722396850586, -28.976137161254883, -27.464553833007812, -25.95296859741211, -24.441383361816406, -22.929798126220703, -21.418214797973633, -19.90662956237793, -18.39504623413086, -16.883460998535156, -15.37187671661377, -13.860292434692383, -12.34870719909668, -10.837122917175293, -9.325538635253906, -7.813953399658203, -6.302368640899658, -4.790783882141113, -3.2791993618011475, -1.7676148414611816, -0.2560300827026367, 1.2555546760559082, 2.767138957977295, 4.278724193572998, 5.790308475494385]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 6.0, 18.0, 18.0, 17.0, 13.0, 32.0, 28.0, 21.0, 24.0, 25.0, 22.0, 33.0, 27.0, 40.0, 33.0, 38.0, 33.0, 48.0, 38.0, 26.0, 31.0, 43.0, 30.0, 30.0, 29.0, 39.0, 33.0, 29.0, 26.0, 15.0, 26.0, 13.0, 12.0, 12.0, 9.0, 14.0, 13.0, 6.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.692134857177734, -19.065324783325195, -18.438514709472656, -17.81170654296875, -17.18489646911621, -16.558086395263672, -15.931276321411133, -15.304466247558594, -14.677657127380371, -14.050847053527832, -13.42403793334961, -12.79722785949707, -12.170417785644531, -11.543608665466309, -10.91679859161377, -10.289989471435547, -9.663179397583008, -9.036369323730469, -8.409560203552246, -7.782750129699707, -7.155940532684326, -6.529130935668945, -5.902320861816406, -5.275511264801025, -4.6487016677856445, -4.021892070770264, -3.3950822353363037, -2.7682723999023438, -2.141462802886963, -1.514653205871582, -0.8878433704376221, -0.2610335350036621, 0.36577796936035156, 0.992587685585022, 1.6193974018096924, 2.2462072372436523, 2.873016834259033, 3.499826431274414, 4.126636505126953, 4.753446102142334, 5.380255699157715, 6.007065296173096, 6.633874893188477, 7.260684967041016, 7.8874945640563965, 8.514304161071777, 9.141114234924316, 9.767923355102539, 10.394733428955078, 11.021543502807617, 11.64835262298584, 12.275162696838379, 12.901971817016602, 13.52878189086914, 14.15559196472168, 14.782402038574219, 15.409211158752441, 16.036020278930664, 16.662830352783203, 17.289640426635742, 17.91645050048828, 18.543258666992188, 19.170068740844727, 19.796878814697266, 20.423688888549805]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 6.0, 11.0, 9.0, 12.0, 8.0, 27.0, 16.0, 23.0, 34.0, 31.0, 29.0, 40.0, 28.0, 35.0, 43.0, 40.0, 40.0, 43.0, 40.0, 38.0, 56.0, 35.0, 35.0, 45.0, 31.0, 39.0, 26.0, 15.0, 32.0, 21.0, 15.0, 21.0, 10.0, 14.0, 12.0, 4.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.455078125, -3.350677490234375, -3.24627685546875, -3.141876220703125, -3.0374755859375, -2.933074951171875, -2.82867431640625, -2.724273681640625, -2.619873046875, -2.515472412109375, -2.41107177734375, -2.306671142578125, -2.2022705078125, -2.097869873046875, -1.99346923828125, -1.889068603515625, -1.78466796875, -1.680267333984375, -1.57586669921875, -1.471466064453125, -1.3670654296875, -1.262664794921875, -1.15826416015625, -1.053863525390625, -0.949462890625, -0.845062255859375, -0.74066162109375, -0.636260986328125, -0.5318603515625, -0.427459716796875, -0.32305908203125, -0.218658447265625, -0.1142578125, -0.009857177734375, 0.09454345703125, 0.198944091796875, 0.3033447265625, 0.407745361328125, 0.51214599609375, 0.616546630859375, 0.720947265625, 0.825347900390625, 0.92974853515625, 1.034149169921875, 1.1385498046875, 1.242950439453125, 1.34735107421875, 1.451751708984375, 1.55615234375, 1.660552978515625, 1.76495361328125, 1.869354248046875, 1.9737548828125, 2.078155517578125, 2.18255615234375, 2.286956787109375, 2.391357421875, 2.495758056640625, 2.60015869140625, 2.704559326171875, 2.8089599609375, 2.913360595703125, 3.01776123046875, 3.122161865234375, 3.2265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 16.0, 9.0, 23.0, 17.0, 24.0, 26.0, 29.0, 53.0, 63.0, 68.0, 95.0, 116.0, 158.0, 344.0, 1104.0, 13575.0, 467158.0, 3162709.0, 530768.0, 15528.0, 1274.0, 398.0, 155.0, 120.0, 70.0, 79.0, 61.0, 50.0, 43.0, 28.0, 26.0, 18.0, 14.0, 13.0, 10.0, 8.0, 11.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.171875, -9.868408203125, -9.56494140625, -9.261474609375, -8.9580078125, -8.654541015625, -8.35107421875, -8.047607421875, -7.744140625, -7.440673828125, -7.13720703125, -6.833740234375, -6.5302734375, -6.226806640625, -5.92333984375, -5.619873046875, -5.31640625, -5.012939453125, -4.70947265625, -4.406005859375, -4.1025390625, -3.799072265625, -3.49560546875, -3.192138671875, -2.888671875, -2.585205078125, -2.28173828125, -1.978271484375, -1.6748046875, -1.371337890625, -1.06787109375, -0.764404296875, -0.4609375, -0.157470703125, 0.14599609375, 0.449462890625, 0.7529296875, 1.056396484375, 1.35986328125, 1.663330078125, 1.966796875, 2.270263671875, 2.57373046875, 2.877197265625, 3.1806640625, 3.484130859375, 3.78759765625, 4.091064453125, 4.39453125, 4.697998046875, 5.00146484375, 5.304931640625, 5.6083984375, 5.911865234375, 6.21533203125, 6.518798828125, 6.822265625, 7.125732421875, 7.42919921875, 7.732666015625, 8.0361328125, 8.339599609375, 8.64306640625, 8.946533203125, 9.25]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 10.0, 2.0, 3.0, 12.0, 10.0, 13.0, 23.0, 30.0, 30.0, 44.0, 58.0, 74.0, 95.0, 135.0, 197.0, 237.0, 339.0, 435.0, 473.0, 447.0, 363.0, 275.0, 196.0, 161.0, 101.0, 74.0, 56.0, 37.0, 41.0, 29.0, 11.0, 19.0, 12.0, 10.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.18682861328125, -6.0025634765625, -5.81829833984375, -5.634033203125, -5.44976806640625, -5.2655029296875, -5.08123779296875, -4.89697265625, -4.71270751953125, -4.5284423828125, -4.34417724609375, -4.159912109375, -3.97564697265625, -3.7913818359375, -3.60711669921875, -3.4228515625, -3.23858642578125, -3.0543212890625, -2.87005615234375, -2.685791015625, -2.50152587890625, -2.3172607421875, -2.13299560546875, -1.94873046875, -1.76446533203125, -1.5802001953125, -1.39593505859375, -1.211669921875, -1.02740478515625, -0.8431396484375, -0.65887451171875, -0.474609375, -0.29034423828125, -0.1060791015625, 0.07818603515625, 0.262451171875, 0.44671630859375, 0.6309814453125, 0.81524658203125, 0.99951171875, 1.18377685546875, 1.3680419921875, 1.55230712890625, 1.736572265625, 1.92083740234375, 2.1051025390625, 2.28936767578125, 2.4736328125, 2.65789794921875, 2.8421630859375, 3.02642822265625, 3.210693359375, 3.39495849609375, 3.5792236328125, 3.76348876953125, 3.94775390625, 4.13201904296875, 4.3162841796875, 4.50054931640625, 4.684814453125, 4.86907958984375, 5.0533447265625, 5.23760986328125, 5.421875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 16.0, 10.0, 17.0, 32.0, 34.0, 36.0, 57.0, 74.0, 103.0, 168.0, 222.0, 388.0, 632.0, 9093.0, 3940261.0, 240539.0, 1177.0, 439.0, 279.0, 191.0, 122.0, 89.0, 83.0, 43.0, 45.0, 26.0, 21.0, 15.0, 13.0, 11.0, 5.0, 5.0, 4.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.359375, -27.405517578125, -26.45166015625, -25.497802734375, -24.5439453125, -23.590087890625, -22.63623046875, -21.682373046875, -20.728515625, -19.774658203125, -18.82080078125, -17.866943359375, -16.9130859375, -15.959228515625, -15.00537109375, -14.051513671875, -13.09765625, -12.143798828125, -11.18994140625, -10.236083984375, -9.2822265625, -8.328369140625, -7.37451171875, -6.420654296875, -5.466796875, -4.512939453125, -3.55908203125, -2.605224609375, -1.6513671875, -0.697509765625, 0.25634765625, 1.210205078125, 2.1640625, 3.117919921875, 4.07177734375, 5.025634765625, 5.9794921875, 6.933349609375, 7.88720703125, 8.841064453125, 9.794921875, 10.748779296875, 11.70263671875, 12.656494140625, 13.6103515625, 14.564208984375, 15.51806640625, 16.471923828125, 17.42578125, 18.379638671875, 19.33349609375, 20.287353515625, 21.2412109375, 22.195068359375, 23.14892578125, 24.102783203125, 25.056640625, 26.010498046875, 26.96435546875, 27.918212890625, 28.8720703125, 29.825927734375, 30.77978515625, 31.733642578125, 32.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 21.0, 75.0, 188.0, 310.0, 240.0, 136.0, 37.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.42640495300293, -12.593167304992676, -10.759929656982422, -8.926691055297852, -7.093453407287598, -5.260215759277344, -3.4269771575927734, -1.5937395095825195, 0.23949813842773438, 2.0727360248565674, 3.9059739112854004, 5.7392120361328125, 7.572449684143066, 9.40568733215332, 11.23892593383789, 13.072163581848145, 14.905401229858398, 16.73863983154297, 18.571876525878906, 20.405115127563477, 22.238353729248047, 24.071590423583984, 25.904829025268555, 27.738067626953125, 29.571304321289062, 31.404542922973633, 33.2377815246582, 35.07101821899414, 36.90425491333008, 38.73749542236328, 40.57073211669922, 42.403968811035156, 44.237205505371094, 46.07044219970703, 47.903682708740234, 49.73691940307617, 51.57015609741211, 53.40339660644531, 55.23663330078125, 57.06986999511719, 58.903106689453125, 60.73634338378906, 62.569583892822266, 64.40281677246094, 66.2360610961914, 68.06929779052734, 69.90253448486328, 71.73577117919922, 73.56901550292969, 75.40225219726562, 77.23548889160156, 79.0687255859375, 80.90196990966797, 82.7352066040039, 84.56844329833984, 86.40167999267578, 88.23491668701172, 90.06815338134766, 91.9013900756836, 93.73463439941406, 95.56787109375, 97.40110778808594, 99.23434448242188, 101.06758117675781, 102.90081787109375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 8.0, 7.0, 11.0, 11.0, 17.0, 17.0, 16.0, 30.0, 27.0, 29.0, 29.0, 38.0, 41.0, 37.0, 49.0, 57.0, 52.0, 49.0, 41.0, 40.0, 34.0, 51.0, 30.0, 39.0, 36.0, 39.0, 30.0, 17.0, 26.0, 14.0, 12.0, 8.0, 12.0, 11.0, 9.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.768802642822266, -22.105358123779297, -21.441913604736328, -20.77846908569336, -20.11502456665039, -19.451580047607422, -18.788135528564453, -18.124691009521484, -17.461246490478516, -16.797801971435547, -16.134357452392578, -15.47091293334961, -14.80746841430664, -14.144023895263672, -13.48058032989502, -12.81713581085205, -12.153692245483398, -11.49024772644043, -10.826803207397461, -10.163358688354492, -9.499914169311523, -8.836469650268555, -8.173026084899902, -7.509581565856934, -6.846137046813965, -6.182692527770996, -5.519248008728027, -4.855803966522217, -4.192359447479248, -3.5289149284362793, -2.8654706478118896, -2.2020263671875, -1.5385799407958984, -0.8751355409622192, -0.21169114112854004, 0.45175325870513916, 1.1151976585388184, 1.778642177581787, 2.4420864582061768, 3.1055307388305664, 3.768975257873535, 4.432419776916504, 5.095864295959473, 5.759308338165283, 6.422752857208252, 7.086197376251221, 7.749641418457031, 8.4130859375, 9.076530456542969, 9.739974975585938, 10.403419494628906, 11.066864013671875, 11.730308532714844, 12.393753051757812, 13.057196617126465, 13.720641136169434, 14.384085655212402, 15.047530174255371, 15.71097469329834, 16.374418258666992, 17.03786277770996, 17.70130729675293, 18.3647518157959, 19.028196334838867, 19.691640853881836]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 3.0, 10.0, 9.0, 9.0, 8.0, 19.0, 16.0, 22.0, 25.0, 22.0, 27.0, 36.0, 34.0, 36.0, 34.0, 27.0, 37.0, 54.0, 40.0, 37.0, 39.0, 42.0, 42.0, 39.0, 48.0, 40.0, 27.0, 26.0, 30.0, 28.0, 21.0, 11.0, 12.0, 19.0, 12.0, 17.0, 7.0, 9.0, 5.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.54296875, -3.4454345703125, -3.347900390625, -3.2503662109375, -3.15283203125, -3.0552978515625, -2.957763671875, -2.8602294921875, -2.7626953125, -2.6651611328125, -2.567626953125, -2.4700927734375, -2.37255859375, -2.2750244140625, -2.177490234375, -2.0799560546875, -1.982421875, -1.8848876953125, -1.787353515625, -1.6898193359375, -1.59228515625, -1.4947509765625, -1.397216796875, -1.2996826171875, -1.2021484375, -1.1046142578125, -1.007080078125, -0.9095458984375, -0.81201171875, -0.7144775390625, -0.616943359375, -0.5194091796875, -0.421875, -0.3243408203125, -0.226806640625, -0.1292724609375, -0.03173828125, 0.0657958984375, 0.163330078125, 0.2608642578125, 0.3583984375, 0.4559326171875, 0.553466796875, 0.6510009765625, 0.74853515625, 0.8460693359375, 0.943603515625, 1.0411376953125, 1.138671875, 1.2362060546875, 1.333740234375, 1.4312744140625, 1.52880859375, 1.6263427734375, 1.723876953125, 1.8214111328125, 1.9189453125, 2.0164794921875, 2.114013671875, 2.2115478515625, 2.30908203125, 2.4066162109375, 2.504150390625, 2.6016845703125, 2.69921875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 14.0, 16.0, 23.0, 36.0, 75.0, 80.0, 104.0, 143.0, 210.0, 322.0, 444.0, 673.0, 808.0, 1266.0, 1721.0, 2394.0, 3479.0, 4890.0, 6853.0, 9853.0, 14136.0, 21067.0, 31714.0, 47856.0, 74776.0, 117316.0, 176022.0, 180315.0, 121587.0, 77489.0, 49603.0, 32404.0, 21797.0, 14797.0, 10144.0, 7063.0, 4980.0, 3517.0, 2474.0, 1779.0, 1231.0, 899.0, 648.0, 465.0, 322.0, 230.0, 165.0, 112.0, 73.0, 58.0, 42.0, 26.0, 16.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0], "bins": [-0.297607421875, -0.2883186340332031, -0.27902984619140625, -0.2697410583496094, -0.2604522705078125, -0.2511634826660156, -0.24187469482421875, -0.23258590698242188, -0.223297119140625, -0.21400833129882812, -0.20471954345703125, -0.19543075561523438, -0.1861419677734375, -0.17685317993164062, -0.16756439208984375, -0.15827560424804688, -0.14898681640625, -0.13969802856445312, -0.13040924072265625, -0.12112045288085938, -0.1118316650390625, -0.10254287719726562, -0.09325408935546875, -0.08396530151367188, -0.074676513671875, -0.06538772583007812, -0.05609893798828125, -0.046810150146484375, -0.0375213623046875, -0.028232574462890625, -0.01894378662109375, -0.009654998779296875, -0.0003662109375, 0.008922576904296875, 0.01821136474609375, 0.027500152587890625, 0.0367889404296875, 0.046077728271484375, 0.05536651611328125, 0.06465530395507812, 0.073944091796875, 0.08323287963867188, 0.09252166748046875, 0.10181045532226562, 0.1110992431640625, 0.12038803100585938, 0.12967681884765625, 0.13896560668945312, 0.14825439453125, 0.15754318237304688, 0.16683197021484375, 0.17612075805664062, 0.1854095458984375, 0.19469833374023438, 0.20398712158203125, 0.21327590942382812, 0.222564697265625, 0.23185348510742188, 0.24114227294921875, 0.2504310607910156, 0.2597198486328125, 0.2690086364746094, 0.27829742431640625, 0.2875862121582031, 0.296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 7.0, 8.0, 15.0, 14.0, 13.0, 12.0, 22.0, 26.0, 25.0, 25.0, 23.0, 32.0, 31.0, 34.0, 49.0, 45.0, 44.0, 1060.0, 47.0, 57.0, 49.0, 44.0, 40.0, 36.0, 32.0, 24.0, 23.0, 34.0, 23.0, 22.0, 21.0, 14.0, 18.0, 12.0, 10.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.173797607421875, -2.10540771484375, -2.037017822265625, -1.9686279296875, -1.900238037109375, -1.83184814453125, -1.763458251953125, -1.695068359375, -1.626678466796875, -1.55828857421875, -1.489898681640625, -1.4215087890625, -1.353118896484375, -1.28472900390625, -1.216339111328125, -1.14794921875, -1.079559326171875, -1.01116943359375, -0.942779541015625, -0.8743896484375, -0.805999755859375, -0.73760986328125, -0.669219970703125, -0.600830078125, -0.532440185546875, -0.46405029296875, -0.395660400390625, -0.3272705078125, -0.258880615234375, -0.19049072265625, -0.122100830078125, -0.0537109375, 0.014678955078125, 0.08306884765625, 0.151458740234375, 0.2198486328125, 0.288238525390625, 0.35662841796875, 0.425018310546875, 0.493408203125, 0.561798095703125, 0.63018798828125, 0.698577880859375, 0.7669677734375, 0.835357666015625, 0.90374755859375, 0.972137451171875, 1.04052734375, 1.108917236328125, 1.17730712890625, 1.245697021484375, 1.3140869140625, 1.382476806640625, 1.45086669921875, 1.519256591796875, 1.587646484375, 1.656036376953125, 1.72442626953125, 1.792816162109375, 1.8612060546875, 1.929595947265625, 1.99798583984375, 2.066375732421875, 2.134765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 11.0, 13.0, 16.0, 28.0, 34.0, 56.0, 63.0, 94.0, 165.0, 216.0, 287.0, 425.0, 684.0, 942.0, 1432.0, 2282.0, 3350.0, 5305.0, 8113.0, 12844.0, 20096.0, 32685.0, 53131.0, 88320.0, 148627.0, 1260752.0, 177725.0, 108575.0, 64784.0, 38984.0, 24119.0, 14963.0, 9545.0, 6094.0, 4146.0, 2697.0, 1866.0, 1176.0, 790.0, 567.0, 393.0, 252.0, 162.0, 121.0, 67.0, 52.0, 36.0, 24.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2944602966308594, -0.28545379638671875, -0.2764472961425781, -0.2674407958984375, -0.2584342956542969, -0.24942779541015625, -0.24042129516601562, -0.231414794921875, -0.22240829467773438, -0.21340179443359375, -0.20439529418945312, -0.1953887939453125, -0.18638229370117188, -0.17737579345703125, -0.16836929321289062, -0.15936279296875, -0.15035629272460938, -0.14134979248046875, -0.13234329223632812, -0.1233367919921875, -0.11433029174804688, -0.10532379150390625, -0.09631729125976562, -0.087310791015625, -0.07830429077148438, -0.06929779052734375, -0.060291290283203125, -0.0512847900390625, -0.042278289794921875, -0.03327178955078125, -0.024265289306640625, -0.0152587890625, -0.006252288818359375, 0.00275421142578125, 0.011760711669921875, 0.0207672119140625, 0.029773712158203125, 0.03878021240234375, 0.047786712646484375, 0.056793212890625, 0.06579971313476562, 0.07480621337890625, 0.08381271362304688, 0.0928192138671875, 0.10182571411132812, 0.11083221435546875, 0.11983871459960938, 0.12884521484375, 0.13785171508789062, 0.14685821533203125, 0.15586471557617188, 0.1648712158203125, 0.17387771606445312, 0.18288421630859375, 0.19189071655273438, 0.200897216796875, 0.20990371704101562, 0.21891021728515625, 0.22791671752929688, 0.2369232177734375, 0.24592971801757812, 0.25493621826171875, 0.2639427185058594, 0.27294921875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 6.0, 13.0, 14.0, 11.0, 19.0, 11.0, 24.0, 45.0, 38.0, 38.0, 64.0, 65.0, 67.0, 71.0, 71.0, 64.0, 67.0, 49.0, 49.0, 43.0, 35.0, 22.0, 23.0, 18.0, 18.0, 13.0, 11.0, 6.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001544952392578125, -0.0015029311180114746, -0.0014609098434448242, -0.0014188885688781738, -0.0013768672943115234, -0.001334846019744873, -0.0012928247451782227, -0.0012508034706115723, -0.0012087821960449219, -0.0011667609214782715, -0.001124739646911621, -0.0010827183723449707, -0.0010406970977783203, -0.00099867582321167, -0.0009566545486450195, -0.0009146332740783691, -0.0008726119995117188, -0.0008305907249450684, -0.000788569450378418, -0.0007465481758117676, -0.0007045269012451172, -0.0006625056266784668, -0.0006204843521118164, -0.000578463077545166, -0.0005364418029785156, -0.0004944205284118652, -0.00045239925384521484, -0.00041037797927856445, -0.00036835670471191406, -0.00032633543014526367, -0.0002843141555786133, -0.0002422928810119629, -0.0002002716064453125, -0.0001582503318786621, -0.00011622905731201172, -7.420778274536133e-05, -3.218650817871094e-05, 9.834766387939453e-06, 5.1856040954589844e-05, 9.387731552124023e-05, 0.00013589859008789062, 0.00017791986465454102, 0.0002199411392211914, 0.0002619624137878418, 0.0003039836883544922, 0.0003460049629211426, 0.00038802623748779297, 0.00043004751205444336, 0.00047206878662109375, 0.0005140900611877441, 0.0005561113357543945, 0.0005981326103210449, 0.0006401538848876953, 0.0006821751594543457, 0.0007241964340209961, 0.0007662177085876465, 0.0008082389831542969, 0.0008502602577209473, 0.0008922815322875977, 0.000934302806854248, 0.0009763240814208984, 0.0010183453559875488, 0.0010603666305541992, 0.0011023879051208496, 0.0011444091796875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 13.0, 13.0, 14.0, 20.0, 22.0, 23.0, 49.0, 63.0, 77.0, 113.0, 149.0, 294.0, 659.0, 7015.0, 1032095.0, 6450.0, 668.0, 297.0, 137.0, 98.0, 76.0, 52.0, 34.0, 31.0, 21.0, 19.0, 12.0, 14.0, 3.0, 4.0, 9.0, 5.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0255889892578125, -0.024690866470336914, -0.023792743682861328, -0.022894620895385742, -0.021996498107910156, -0.02109837532043457, -0.020200252532958984, -0.0193021297454834, -0.018404006958007812, -0.017505884170532227, -0.01660776138305664, -0.015709638595581055, -0.014811515808105469, -0.013913393020629883, -0.013015270233154297, -0.012117147445678711, -0.011219024658203125, -0.010320901870727539, -0.009422779083251953, -0.008524656295776367, -0.007626533508300781, -0.006728410720825195, -0.005830287933349609, -0.0049321651458740234, -0.0040340423583984375, -0.0031359195709228516, -0.0022377967834472656, -0.0013396739959716797, -0.00044155120849609375, 0.0004565715789794922, 0.0013546943664550781, 0.002252817153930664, 0.00315093994140625, 0.004049062728881836, 0.004947185516357422, 0.005845308303833008, 0.006743431091308594, 0.00764155387878418, 0.008539676666259766, 0.009437799453735352, 0.010335922241210938, 0.011234045028686523, 0.01213216781616211, 0.013030290603637695, 0.013928413391113281, 0.014826536178588867, 0.015724658966064453, 0.01662278175354004, 0.017520904541015625, 0.01841902732849121, 0.019317150115966797, 0.020215272903442383, 0.02111339569091797, 0.022011518478393555, 0.02290964126586914, 0.023807764053344727, 0.024705886840820312, 0.0256040096282959, 0.026502132415771484, 0.02740025520324707, 0.028298377990722656, 0.029196500778198242, 0.030094623565673828, 0.030992746353149414, 0.031890869140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [9.0, 28.0, 216.0, 504.0, 226.0, 32.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036319735227152705, -0.00025987246772274375, -0.00015654756862204522, -5.322266952134669e-05, 5.0102215027436614e-05, 0.00015342712868005037, 0.0002567520132288337, 0.000360076897777617, 0.0004634017823264003, 0.0005667266668751836, 0.0006700515514239669, 0.0007733764359727502, 0.0008767013205215335, 0.0009800263214856386, 0.001083351206034422, 0.0011866760905832052, 0.0012900009751319885, 0.0013933258596807718, 0.0014966507442295551, 0.0015999756287783384, 0.0017033005133271217, 0.001806625397875905, 0.0019099502824246883, 0.0020132751669734716, 0.002116600051522255, 0.0022199249360710382, 0.0023232498206198215, 0.002426574705168605, 0.002529899589717388, 0.0026332244742661715, 0.0027365493588149548, 0.002839874243363738, 0.002943199360743165, 0.0030465242452919483, 0.0031498491298407316, 0.003253174014389515, 0.0033564988989382982, 0.0034598237834870815, 0.003563148668035865, 0.003666473552584648, 0.0037697984371334314, 0.0038731233216822147, 0.003976448439061642, 0.004079773090779781, 0.004183098208159208, 0.004286422859877348, 0.004389747977256775, 0.0044930726289749146, 0.0045963977463543415, 0.0046997228637337685, 0.004803047515451908, 0.004906372632831335, 0.005009697284549475, 0.005113022401928902, 0.005216347053647041, 0.005319672171026468, 0.005422996822744608, 0.005526321940124035, 0.0056296465918421745, 0.0057329717092216015, 0.005836296360939741, 0.005939621478319168, 0.006042946130037308, 0.006146271247416735, 0.006249595899134874]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 11.0, 9.0, 11.0, 11.0, 20.0, 17.0, 20.0, 22.0, 29.0, 28.0, 38.0, 29.0, 45.0, 37.0, 38.0, 33.0, 36.0, 30.0, 41.0, 43.0, 47.0, 37.0, 36.0, 29.0, 43.0, 39.0, 20.0, 35.0, 16.0, 18.0, 18.0, 27.0, 13.0, 17.0, 4.0, 5.0, 14.0, 5.0, 6.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000550389289855957, -0.0005315355956554413, -0.0005126819014549255, -0.0004938282072544098, -0.00047497451305389404, -0.0004561208188533783, -0.00043726712465286255, -0.0004184134304523468, -0.00039955973625183105, -0.0003807060420513153, -0.00036185234785079956, -0.0003429986536502838, -0.00032414495944976807, -0.0003052912652492523, -0.00028643757104873657, -0.0002675838768482208, -0.0002487301826477051, -0.00022987648844718933, -0.00021102279424667358, -0.00019216910004615784, -0.0001733154058456421, -0.00015446171164512634, -0.0001356080174446106, -0.00011675432324409485, -9.79006290435791e-05, -7.904693484306335e-05, -6.019324064254761e-05, -4.133954644203186e-05, -2.2485852241516113e-05, -3.632158041000366e-06, 1.5221536159515381e-05, 3.407523036003113e-05, 5.2928924560546875e-05, 7.178261876106262e-05, 9.063631296157837e-05, 0.00010949000716209412, 0.00012834370136260986, 0.0001471973955631256, 0.00016605108976364136, 0.0001849047839641571, 0.00020375847816467285, 0.0002226121723651886, 0.00024146586656570435, 0.0002603195607662201, 0.00027917325496673584, 0.0002980269491672516, 0.00031688064336776733, 0.0003357343375682831, 0.00035458803176879883, 0.0003734417259693146, 0.0003922954201698303, 0.00041114911437034607, 0.0004300028085708618, 0.00044885650277137756, 0.0004677101969718933, 0.00048656389117240906, 0.0005054175853729248, 0.0005242712795734406, 0.0005431249737739563, 0.000561978667974472, 0.0005808323621749878, 0.0005996860563755035, 0.0006185397505760193, 0.000637393444776535, 0.0006562471389770508]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 3.0, 10.0, 9.0, 9.0, 8.0, 19.0, 16.0, 22.0, 25.0, 22.0, 27.0, 36.0, 34.0, 36.0, 34.0, 27.0, 37.0, 54.0, 40.0, 37.0, 39.0, 42.0, 42.0, 39.0, 48.0, 40.0, 27.0, 26.0, 30.0, 28.0, 20.0, 12.0, 12.0, 19.0, 12.0, 17.0, 7.0, 9.0, 5.0, 6.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.54296875, -3.4454345703125, -3.347900390625, -3.2503662109375, -3.15283203125, -3.0552978515625, -2.957763671875, -2.8602294921875, -2.7626953125, -2.6651611328125, -2.567626953125, -2.4700927734375, -2.37255859375, -2.2750244140625, -2.177490234375, -2.0799560546875, -1.982421875, -1.8848876953125, -1.787353515625, -1.6898193359375, -1.59228515625, -1.4947509765625, -1.397216796875, -1.2996826171875, -1.2021484375, -1.1046142578125, -1.007080078125, -0.9095458984375, -0.81201171875, -0.7144775390625, -0.616943359375, -0.5194091796875, -0.421875, -0.3243408203125, -0.226806640625, -0.1292724609375, -0.03173828125, 0.0657958984375, 0.163330078125, 0.2608642578125, 0.3583984375, 0.4559326171875, 0.553466796875, 0.6510009765625, 0.74853515625, 0.8460693359375, 0.943603515625, 1.0411376953125, 1.138671875, 1.2362060546875, 1.333740234375, 1.4312744140625, 1.52880859375, 1.6263427734375, 1.723876953125, 1.8214111328125, 1.9189453125, 2.0164794921875, 2.114013671875, 2.2115478515625, 2.30908203125, 2.4066162109375, 2.504150390625, 2.6016845703125, 2.69921875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 15.0, 24.0, 25.0, 28.0, 36.0, 48.0, 81.0, 87.0, 133.0, 193.0, 408.0, 874.0, 3352.0, 17362.0, 92546.0, 594576.0, 279768.0, 46741.0, 8817.0, 1861.0, 600.0, 290.0, 182.0, 113.0, 89.0, 61.0, 46.0, 37.0, 30.0, 22.0, 14.0, 9.0, 10.0, 9.0, 13.0, 6.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.671875, -7.46337890625, -7.2548828125, -7.04638671875, -6.837890625, -6.62939453125, -6.4208984375, -6.21240234375, -6.00390625, -5.79541015625, -5.5869140625, -5.37841796875, -5.169921875, -4.96142578125, -4.7529296875, -4.54443359375, -4.3359375, -4.12744140625, -3.9189453125, -3.71044921875, -3.501953125, -3.29345703125, -3.0849609375, -2.87646484375, -2.66796875, -2.45947265625, -2.2509765625, -2.04248046875, -1.833984375, -1.62548828125, -1.4169921875, -1.20849609375, -1.0, -0.79150390625, -0.5830078125, -0.37451171875, -0.166015625, 0.04248046875, 0.2509765625, 0.45947265625, 0.66796875, 0.87646484375, 1.0849609375, 1.29345703125, 1.501953125, 1.71044921875, 1.9189453125, 2.12744140625, 2.3359375, 2.54443359375, 2.7529296875, 2.96142578125, 3.169921875, 3.37841796875, 3.5869140625, 3.79541015625, 4.00390625, 4.21240234375, 4.4208984375, 4.62939453125, 4.837890625, 5.04638671875, 5.2548828125, 5.46337890625, 5.671875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 10.0, 1.0, 8.0, 12.0, 16.0, 16.0, 11.0, 10.0, 23.0, 20.0, 23.0, 37.0, 31.0, 32.0, 48.0, 53.0, 68.0, 98.0, 222.0, 1563.0, 227.0, 99.0, 60.0, 43.0, 39.0, 37.0, 41.0, 38.0, 26.0, 23.0, 19.0, 20.0, 21.0, 9.0, 9.0, 9.0, 5.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0413818359375, -8.699951171875, -8.3585205078125, -8.01708984375, -7.6756591796875, -7.334228515625, -6.9927978515625, -6.6513671875, -6.3099365234375, -5.968505859375, -5.6270751953125, -5.28564453125, -4.9442138671875, -4.602783203125, -4.2613525390625, -3.919921875, -3.5784912109375, -3.237060546875, -2.8956298828125, -2.55419921875, -2.2127685546875, -1.871337890625, -1.5299072265625, -1.1884765625, -0.8470458984375, -0.505615234375, -0.1641845703125, 0.17724609375, 0.5186767578125, 0.860107421875, 1.2015380859375, 1.54296875, 1.8843994140625, 2.225830078125, 2.5672607421875, 2.90869140625, 3.2501220703125, 3.591552734375, 3.9329833984375, 4.2744140625, 4.6158447265625, 4.957275390625, 5.2987060546875, 5.64013671875, 5.9815673828125, 6.322998046875, 6.6644287109375, 7.005859375, 7.3472900390625, 7.688720703125, 8.0301513671875, 8.37158203125, 8.7130126953125, 9.054443359375, 9.3958740234375, 9.7373046875, 10.0787353515625, 10.420166015625, 10.7615966796875, 11.10302734375, 11.4444580078125, 11.785888671875, 12.1273193359375, 12.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 3.0, 8.0, 7.0, 16.0, 13.0, 9.0, 15.0, 35.0, 29.0, 30.0, 43.0, 68.0, 75.0, 101.0, 123.0, 193.0, 414.0, 976.0, 9924.0, 3097600.0, 33470.0, 1254.0, 481.0, 243.0, 132.0, 91.0, 78.0, 60.0, 40.0, 26.0, 30.0, 21.0, 19.0, 22.0, 18.0, 8.0, 8.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.71875, -34.65576171875, -33.5927734375, -32.52978515625, -31.466796875, -30.40380859375, -29.3408203125, -28.27783203125, -27.21484375, -26.15185546875, -25.0888671875, -24.02587890625, -22.962890625, -21.89990234375, -20.8369140625, -19.77392578125, -18.7109375, -17.64794921875, -16.5849609375, -15.52197265625, -14.458984375, -13.39599609375, -12.3330078125, -11.27001953125, -10.20703125, -9.14404296875, -8.0810546875, -7.01806640625, -5.955078125, -4.89208984375, -3.8291015625, -2.76611328125, -1.703125, -0.64013671875, 0.4228515625, 1.48583984375, 2.548828125, 3.61181640625, 4.6748046875, 5.73779296875, 6.80078125, 7.86376953125, 8.9267578125, 9.98974609375, 11.052734375, 12.11572265625, 13.1787109375, 14.24169921875, 15.3046875, 16.36767578125, 17.4306640625, 18.49365234375, 19.556640625, 20.61962890625, 21.6826171875, 22.74560546875, 23.80859375, 24.87158203125, 25.9345703125, 26.99755859375, 28.060546875, 29.12353515625, 30.1865234375, 31.24951171875, 32.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 50.0, 317.0, 484.0, 149.0, 13.0, 1.0, 0.0, 1.0], "bins": [-88.41070556640625, -86.89360046386719, -85.37649536132812, -83.8593978881836, -82.34229278564453, -80.82518768310547, -79.3080825805664, -77.79097747802734, -76.27388000488281, -74.75677490234375, -73.23966979980469, -71.72257232666016, -70.2054672241211, -68.68836212158203, -67.17125701904297, -65.6541519165039, -64.13704681396484, -62.61994171142578, -61.102840423583984, -59.58573532104492, -58.068634033203125, -56.55152893066406, -55.034423828125, -53.5173225402832, -52.000221252441406, -50.483116149902344, -48.96601486206055, -47.448909759521484, -45.93180847167969, -44.414703369140625, -42.89759826660156, -41.380496978759766, -39.8633918762207, -38.34628677368164, -36.829185485839844, -35.31208038330078, -33.794979095458984, -32.27787399291992, -30.760770797729492, -29.243667602539062, -27.7265625, -26.20945930480957, -24.69235610961914, -23.175251007080078, -21.65814781188965, -20.14104461669922, -18.62394142150879, -17.10683822631836, -15.58973503112793, -14.0726318359375, -12.555527687072754, -11.038424491882324, -9.521320343017578, -8.004217147827148, -6.487113952636719, -4.970009803771973, -3.452906608581543, -1.9358030557632446, -0.4186995029449463, 1.0984039306640625, 2.6155076026916504, 4.132611274719238, 5.649714469909668, 7.166818618774414, 8.683921813964844]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 4.0, 0.0, 11.0, 8.0, 15.0, 17.0, 18.0, 17.0, 25.0, 34.0, 31.0, 38.0, 38.0, 40.0, 53.0, 48.0, 58.0, 48.0, 55.0, 51.0, 40.0, 54.0, 46.0, 39.0, 32.0, 36.0, 31.0, 20.0, 21.0, 16.0, 21.0, 14.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.62425231933594, -41.49089813232422, -40.3575439453125, -39.224185943603516, -38.0908317565918, -36.95747756958008, -35.82412338256836, -34.690765380859375, -33.557411193847656, -32.42405700683594, -31.290700912475586, -30.157346725463867, -29.023990631103516, -27.890636444091797, -26.757282257080078, -25.623926162719727, -24.490571975708008, -23.35721778869629, -22.223861694335938, -21.09050750732422, -19.957151412963867, -18.82379722595215, -17.690441131591797, -16.557086944580078, -15.423731803894043, -14.290376663208008, -13.157021522521973, -12.023666381835938, -10.890312194824219, -9.756956100463867, -8.623601913452148, -7.490246772766113, -6.356893539428711, -5.223538398742676, -4.090183258056641, -2.9568285942077637, -1.8234734535217285, -0.6901183128356934, 0.4432363510131836, 1.5765914916992188, 2.709946632385254, 3.843301773071289, 4.976656913757324, 6.110011577606201, 7.243366718292236, 8.37672233581543, 9.510076522827148, 10.643431663513184, 11.776786804199219, 12.910141944885254, 14.043497085571289, 15.176851272583008, 16.31020736694336, 17.443561553955078, 18.576915740966797, 19.71027183532715, 20.8436279296875, 21.97698211669922, 23.11033821105957, 24.24369239807129, 25.37704849243164, 26.51040267944336, 27.643756866455078, 28.77711296081543, 29.91046714782715]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 5.0, 5.0, 10.0, 3.0, 9.0, 14.0, 16.0, 18.0, 16.0, 20.0, 20.0, 31.0, 29.0, 28.0, 28.0, 29.0, 30.0, 29.0, 31.0, 35.0, 46.0, 44.0, 47.0, 44.0, 39.0, 48.0, 37.0, 34.0, 38.0, 17.0, 29.0, 25.0, 17.0, 18.0, 15.0, 19.0, 9.0, 14.0, 7.0, 14.0, 8.0, 3.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.716796875, -3.61163330078125, -3.5064697265625, -3.40130615234375, -3.296142578125, -3.19097900390625, -3.0858154296875, -2.98065185546875, -2.87548828125, -2.77032470703125, -2.6651611328125, -2.55999755859375, -2.454833984375, -2.34967041015625, -2.2445068359375, -2.13934326171875, -2.0341796875, -1.92901611328125, -1.8238525390625, -1.71868896484375, -1.613525390625, -1.50836181640625, -1.4031982421875, -1.29803466796875, -1.19287109375, -1.08770751953125, -0.9825439453125, -0.87738037109375, -0.772216796875, -0.66705322265625, -0.5618896484375, -0.45672607421875, -0.3515625, -0.24639892578125, -0.1412353515625, -0.03607177734375, 0.069091796875, 0.17425537109375, 0.2794189453125, 0.38458251953125, 0.48974609375, 0.59490966796875, 0.7000732421875, 0.80523681640625, 0.910400390625, 1.01556396484375, 1.1207275390625, 1.22589111328125, 1.3310546875, 1.43621826171875, 1.5413818359375, 1.64654541015625, 1.751708984375, 1.85687255859375, 1.9620361328125, 2.06719970703125, 2.17236328125, 2.27752685546875, 2.3826904296875, 2.48785400390625, 2.593017578125, 2.69818115234375, 2.8033447265625, 2.90850830078125, 3.013671875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 23.0, 30.0, 39.0, 32.0, 62.0, 70.0, 111.0, 179.0, 269.0, 512.0, 1278.0, 3900.0, 17300.0, 86886.0, 394175.0, 1153568.0, 1506988.0, 760682.0, 211423.0, 43433.0, 8993.0, 2336.0, 831.0, 382.0, 227.0, 130.0, 84.0, 57.0, 42.0, 31.0, 43.0, 18.0, 16.0, 14.0, 7.0, 10.0, 9.0, 4.0, 9.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.5, -4.36871337890625, -4.2374267578125, -4.10614013671875, -3.974853515625, -3.84356689453125, -3.7122802734375, -3.58099365234375, -3.44970703125, -3.31842041015625, -3.1871337890625, -3.05584716796875, -2.924560546875, -2.79327392578125, -2.6619873046875, -2.53070068359375, -2.3994140625, -2.26812744140625, -2.1368408203125, -2.00555419921875, -1.874267578125, -1.74298095703125, -1.6116943359375, -1.48040771484375, -1.34912109375, -1.21783447265625, -1.0865478515625, -0.95526123046875, -0.823974609375, -0.69268798828125, -0.5614013671875, -0.43011474609375, -0.298828125, -0.16754150390625, -0.0362548828125, 0.09503173828125, 0.226318359375, 0.35760498046875, 0.4888916015625, 0.62017822265625, 0.75146484375, 0.88275146484375, 1.0140380859375, 1.14532470703125, 1.276611328125, 1.40789794921875, 1.5391845703125, 1.67047119140625, 1.8017578125, 1.93304443359375, 2.0643310546875, 2.19561767578125, 2.326904296875, 2.45819091796875, 2.5894775390625, 2.72076416015625, 2.85205078125, 2.98333740234375, 3.1146240234375, 3.24591064453125, 3.377197265625, 3.50848388671875, 3.6397705078125, 3.77105712890625, 3.90234375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 8.0, 7.0, 11.0, 16.0, 15.0, 17.0, 29.0, 34.0, 42.0, 62.0, 77.0, 95.0, 122.0, 173.0, 187.0, 245.0, 321.0, 350.0, 406.0, 389.0, 312.0, 253.0, 183.0, 158.0, 145.0, 98.0, 80.0, 44.0, 43.0, 31.0, 22.0, 18.0, 19.0, 13.0, 12.0, 10.0, 6.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.262451171875, -5.09521484375, -4.927978515625, -4.7607421875, -4.593505859375, -4.42626953125, -4.259033203125, -4.091796875, -3.924560546875, -3.75732421875, -3.590087890625, -3.4228515625, -3.255615234375, -3.08837890625, -2.921142578125, -2.75390625, -2.586669921875, -2.41943359375, -2.252197265625, -2.0849609375, -1.917724609375, -1.75048828125, -1.583251953125, -1.416015625, -1.248779296875, -1.08154296875, -0.914306640625, -0.7470703125, -0.579833984375, -0.41259765625, -0.245361328125, -0.078125, 0.089111328125, 0.25634765625, 0.423583984375, 0.5908203125, 0.758056640625, 0.92529296875, 1.092529296875, 1.259765625, 1.427001953125, 1.59423828125, 1.761474609375, 1.9287109375, 2.095947265625, 2.26318359375, 2.430419921875, 2.59765625, 2.764892578125, 2.93212890625, 3.099365234375, 3.2666015625, 3.433837890625, 3.60107421875, 3.768310546875, 3.935546875, 4.102783203125, 4.27001953125, 4.437255859375, 4.6044921875, 4.771728515625, 4.93896484375, 5.106201171875, 5.2734375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 16.0, 8.0, 12.0, 19.0, 23.0, 27.0, 55.0, 58.0, 75.0, 155.0, 239.0, 353.0, 602.0, 1338.0, 4855.0, 512171.0, 3641168.0, 28972.0, 1996.0, 839.0, 447.0, 256.0, 177.0, 122.0, 89.0, 56.0, 41.0, 21.0, 20.0, 15.0, 15.0, 8.0, 13.0, 9.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.640380859375, -16.96826171875, -16.296142578125, -15.6240234375, -14.951904296875, -14.27978515625, -13.607666015625, -12.935546875, -12.263427734375, -11.59130859375, -10.919189453125, -10.2470703125, -9.574951171875, -8.90283203125, -8.230712890625, -7.55859375, -6.886474609375, -6.21435546875, -5.542236328125, -4.8701171875, -4.197998046875, -3.52587890625, -2.853759765625, -2.181640625, -1.509521484375, -0.83740234375, -0.165283203125, 0.5068359375, 1.178955078125, 1.85107421875, 2.523193359375, 3.1953125, 3.867431640625, 4.53955078125, 5.211669921875, 5.8837890625, 6.555908203125, 7.22802734375, 7.900146484375, 8.572265625, 9.244384765625, 9.91650390625, 10.588623046875, 11.2607421875, 11.932861328125, 12.60498046875, 13.277099609375, 13.94921875, 14.621337890625, 15.29345703125, 15.965576171875, 16.6376953125, 17.309814453125, 17.98193359375, 18.654052734375, 19.326171875, 19.998291015625, 20.67041015625, 21.342529296875, 22.0146484375, 22.686767578125, 23.35888671875, 24.031005859375, 24.703125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 14.0, 257.0, 591.0, 148.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.32321166992188, -140.24261474609375, -136.16200256347656, -132.08140563964844, -128.0008087158203, -123.92019653320312, -119.839599609375, -115.75899505615234, -111.67839050292969, -107.59778594970703, -103.5171890258789, -99.43658447265625, -95.3559799194336, -91.27537536621094, -87.19477844238281, -83.11417388916016, -79.03357696533203, -74.95297241210938, -70.87237548828125, -66.7917709350586, -62.71116638183594, -58.63056564331055, -54.549964904785156, -50.4693603515625, -46.38875961303711, -42.30815887451172, -38.22755432128906, -34.14695358276367, -30.06635093688965, -25.985748291015625, -21.905147552490234, -17.82454490661621, -13.743942260742188, -9.663339614868164, -5.582737922668457, -1.50213623046875, 2.5784664154052734, 6.659069061279297, 10.739669799804688, 14.820272445678711, 18.900875091552734, 22.981477737426758, 27.06208038330078, 31.142681121826172, 35.22328186035156, 39.30388641357422, 43.38448715209961, 47.465087890625, 51.545692443847656, 55.62629318237305, 59.7068977355957, 63.787498474121094, 67.86810302734375, 71.94869995117188, 76.02930450439453, 80.10990905761719, 84.19050598144531, 88.27111053466797, 92.3517074584961, 96.43231201171875, 100.5129165649414, 104.59352111816406, 108.67411804199219, 112.75472259521484, 116.8353271484375]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 12.0, 10.0, 6.0, 17.0, 13.0, 16.0, 32.0, 23.0, 33.0, 36.0, 28.0, 39.0, 49.0, 40.0, 39.0, 39.0, 31.0, 37.0, 37.0, 43.0, 42.0, 30.0, 44.0, 34.0, 34.0, 38.0, 21.0, 23.0, 27.0, 15.0, 15.0, 10.0, 13.0, 13.0, 10.0, 7.0, 8.0, 7.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.16440200805664, -18.533411026000977, -17.902420043945312, -17.27142906188965, -16.640438079833984, -16.009445190429688, -15.378454208374023, -14.74746322631836, -14.116472244262695, -13.485481262207031, -12.854490280151367, -12.223498344421387, -11.592507362365723, -10.961516380310059, -10.330524444580078, -9.699533462524414, -9.06854248046875, -8.437551498413086, -7.806560039520264, -7.175568580627441, -6.544577598571777, -5.913586616516113, -5.282595157623291, -4.651603698730469, -4.020612716674805, -3.3896214962005615, -2.7586302757263184, -2.127639055252075, -1.496647834777832, -0.8656566143035889, -0.2346653938293457, 0.39632606506347656, 1.0273151397705078, 1.658306360244751, 2.289297580718994, 2.9202888011932373, 3.5512800216674805, 4.1822710037231445, 4.813262462615967, 5.444253921508789, 6.075244903564453, 6.706235885620117, 7.3372273445129395, 7.968218803405762, 8.599209785461426, 9.23020076751709, 9.86119270324707, 10.492183685302734, 11.123174667358398, 11.754165649414062, 12.385156631469727, 13.016148567199707, 13.647139549255371, 14.278130531311035, 14.909122467041016, 15.54011344909668, 16.171104431152344, 16.802095413208008, 17.433086395263672, 18.064077377319336, 18.695068359375, 19.326061248779297, 19.95705223083496, 20.588043212890625, 21.21903419494629]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 11.0, 10.0, 14.0, 11.0, 21.0, 11.0, 26.0, 26.0, 29.0, 25.0, 27.0, 41.0, 28.0, 45.0, 49.0, 38.0, 59.0, 36.0, 46.0, 38.0, 39.0, 38.0, 34.0, 32.0, 40.0, 38.0, 21.0, 24.0, 8.0, 24.0, 17.0, 20.0, 13.0, 5.0, 11.0, 8.0, 4.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.486297607421875, -3.38470458984375, -3.283111572265625, -3.1815185546875, -3.079925537109375, -2.97833251953125, -2.876739501953125, -2.775146484375, -2.673553466796875, -2.57196044921875, -2.470367431640625, -2.3687744140625, -2.267181396484375, -2.16558837890625, -2.063995361328125, -1.96240234375, -1.860809326171875, -1.75921630859375, -1.657623291015625, -1.5560302734375, -1.454437255859375, -1.35284423828125, -1.251251220703125, -1.149658203125, -1.048065185546875, -0.94647216796875, -0.844879150390625, -0.7432861328125, -0.641693115234375, -0.54010009765625, -0.438507080078125, -0.3369140625, -0.235321044921875, -0.13372802734375, -0.032135009765625, 0.0694580078125, 0.171051025390625, 0.27264404296875, 0.374237060546875, 0.475830078125, 0.577423095703125, 0.67901611328125, 0.780609130859375, 0.8822021484375, 0.983795166015625, 1.08538818359375, 1.186981201171875, 1.28857421875, 1.390167236328125, 1.49176025390625, 1.593353271484375, 1.6949462890625, 1.796539306640625, 1.89813232421875, 1.999725341796875, 2.101318359375, 2.202911376953125, 2.30450439453125, 2.406097412109375, 2.5076904296875, 2.609283447265625, 2.71087646484375, 2.812469482421875, 2.9140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 3.0, 11.0, 13.0, 38.0, 42.0, 64.0, 89.0, 124.0, 179.0, 244.0, 363.0, 539.0, 801.0, 1015.0, 1548.0, 2173.0, 3268.0, 4714.0, 6992.0, 10399.0, 15530.0, 23955.0, 38047.0, 62361.0, 104587.0, 178810.0, 222825.0, 143593.0, 83552.0, 50564.0, 31048.0, 20155.0, 13001.0, 8929.0, 5927.0, 3973.0, 2763.0, 1946.0, 1335.0, 923.0, 607.0, 445.0, 311.0, 238.0, 150.0, 104.0, 79.0, 66.0, 32.0, 22.0, 27.0, 15.0, 11.0, 3.0, 5.0, 0.0, 3.0], "bins": [-0.364990234375, -0.35402679443359375, -0.3430633544921875, -0.33209991455078125, -0.321136474609375, -0.31017303466796875, -0.2992095947265625, -0.28824615478515625, -0.27728271484375, -0.26631927490234375, -0.2553558349609375, -0.24439239501953125, -0.233428955078125, -0.22246551513671875, -0.2115020751953125, -0.20053863525390625, -0.1895751953125, -0.17861175537109375, -0.1676483154296875, -0.15668487548828125, -0.145721435546875, -0.13475799560546875, -0.1237945556640625, -0.11283111572265625, -0.10186767578125, -0.09090423583984375, -0.0799407958984375, -0.06897735595703125, -0.058013916015625, -0.04705047607421875, -0.0360870361328125, -0.02512359619140625, -0.01416015625, -0.00319671630859375, 0.0077667236328125, 0.01873016357421875, 0.029693603515625, 0.04065704345703125, 0.0516204833984375, 0.06258392333984375, 0.07354736328125, 0.08451080322265625, 0.0954742431640625, 0.10643768310546875, 0.117401123046875, 0.12836456298828125, 0.1393280029296875, 0.15029144287109375, 0.1612548828125, 0.17221832275390625, 0.1831817626953125, 0.19414520263671875, 0.205108642578125, 0.21607208251953125, 0.2270355224609375, 0.23799896240234375, 0.24896240234375, 0.25992584228515625, 0.2708892822265625, 0.28185272216796875, 0.292816162109375, 0.30377960205078125, 0.3147430419921875, 0.32570648193359375, 0.336669921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 4.0, 6.0, 9.0, 11.0, 12.0, 17.0, 17.0, 23.0, 28.0, 26.0, 33.0, 25.0, 31.0, 25.0, 39.0, 36.0, 34.0, 51.0, 33.0, 1072.0, 37.0, 38.0, 28.0, 36.0, 39.0, 38.0, 26.0, 30.0, 25.0, 26.0, 19.0, 21.0, 23.0, 18.0, 15.0, 12.0, 11.0, 8.0, 9.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9814453125, -1.92205810546875, -1.8626708984375, -1.80328369140625, -1.743896484375, -1.68450927734375, -1.6251220703125, -1.56573486328125, -1.50634765625, -1.44696044921875, -1.3875732421875, -1.32818603515625, -1.268798828125, -1.20941162109375, -1.1500244140625, -1.09063720703125, -1.03125, -0.97186279296875, -0.9124755859375, -0.85308837890625, -0.793701171875, -0.73431396484375, -0.6749267578125, -0.61553955078125, -0.55615234375, -0.49676513671875, -0.4373779296875, -0.37799072265625, -0.318603515625, -0.25921630859375, -0.1998291015625, -0.14044189453125, -0.0810546875, -0.02166748046875, 0.0377197265625, 0.09710693359375, 0.156494140625, 0.21588134765625, 0.2752685546875, 0.33465576171875, 0.39404296875, 0.45343017578125, 0.5128173828125, 0.57220458984375, 0.631591796875, 0.69097900390625, 0.7503662109375, 0.80975341796875, 0.869140625, 0.92852783203125, 0.9879150390625, 1.04730224609375, 1.106689453125, 1.16607666015625, 1.2254638671875, 1.28485107421875, 1.34423828125, 1.40362548828125, 1.4630126953125, 1.52239990234375, 1.581787109375, 1.64117431640625, 1.7005615234375, 1.75994873046875, 1.8193359375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 7.0, 8.0, 14.0, 29.0, 44.0, 54.0, 63.0, 107.0, 141.0, 213.0, 249.0, 399.0, 539.0, 821.0, 1102.0, 1568.0, 2276.0, 3384.0, 5001.0, 7789.0, 11444.0, 17283.0, 26727.0, 41957.0, 67909.0, 114255.0, 185880.0, 1252087.0, 135622.0, 81107.0, 48547.0, 30626.0, 19516.0, 12918.0, 8464.0, 5936.0, 4056.0, 2817.0, 1908.0, 1299.0, 896.0, 668.0, 470.0, 324.0, 214.0, 139.0, 83.0, 67.0, 40.0, 25.0, 18.0, 14.0, 3.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.27490234375, -0.2657890319824219, -0.25667572021484375, -0.24756240844726562, -0.2384490966796875, -0.22933578491210938, -0.22022247314453125, -0.21110916137695312, -0.201995849609375, -0.19288253784179688, -0.18376922607421875, -0.17465591430664062, -0.1655426025390625, -0.15642929077148438, -0.14731597900390625, -0.13820266723632812, -0.12908935546875, -0.11997604370117188, -0.11086273193359375, -0.10174942016601562, -0.0926361083984375, -0.08352279663085938, -0.07440948486328125, -0.06529617309570312, -0.056182861328125, -0.047069549560546875, -0.03795623779296875, -0.028842926025390625, -0.0197296142578125, -0.010616302490234375, -0.00150299072265625, 0.007610321044921875, 0.0167236328125, 0.025836944580078125, 0.03495025634765625, 0.044063568115234375, 0.0531768798828125, 0.062290191650390625, 0.07140350341796875, 0.08051681518554688, 0.089630126953125, 0.09874343872070312, 0.10785675048828125, 0.11697006225585938, 0.1260833740234375, 0.13519668579101562, 0.14430999755859375, 0.15342330932617188, 0.16253662109375, 0.17164993286132812, 0.18076324462890625, 0.18987655639648438, 0.1989898681640625, 0.20810317993164062, 0.21721649169921875, 0.22632980346679688, 0.235443115234375, 0.24455642700195312, 0.25366973876953125, 0.2627830505371094, 0.2718963623046875, 0.2810096740722656, 0.29012298583984375, 0.2992362976074219, 0.308349609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 7.0, 6.0, 9.0, 23.0, 17.0, 22.0, 35.0, 38.0, 52.0, 40.0, 65.0, 71.0, 69.0, 75.0, 71.0, 64.0, 83.0, 61.0, 44.0, 26.0, 31.0, 14.0, 14.0, 13.0, 15.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0014362335205078125, -0.0013933032751083374, -0.0013503730297088623, -0.0013074427843093872, -0.0012645125389099121, -0.001221582293510437, -0.001178652048110962, -0.0011357218027114868, -0.0010927915573120117, -0.0010498613119125366, -0.0010069310665130615, -0.0009640008211135864, -0.0009210705757141113, -0.0008781403303146362, -0.0008352100849151611, -0.000792279839515686, -0.0007493495941162109, -0.0007064193487167358, -0.0006634891033172607, -0.0006205588579177856, -0.0005776286125183105, -0.0005346983671188354, -0.0004917681217193604, -0.00044883787631988525, -0.00040590763092041016, -0.00036297738552093506, -0.00032004714012145996, -0.00027711689472198486, -0.00023418664932250977, -0.00019125640392303467, -0.00014832615852355957, -0.00010539591312408447, -6.246566772460938e-05, -1.9535422325134277e-05, 2.339482307434082e-05, 6.632506847381592e-05, 0.00010925531387329102, 0.0001521855592727661, 0.0001951158046722412, 0.0002380460500717163, 0.0002809762954711914, 0.0003239065408706665, 0.0003668367862701416, 0.0004097670316696167, 0.0004526972770690918, 0.0004956275224685669, 0.000538557767868042, 0.0005814880132675171, 0.0006244182586669922, 0.0006673485040664673, 0.0007102787494659424, 0.0007532089948654175, 0.0007961392402648926, 0.0008390694856643677, 0.0008819997310638428, 0.0009249299764633179, 0.000967860221862793, 0.001010790467262268, 0.0010537207126617432, 0.0010966509580612183, 0.0011395812034606934, 0.0011825114488601685, 0.0012254416942596436, 0.0012683719396591187, 0.0013113021850585938]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 11.0, 10.0, 14.0, 17.0, 28.0, 32.0, 54.0, 59.0, 87.0, 136.0, 250.0, 496.0, 1402.0, 726922.0, 316644.0, 1229.0, 431.0, 208.0, 134.0, 87.0, 85.0, 51.0, 34.0, 32.0, 24.0, 14.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.02581048011779785, -0.024948596954345703, -0.024086713790893555, -0.023224830627441406, -0.022362947463989258, -0.02150106430053711, -0.02063918113708496, -0.019777297973632812, -0.018915414810180664, -0.018053531646728516, -0.017191648483276367, -0.01632976531982422, -0.01546788215637207, -0.014605998992919922, -0.013744115829467773, -0.012882232666015625, -0.012020349502563477, -0.011158466339111328, -0.01029658317565918, -0.009434700012207031, -0.008572816848754883, -0.007710933685302734, -0.006849050521850586, -0.0059871673583984375, -0.005125284194946289, -0.004263401031494141, -0.003401517868041992, -0.0025396347045898438, -0.0016777515411376953, -0.0008158683776855469, 4.601478576660156e-05, 0.00090789794921875, 0.0017697811126708984, 0.002631664276123047, 0.0034935474395751953, 0.004355430603027344, 0.005217313766479492, 0.006079196929931641, 0.006941080093383789, 0.0078029632568359375, 0.008664846420288086, 0.009526729583740234, 0.010388612747192383, 0.011250495910644531, 0.01211237907409668, 0.012974262237548828, 0.013836145401000977, 0.014698028564453125, 0.015559911727905273, 0.016421794891357422, 0.01728367805480957, 0.01814556121826172, 0.019007444381713867, 0.019869327545166016, 0.020731210708618164, 0.021593093872070312, 0.02245497703552246, 0.02331686019897461, 0.024178743362426758, 0.025040626525878906, 0.025902509689331055, 0.026764392852783203, 0.02762627601623535, 0.0284881591796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 108.0, 875.0, 34.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0033679408952593803, -0.003117086598649621, -0.0028662323020398617, -0.002615378238260746, -0.0023645239416509867, -0.0021136696450412273, -0.0018628154648467898, -0.0016119612846523523, -0.001361106988042593, -0.0011102526914328337, -0.0008593985112383962, -0.0006085442728362978, -0.00035769003443419933, -0.00010683573782444, 0.0001440184423699975, 0.000394872622564435, 0.0006457269191741943, 0.0008965811575762928, 0.0011474353959783912, 0.0013982895761728287, 0.001649143872782588, 0.0018999981693923473, 0.002150852233171463, 0.0024017065297812223, 0.0026525608263909817, 0.002903415123000741, 0.0031542694196105003, 0.003405123483389616, 0.0036559777799993753, 0.003906832076609135, 0.00415768614038825, 0.004408540204167366, 0.004659393802285194, 0.00491024786606431, 0.005161102395504713, 0.005411956459283829, 0.005662810988724232, 0.005913665052503347, 0.006164519116282463, 0.006415373645722866, 0.006666227709501982, 0.006917081773281097, 0.0071679363027215, 0.007418790366500616, 0.007669644430279732, 0.007920498959720135, 0.008171353489160538, 0.008422207087278366, 0.008673061616718769, 0.008923916146159172, 0.009174769744277, 0.009425624273717403, 0.009676478803157806, 0.009927332401275635, 0.010178186930716038, 0.01042904146015644, 0.010679895058274269, 0.010930749587714672, 0.0111816031858325, 0.011432457715272903, 0.011683312244713306, 0.01193416677415371, 0.012185020372271538, 0.01243587490171194, 0.012686729431152344]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 5.0, 6.0, 15.0, 8.0, 18.0, 21.0, 27.0, 30.0, 31.0, 34.0, 31.0, 31.0, 29.0, 33.0, 35.0, 27.0, 44.0, 44.0, 39.0, 54.0, 35.0, 48.0, 29.0, 36.0, 33.0, 39.0, 32.0, 29.0, 22.0, 26.0, 14.0, 21.0, 15.0, 11.0, 4.0, 12.0, 4.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006464123725891113, -0.0006269291043281555, -0.0006074458360671997, -0.0005879625678062439, -0.0005684792995452881, -0.0005489960312843323, -0.0005295127630233765, -0.0005100294947624207, -0.0004905462265014648, -0.00047106295824050903, -0.0004515796899795532, -0.0004320964217185974, -0.0004126131534576416, -0.0003931298851966858, -0.00037364661693573, -0.00035416334867477417, -0.00033468008041381836, -0.00031519681215286255, -0.00029571354389190674, -0.00027623027563095093, -0.0002567470073699951, -0.0002372637391090393, -0.0002177804708480835, -0.00019829720258712769, -0.00017881393432617188, -0.00015933066606521606, -0.00013984739780426025, -0.00012036412954330444, -0.00010088086128234863, -8.139759302139282e-05, -6.191432476043701e-05, -4.24310564994812e-05, -2.294778823852539e-05, -3.46451997756958e-06, 1.601874828338623e-05, 3.550201654434204e-05, 5.498528480529785e-05, 7.446855306625366e-05, 9.395182132720947e-05, 0.00011343508958816528, 0.0001329183578491211, 0.0001524016261100769, 0.00017188489437103271, 0.00019136816263198853, 0.00021085143089294434, 0.00023033469915390015, 0.00024981796741485596, 0.00026930123567581177, 0.0002887845039367676, 0.0003082677721977234, 0.0003277510404586792, 0.000347234308719635, 0.0003667175769805908, 0.00038620084524154663, 0.00040568411350250244, 0.00042516738176345825, 0.00044465065002441406, 0.0004641339182853699, 0.0004836171865463257, 0.0005031004548072815, 0.0005225837230682373, 0.0005420669913291931, 0.0005615502595901489, 0.0005810335278511047, 0.0006005167961120605]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 11.0, 10.0, 14.0, 11.0, 21.0, 11.0, 26.0, 26.0, 29.0, 25.0, 27.0, 41.0, 28.0, 45.0, 49.0, 38.0, 59.0, 36.0, 46.0, 38.0, 39.0, 38.0, 34.0, 32.0, 40.0, 38.0, 21.0, 24.0, 8.0, 24.0, 17.0, 20.0, 13.0, 5.0, 11.0, 8.0, 4.0, 6.0, 1.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.587890625, -3.486297607421875, -3.38470458984375, -3.283111572265625, -3.1815185546875, -3.079925537109375, -2.97833251953125, -2.876739501953125, -2.775146484375, -2.673553466796875, -2.57196044921875, -2.470367431640625, -2.3687744140625, -2.267181396484375, -2.16558837890625, -2.063995361328125, -1.96240234375, -1.860809326171875, -1.75921630859375, -1.657623291015625, -1.5560302734375, -1.454437255859375, -1.35284423828125, -1.251251220703125, -1.149658203125, -1.048065185546875, -0.94647216796875, -0.844879150390625, -0.7432861328125, -0.641693115234375, -0.54010009765625, -0.438507080078125, -0.3369140625, -0.235321044921875, -0.13372802734375, -0.032135009765625, 0.0694580078125, 0.171051025390625, 0.27264404296875, 0.374237060546875, 0.475830078125, 0.577423095703125, 0.67901611328125, 0.780609130859375, 0.8822021484375, 0.983795166015625, 1.08538818359375, 1.186981201171875, 1.28857421875, 1.390167236328125, 1.49176025390625, 1.593353271484375, 1.6949462890625, 1.796539306640625, 1.89813232421875, 1.999725341796875, 2.101318359375, 2.202911376953125, 2.30450439453125, 2.406097412109375, 2.5076904296875, 2.609283447265625, 2.71087646484375, 2.812469482421875, 2.9140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 5.0, 12.0, 9.0, 16.0, 24.0, 17.0, 35.0, 53.0, 75.0, 162.0, 321.0, 714.0, 1766.0, 4537.0, 11566.0, 28811.0, 73688.0, 203260.0, 392157.0, 207330.0, 74790.0, 29555.0, 11766.0, 4555.0, 1839.0, 712.0, 329.0, 159.0, 96.0, 40.0, 32.0, 26.0, 24.0, 19.0, 5.0, 9.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.13671875, -4.016845703125, -3.89697265625, -3.777099609375, -3.6572265625, -3.537353515625, -3.41748046875, -3.297607421875, -3.177734375, -3.057861328125, -2.93798828125, -2.818115234375, -2.6982421875, -2.578369140625, -2.45849609375, -2.338623046875, -2.21875, -2.098876953125, -1.97900390625, -1.859130859375, -1.7392578125, -1.619384765625, -1.49951171875, -1.379638671875, -1.259765625, -1.139892578125, -1.02001953125, -0.900146484375, -0.7802734375, -0.660400390625, -0.54052734375, -0.420654296875, -0.30078125, -0.180908203125, -0.06103515625, 0.058837890625, 0.1787109375, 0.298583984375, 0.41845703125, 0.538330078125, 0.658203125, 0.778076171875, 0.89794921875, 1.017822265625, 1.1376953125, 1.257568359375, 1.37744140625, 1.497314453125, 1.6171875, 1.737060546875, 1.85693359375, 1.976806640625, 2.0966796875, 2.216552734375, 2.33642578125, 2.456298828125, 2.576171875, 2.696044921875, 2.81591796875, 2.935791015625, 3.0556640625, 3.175537109375, 3.29541015625, 3.415283203125, 3.53515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 9.0, 8.0, 8.0, 8.0, 17.0, 11.0, 14.0, 13.0, 27.0, 25.0, 39.0, 38.0, 30.0, 36.0, 50.0, 64.0, 78.0, 152.0, 1404.0, 396.0, 134.0, 88.0, 59.0, 44.0, 46.0, 40.0, 33.0, 28.0, 19.0, 25.0, 20.0, 18.0, 11.0, 12.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.7421875, -10.40576171875, -10.0693359375, -9.73291015625, -9.396484375, -9.06005859375, -8.7236328125, -8.38720703125, -8.05078125, -7.71435546875, -7.3779296875, -7.04150390625, -6.705078125, -6.36865234375, -6.0322265625, -5.69580078125, -5.359375, -5.02294921875, -4.6865234375, -4.35009765625, -4.013671875, -3.67724609375, -3.3408203125, -3.00439453125, -2.66796875, -2.33154296875, -1.9951171875, -1.65869140625, -1.322265625, -0.98583984375, -0.6494140625, -0.31298828125, 0.0234375, 0.35986328125, 0.6962890625, 1.03271484375, 1.369140625, 1.70556640625, 2.0419921875, 2.37841796875, 2.71484375, 3.05126953125, 3.3876953125, 3.72412109375, 4.060546875, 4.39697265625, 4.7333984375, 5.06982421875, 5.40625, 5.74267578125, 6.0791015625, 6.41552734375, 6.751953125, 7.08837890625, 7.4248046875, 7.76123046875, 8.09765625, 8.43408203125, 8.7705078125, 9.10693359375, 9.443359375, 9.77978515625, 10.1162109375, 10.45263671875, 10.7890625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 6.0, 7.0, 5.0, 5.0, 8.0, 24.0, 18.0, 28.0, 27.0, 42.0, 67.0, 96.0, 186.0, 286.0, 489.0, 1233.0, 11955.0, 3036414.0, 91263.0, 1888.0, 667.0, 364.0, 212.0, 121.0, 66.0, 47.0, 50.0, 33.0, 30.0, 18.0, 14.0, 10.0, 8.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.625, -23.7353515625, -22.845703125, -21.9560546875, -21.06640625, -20.1767578125, -19.287109375, -18.3974609375, -17.5078125, -16.6181640625, -15.728515625, -14.8388671875, -13.94921875, -13.0595703125, -12.169921875, -11.2802734375, -10.390625, -9.5009765625, -8.611328125, -7.7216796875, -6.83203125, -5.9423828125, -5.052734375, -4.1630859375, -3.2734375, -2.3837890625, -1.494140625, -0.6044921875, 0.28515625, 1.1748046875, 2.064453125, 2.9541015625, 3.84375, 4.7333984375, 5.623046875, 6.5126953125, 7.40234375, 8.2919921875, 9.181640625, 10.0712890625, 10.9609375, 11.8505859375, 12.740234375, 13.6298828125, 14.51953125, 15.4091796875, 16.298828125, 17.1884765625, 18.078125, 18.9677734375, 19.857421875, 20.7470703125, 21.63671875, 22.5263671875, 23.416015625, 24.3056640625, 25.1953125, 26.0849609375, 26.974609375, 27.8642578125, 28.75390625, 29.6435546875, 30.533203125, 31.4228515625, 32.3125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 371.0, 624.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.21812438964844, -207.449462890625, -203.6807861328125, -199.91212463378906, -196.14346313476562, -192.3748016357422, -188.60614013671875, -184.83746337890625, -181.0688018798828, -177.30014038085938, -173.53146362304688, -169.76280212402344, -165.994140625, -162.22547912597656, -158.45681762695312, -154.68814086914062, -150.9194793701172, -147.15081787109375, -143.38214111328125, -139.6134796142578, -135.84481811523438, -132.07615661621094, -128.3074951171875, -124.538818359375, -120.77015686035156, -117.00149536132812, -113.23282623291016, -109.46415710449219, -105.69549560546875, -101.92683410644531, -98.15816497802734, -94.38949584960938, -90.62084197998047, -86.8521728515625, -83.08351135253906, -79.31484985351562, -75.54618072509766, -71.77751159667969, -68.00885009765625, -64.24018859863281, -60.471519470214844, -56.70285415649414, -52.93418884277344, -49.165523529052734, -45.39685821533203, -41.62819290161133, -37.859527587890625, -34.09086227416992, -30.32219696044922, -26.553531646728516, -22.784866333007812, -19.01620101928711, -15.247535705566406, -11.478870391845703, -7.710205078125, -3.941539764404297, -0.17287445068359375, 3.5957908630371094, 7.3644561767578125, 11.133121490478516, 14.901786804199219, 18.670452117919922, 22.439117431640625, 26.207782745361328, 29.97644805908203]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 8.0, 9.0, 12.0, 11.0, 23.0, 21.0, 30.0, 27.0, 42.0, 32.0, 38.0, 39.0, 43.0, 54.0, 63.0, 52.0, 56.0, 44.0, 44.0, 46.0, 42.0, 55.0, 26.0, 19.0, 28.0, 28.0, 18.0, 20.0, 11.0, 20.0, 10.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.94858741760254, -30.017314910888672, -29.086042404174805, -28.154769897460938, -27.22349739074707, -26.292224884033203, -25.360952377319336, -24.42967987060547, -23.4984073638916, -22.567134857177734, -21.635862350463867, -20.70458984375, -19.773317337036133, -18.842044830322266, -17.9107723236084, -16.97949981689453, -16.04822540283203, -15.116952896118164, -14.185680389404297, -13.25440788269043, -12.323135375976562, -11.391862869262695, -10.460590362548828, -9.529317855834961, -8.598045349121094, -7.666772842407227, -6.735500335693359, -5.804227828979492, -4.872955322265625, -3.9416823387145996, -3.0104098320007324, -2.0791373252868652, -1.1478652954101562, -0.2165927290916443, 0.7146798372268677, 1.6459524631500244, 2.5772249698638916, 3.508497714996338, 4.439770221710205, 5.371042728424072, 6.3023152351379395, 7.233587741851807, 8.164860725402832, 9.0961332321167, 10.027405738830566, 10.958678245544434, 11.8899507522583, 12.821223258972168, 13.752495765686035, 14.683768272399902, 15.61504077911377, 16.546314239501953, 17.47758674621582, 18.408859252929688, 19.340131759643555, 20.271404266357422, 21.20267677307129, 22.133949279785156, 23.065221786499023, 23.99649429321289, 24.927766799926758, 25.859039306640625, 26.790311813354492, 27.72158432006836, 28.652856826782227]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 6.0, 9.0, 7.0, 14.0, 12.0, 14.0, 23.0, 21.0, 15.0, 27.0, 18.0, 23.0, 47.0, 47.0, 42.0, 37.0, 39.0, 49.0, 58.0, 41.0, 33.0, 43.0, 37.0, 35.0, 42.0, 28.0, 44.0, 29.0, 15.0, 23.0, 17.0, 21.0, 18.0, 14.0, 17.0, 4.0, 10.0, 4.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8046875, -3.688934326171875, -3.57318115234375, -3.457427978515625, -3.3416748046875, -3.225921630859375, -3.11016845703125, -2.994415283203125, -2.878662109375, -2.762908935546875, -2.64715576171875, -2.531402587890625, -2.4156494140625, -2.299896240234375, -2.18414306640625, -2.068389892578125, -1.95263671875, -1.836883544921875, -1.72113037109375, -1.605377197265625, -1.4896240234375, -1.373870849609375, -1.25811767578125, -1.142364501953125, -1.026611328125, -0.910858154296875, -0.79510498046875, -0.679351806640625, -0.5635986328125, -0.447845458984375, -0.33209228515625, -0.216339111328125, -0.1005859375, 0.015167236328125, 0.13092041015625, 0.246673583984375, 0.3624267578125, 0.478179931640625, 0.59393310546875, 0.709686279296875, 0.825439453125, 0.941192626953125, 1.05694580078125, 1.172698974609375, 1.2884521484375, 1.404205322265625, 1.51995849609375, 1.635711669921875, 1.75146484375, 1.867218017578125, 1.98297119140625, 2.098724365234375, 2.2144775390625, 2.330230712890625, 2.44598388671875, 2.561737060546875, 2.677490234375, 2.793243408203125, 2.90899658203125, 3.024749755859375, 3.1405029296875, 3.256256103515625, 3.37200927734375, 3.487762451171875, 3.603515625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 7.0, 1.0, 5.0, 6.0, 5.0, 11.0, 11.0, 13.0, 13.0, 17.0, 16.0, 23.0, 32.0, 34.0, 62.0, 68.0, 75.0, 138.0, 238.0, 573.0, 6314.0, 267336.0, 3126033.0, 772834.0, 18503.0, 1054.0, 268.0, 124.0, 109.0, 82.0, 51.0, 39.0, 30.0, 30.0, 23.0, 27.0, 13.0, 17.0, 11.0, 11.0, 4.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.369873046875, -10.05224609375, -9.734619140625, -9.4169921875, -9.099365234375, -8.78173828125, -8.464111328125, -8.146484375, -7.828857421875, -7.51123046875, -7.193603515625, -6.8759765625, -6.558349609375, -6.24072265625, -5.923095703125, -5.60546875, -5.287841796875, -4.97021484375, -4.652587890625, -4.3349609375, -4.017333984375, -3.69970703125, -3.382080078125, -3.064453125, -2.746826171875, -2.42919921875, -2.111572265625, -1.7939453125, -1.476318359375, -1.15869140625, -0.841064453125, -0.5234375, -0.205810546875, 0.11181640625, 0.429443359375, 0.7470703125, 1.064697265625, 1.38232421875, 1.699951171875, 2.017578125, 2.335205078125, 2.65283203125, 2.970458984375, 3.2880859375, 3.605712890625, 3.92333984375, 4.240966796875, 4.55859375, 4.876220703125, 5.19384765625, 5.511474609375, 5.8291015625, 6.146728515625, 6.46435546875, 6.781982421875, 7.099609375, 7.417236328125, 7.73486328125, 8.052490234375, 8.3701171875, 8.687744140625, 9.00537109375, 9.322998046875, 9.640625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 16.0, 13.0, 20.0, 31.0, 44.0, 70.0, 113.0, 135.0, 236.0, 353.0, 504.0, 610.0, 573.0, 449.0, 328.0, 207.0, 148.0, 66.0, 52.0, 37.0, 25.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-11.015625, -10.775390625, -10.53515625, -10.294921875, -10.0546875, -9.814453125, -9.57421875, -9.333984375, -9.09375, -8.853515625, -8.61328125, -8.373046875, -8.1328125, -7.892578125, -7.65234375, -7.412109375, -7.171875, -6.931640625, -6.69140625, -6.451171875, -6.2109375, -5.970703125, -5.73046875, -5.490234375, -5.25, -5.009765625, -4.76953125, -4.529296875, -4.2890625, -4.048828125, -3.80859375, -3.568359375, -3.328125, -3.087890625, -2.84765625, -2.607421875, -2.3671875, -2.126953125, -1.88671875, -1.646484375, -1.40625, -1.166015625, -0.92578125, -0.685546875, -0.4453125, -0.205078125, 0.03515625, 0.275390625, 0.515625, 0.755859375, 0.99609375, 1.236328125, 1.4765625, 1.716796875, 1.95703125, 2.197265625, 2.4375, 2.677734375, 2.91796875, 3.158203125, 3.3984375, 3.638671875, 3.87890625, 4.119140625, 4.359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 15.0, 14.0, 20.0, 42.0, 64.0, 105.0, 162.0, 267.0, 440.0, 919.0, 5848.0, 1852466.0, 2324820.0, 6982.0, 892.0, 441.0, 279.0, 178.0, 108.0, 78.0, 40.0, 27.0, 21.0, 15.0, 15.0, 8.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7890625, -14.0115966796875, -13.234130859375, -12.4566650390625, -11.67919921875, -10.9017333984375, -10.124267578125, -9.3468017578125, -8.5693359375, -7.7918701171875, -7.014404296875, -6.2369384765625, -5.45947265625, -4.6820068359375, -3.904541015625, -3.1270751953125, -2.349609375, -1.5721435546875, -0.794677734375, -0.0172119140625, 0.76025390625, 1.5377197265625, 2.315185546875, 3.0926513671875, 3.8701171875, 4.6475830078125, 5.425048828125, 6.2025146484375, 6.97998046875, 7.7574462890625, 8.534912109375, 9.3123779296875, 10.08984375, 10.8673095703125, 11.644775390625, 12.4222412109375, 13.19970703125, 13.9771728515625, 14.754638671875, 15.5321044921875, 16.3095703125, 17.0870361328125, 17.864501953125, 18.6419677734375, 19.41943359375, 20.1968994140625, 20.974365234375, 21.7518310546875, 22.529296875, 23.3067626953125, 24.084228515625, 24.8616943359375, 25.63916015625, 26.4166259765625, 27.194091796875, 27.9715576171875, 28.7490234375, 29.5264892578125, 30.303955078125, 31.0814208984375, 31.85888671875, 32.6363525390625, 33.413818359375, 34.1912841796875, 34.96875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 107.0, 432.0, 384.0, 76.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.24429321289062, -108.3926773071289, -105.54106903076172, -102.689453125, -99.83783721923828, -96.9862289428711, -94.13461303710938, -91.28300476074219, -88.43138885498047, -85.57977294921875, -82.72816467285156, -79.87654876708984, -77.02493286132812, -74.17332458496094, -71.32170867919922, -68.4700927734375, -65.61848449707031, -62.76687240600586, -59.91525650024414, -57.06364440917969, -54.212032318115234, -51.36042022705078, -48.50880432128906, -45.65719223022461, -42.805572509765625, -39.95396041870117, -37.10234451293945, -34.250732421875, -31.399120330810547, -28.54750633239746, -25.695892333984375, -22.844280242919922, -19.99266815185547, -17.141054153442383, -14.28944206237793, -11.437828063964844, -8.586215019226074, -5.734601974487305, -2.8829879760742188, -0.031375885009765625, 2.8202381134033203, 5.67185115814209, 8.52346420288086, 11.375078201293945, 14.226691246032715, 17.078304290771484, 19.92991828918457, 22.781530380249023, 25.63314437866211, 28.484758377075195, 31.33637046813965, 34.187984466552734, 37.03959655761719, 39.891212463378906, 42.74282455444336, 45.59443664550781, 48.44605255126953, 51.297664642333984, 54.1492805480957, 57.000892639160156, 59.85250473022461, 62.70411682128906, 65.55573272705078, 68.4073486328125, 71.25895690917969]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 10.0, 8.0, 12.0, 16.0, 17.0, 22.0, 19.0, 21.0, 27.0, 37.0, 34.0, 36.0, 33.0, 43.0, 50.0, 39.0, 46.0, 31.0, 30.0, 41.0, 36.0, 45.0, 36.0, 44.0, 28.0, 28.0, 25.0, 22.0, 22.0, 19.0, 11.0, 17.0, 10.0, 10.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-19.536033630371094, -18.953569412231445, -18.37110710144043, -17.78864288330078, -17.206178665161133, -16.623716354370117, -16.04125213623047, -15.458788871765137, -14.876325607299805, -14.293862342834473, -13.711398124694824, -13.128934860229492, -12.54647159576416, -11.964008331298828, -11.38154411315918, -10.799080848693848, -10.2166166305542, -9.634153366088867, -9.051689147949219, -8.469225883483887, -7.886762619018555, -7.3042988777160645, -6.721835136413574, -6.139371871948242, -5.556908130645752, -4.974444389343262, -4.39198112487793, -3.8095173835754395, -3.2270538806915283, -2.644590377807617, -2.062126636505127, -1.479663372039795, -0.8971996307373047, -0.3147360682487488, 0.26772749423980713, 0.8501911163330078, 1.432654619216919, 2.01511812210083, 2.5975818634033203, 3.1800451278686523, 3.7625088691711426, 4.344972610473633, 4.927435874938965, 5.509899616241455, 6.092363357543945, 6.674826622009277, 7.257290363311768, 7.8397536277771, 8.42221736907959, 9.004680633544922, 9.58714485168457, 10.169608116149902, 10.752071380615234, 11.334535598754883, 11.916998863220215, 12.499462127685547, 13.081926345825195, 13.664389610290527, 14.246853828430176, 14.829317092895508, 15.41178035736084, 15.994243621826172, 16.57670783996582, 17.15917205810547, 17.741634368896484]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 12.0, 8.0, 18.0, 13.0, 19.0, 28.0, 38.0, 27.0, 29.0, 36.0, 46.0, 36.0, 45.0, 51.0, 58.0, 40.0, 46.0, 51.0, 38.0, 41.0, 33.0, 34.0, 30.0, 31.0, 37.0, 18.0, 25.0, 18.0, 11.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.4609375, -4.343902587890625, -4.22686767578125, -4.109832763671875, -3.9927978515625, -3.875762939453125, -3.75872802734375, -3.641693115234375, -3.524658203125, -3.407623291015625, -3.29058837890625, -3.173553466796875, -3.0565185546875, -2.939483642578125, -2.82244873046875, -2.705413818359375, -2.58837890625, -2.471343994140625, -2.35430908203125, -2.237274169921875, -2.1202392578125, -2.003204345703125, -1.88616943359375, -1.769134521484375, -1.652099609375, -1.535064697265625, -1.41802978515625, -1.300994873046875, -1.1839599609375, -1.066925048828125, -0.94989013671875, -0.832855224609375, -0.7158203125, -0.598785400390625, -0.48175048828125, -0.364715576171875, -0.2476806640625, -0.130645751953125, -0.01361083984375, 0.103424072265625, 0.220458984375, 0.337493896484375, 0.45452880859375, 0.571563720703125, 0.6885986328125, 0.805633544921875, 0.92266845703125, 1.039703369140625, 1.15673828125, 1.273773193359375, 1.39080810546875, 1.507843017578125, 1.6248779296875, 1.741912841796875, 1.85894775390625, 1.975982666015625, 2.093017578125, 2.210052490234375, 2.32708740234375, 2.444122314453125, 2.5611572265625, 2.678192138671875, 2.79522705078125, 2.912261962890625, 3.029296875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 16.0, 22.0, 28.0, 58.0, 72.0, 94.0, 145.0, 225.0, 290.0, 456.0, 691.0, 917.0, 1422.0, 1965.0, 2951.0, 4023.0, 5814.0, 8666.0, 12424.0, 18592.0, 27952.0, 43040.0, 69962.0, 115558.0, 181873.0, 197081.0, 130305.0, 79765.0, 48647.0, 30906.0, 20249.0, 13717.0, 9458.0, 6453.0, 4591.0, 3148.0, 2161.0, 1481.0, 1026.0, 715.0, 527.0, 311.0, 245.0, 141.0, 130.0, 80.0, 46.0, 43.0, 29.0, 18.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0], "bins": [-0.34521484375, -0.3347930908203125, -0.324371337890625, -0.3139495849609375, -0.30352783203125, -0.2931060791015625, -0.282684326171875, -0.2722625732421875, -0.2618408203125, -0.2514190673828125, -0.240997314453125, -0.2305755615234375, -0.22015380859375, -0.2097320556640625, -0.199310302734375, -0.1888885498046875, -0.178466796875, -0.1680450439453125, -0.157623291015625, -0.1472015380859375, -0.13677978515625, -0.1263580322265625, -0.115936279296875, -0.1055145263671875, -0.0950927734375, -0.0846710205078125, -0.074249267578125, -0.0638275146484375, -0.05340576171875, -0.0429840087890625, -0.032562255859375, -0.0221405029296875, -0.01171875, -0.0012969970703125, 0.009124755859375, 0.0195465087890625, 0.02996826171875, 0.0403900146484375, 0.050811767578125, 0.0612335205078125, 0.0716552734375, 0.0820770263671875, 0.092498779296875, 0.1029205322265625, 0.11334228515625, 0.1237640380859375, 0.134185791015625, 0.1446075439453125, 0.155029296875, 0.1654510498046875, 0.175872802734375, 0.1862945556640625, 0.19671630859375, 0.2071380615234375, 0.217559814453125, 0.2279815673828125, 0.2384033203125, 0.2488250732421875, 0.259246826171875, 0.2696685791015625, 0.28009033203125, 0.2905120849609375, 0.300933837890625, 0.3113555908203125, 0.32177734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 7.0, 9.0, 9.0, 13.0, 14.0, 12.0, 17.0, 21.0, 18.0, 21.0, 20.0, 40.0, 31.0, 47.0, 40.0, 34.0, 28.0, 39.0, 43.0, 1059.0, 32.0, 38.0, 30.0, 34.0, 28.0, 29.0, 33.0, 29.0, 31.0, 23.0, 33.0, 20.0, 19.0, 14.0, 13.0, 8.0, 12.0, 15.0, 11.0, 9.0, 5.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.921875, -1.8609466552734375, -1.800018310546875, -1.7390899658203125, -1.67816162109375, -1.6172332763671875, -1.556304931640625, -1.4953765869140625, -1.4344482421875, -1.3735198974609375, -1.312591552734375, -1.2516632080078125, -1.19073486328125, -1.1298065185546875, -1.068878173828125, -1.0079498291015625, -0.947021484375, -0.8860931396484375, -0.825164794921875, -0.7642364501953125, -0.70330810546875, -0.6423797607421875, -0.581451416015625, -0.5205230712890625, -0.4595947265625, -0.3986663818359375, -0.337738037109375, -0.2768096923828125, -0.21588134765625, -0.1549530029296875, -0.094024658203125, -0.0330963134765625, 0.02783203125, 0.0887603759765625, 0.149688720703125, 0.2106170654296875, 0.27154541015625, 0.3324737548828125, 0.393402099609375, 0.4543304443359375, 0.5152587890625, 0.5761871337890625, 0.637115478515625, 0.6980438232421875, 0.75897216796875, 0.8199005126953125, 0.880828857421875, 0.9417572021484375, 1.002685546875, 1.0636138916015625, 1.124542236328125, 1.1854705810546875, 1.24639892578125, 1.3073272705078125, 1.368255615234375, 1.4291839599609375, 1.4901123046875, 1.5510406494140625, 1.611968994140625, 1.6728973388671875, 1.73382568359375, 1.7947540283203125, 1.855682373046875, 1.9166107177734375, 1.9775390625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 22.0, 37.0, 47.0, 80.0, 144.0, 205.0, 324.0, 516.0, 753.0, 1285.0, 1997.0, 3355.0, 5610.0, 9706.0, 16581.0, 30057.0, 54682.0, 103819.0, 202310.0, 1317646.0, 161382.0, 83147.0, 44288.0, 24668.0, 14073.0, 8179.0, 4827.0, 2867.0, 1652.0, 1050.0, 624.0, 433.0, 266.0, 168.0, 107.0, 63.0, 46.0, 27.0, 22.0, 14.0, 13.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.41552734375, -0.4034233093261719, -0.39131927490234375, -0.3792152404785156, -0.3671112060546875, -0.3550071716308594, -0.34290313720703125, -0.3307991027832031, -0.318695068359375, -0.3065910339355469, -0.29448699951171875, -0.2823829650878906, -0.2702789306640625, -0.2581748962402344, -0.24607086181640625, -0.23396682739257812, -0.22186279296875, -0.20975875854492188, -0.19765472412109375, -0.18555068969726562, -0.1734466552734375, -0.16134262084960938, -0.14923858642578125, -0.13713455200195312, -0.125030517578125, -0.11292648315429688, -0.10082244873046875, -0.08871841430664062, -0.0766143798828125, -0.06451034545898438, -0.05240631103515625, -0.040302276611328125, -0.0281982421875, -0.016094207763671875, -0.00399017333984375, 0.008113861083984375, 0.0202178955078125, 0.032321929931640625, 0.04442596435546875, 0.056529998779296875, 0.068634033203125, 0.08073806762695312, 0.09284210205078125, 0.10494613647460938, 0.1170501708984375, 0.12915420532226562, 0.14125823974609375, 0.15336227416992188, 0.16546630859375, 0.17757034301757812, 0.18967437744140625, 0.20177841186523438, 0.2138824462890625, 0.22598648071289062, 0.23809051513671875, 0.2501945495605469, 0.262298583984375, 0.2744026184082031, 0.28650665283203125, 0.2986106872558594, 0.3107147216796875, 0.3228187561035156, 0.33492279052734375, 0.3470268249511719, 0.359130859375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 4.0, 6.0, 13.0, 15.0, 20.0, 26.0, 40.0, 44.0, 58.0, 68.0, 87.0, 81.0, 84.0, 85.0, 57.0, 59.0, 50.0, 48.0, 34.0, 26.0, 19.0, 12.0, 13.0, 17.0, 6.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.001800537109375, -0.0017509311437606812, -0.0017013251781463623, -0.0016517192125320435, -0.0016021132469177246, -0.0015525072813034058, -0.001502901315689087, -0.001453295350074768, -0.0014036893844604492, -0.0013540834188461304, -0.0013044774532318115, -0.0012548714876174927, -0.0012052655220031738, -0.001155659556388855, -0.0011060535907745361, -0.0010564476251602173, -0.0010068416595458984, -0.0009572356939315796, -0.0009076297283172607, -0.0008580237627029419, -0.000808417797088623, -0.0007588118314743042, -0.0007092058658599854, -0.0006595999002456665, -0.0006099939346313477, -0.0005603879690170288, -0.00051078200340271, -0.0004611760377883911, -0.00041157007217407227, -0.0003619641065597534, -0.00031235814094543457, -0.0002627521753311157, -0.00021314620971679688, -0.00016354024410247803, -0.00011393427848815918, -6.432831287384033e-05, -1.4722347259521484e-05, 3.488361835479736e-05, 8.448958396911621e-05, 0.00013409554958343506, 0.0001837015151977539, 0.00023330748081207275, 0.0002829134464263916, 0.00033251941204071045, 0.0003821253776550293, 0.00043173134326934814, 0.000481337308883667, 0.0005309432744979858, 0.0005805492401123047, 0.0006301552057266235, 0.0006797611713409424, 0.0007293671369552612, 0.0007789731025695801, 0.0008285790681838989, 0.0008781850337982178, 0.0009277909994125366, 0.0009773969650268555, 0.0010270029306411743, 0.0010766088962554932, 0.001126214861869812, 0.0011758208274841309, 0.0012254267930984497, 0.0012750327587127686, 0.0013246387243270874, 0.0013742446899414062]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 7.0, 8.0, 6.0, 11.0, 18.0, 23.0, 25.0, 37.0, 43.0, 73.0, 108.0, 156.0, 254.0, 618.0, 5978.0, 1036566.0, 3377.0, 548.0, 263.0, 143.0, 98.0, 55.0, 43.0, 28.0, 23.0, 11.0, 7.0, 3.0, 7.0, 3.0, 2.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0294647216796875, -0.028391122817993164, -0.027317523956298828, -0.026243925094604492, -0.025170326232910156, -0.02409672737121582, -0.023023128509521484, -0.02194952964782715, -0.020875930786132812, -0.019802331924438477, -0.01872873306274414, -0.017655134201049805, -0.01658153533935547, -0.015507936477661133, -0.014434337615966797, -0.013360738754272461, -0.012287139892578125, -0.011213541030883789, -0.010139942169189453, -0.009066343307495117, -0.007992744445800781, -0.006919145584106445, -0.005845546722412109, -0.0047719478607177734, -0.0036983489990234375, -0.0026247501373291016, -0.0015511512756347656, -0.0004775524139404297, 0.0005960464477539062, 0.0016696453094482422, 0.002743244171142578, 0.003816843032836914, 0.00489044189453125, 0.005964040756225586, 0.007037639617919922, 0.008111238479614258, 0.009184837341308594, 0.01025843620300293, 0.011332035064697266, 0.012405633926391602, 0.013479232788085938, 0.014552831649780273, 0.01562643051147461, 0.016700029373168945, 0.01777362823486328, 0.018847227096557617, 0.019920825958251953, 0.02099442481994629, 0.022068023681640625, 0.02314162254333496, 0.024215221405029297, 0.025288820266723633, 0.02636241912841797, 0.027436017990112305, 0.02850961685180664, 0.029583215713500977, 0.030656814575195312, 0.03173041343688965, 0.032804012298583984, 0.03387761116027832, 0.034951210021972656, 0.03602480888366699, 0.03709840774536133, 0.038172006607055664, 0.03924560546875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 56.0, 274.0, 409.0, 215.0, 44.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004250251222401857, -0.004160590935498476, -0.004070930648595095, -0.003981270361691713, -0.003891610074788332, -0.0038019500207155943, -0.003712289733812213, -0.0036226294469088316, -0.0035329691600054502, -0.003443308873102069, -0.0033536485861986876, -0.003263988299295306, -0.0031743282452225685, -0.003084667958319187, -0.002995007671415806, -0.0029053473845124245, -0.002815687097609043, -0.0027260268107056618, -0.0026363665238022804, -0.002546706236898899, -0.0024570459499955177, -0.00236738589592278, -0.0022777256090193987, -0.0021880653221160173, -0.002098405035212636, -0.0020087447483092546, -0.0019190844614058733, -0.0018294242909178138, -0.0017397640040144324, -0.001650103717111051, -0.0015604435466229916, -0.0014707832597196102, -0.0013811230892315507, -0.0012914628023281693, -0.0012018026318401098, -0.0011121423449367285, -0.0010224820580333471, -0.0009328217711299658, -0.0008431615424342453, -0.0007535013137385249, -0.0006638410268351436, -0.0005741807399317622, -0.0004845205112360418, -0.0003948602534364909, -0.00030519999563694, -0.0002155397378373891, -0.00012587948003783822, -3.6219251342117786e-05, 5.344103556126356e-05, 0.00014310129336081445, 0.00023276155116036534, 0.00032242180895991623, 0.0004120820667594671, 0.0005017423536628485, 0.0005914025823585689, 0.0006810628110542893, 0.0007707230979576707, 0.000860383384861052, 0.0009500436135567725, 0.001039703842252493, 0.0011293641291558743, 0.0012190244160592556, 0.001308684702962637, 0.0013983448734506965, 0.0014880051603540778]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 13.0, 12.0, 21.0, 11.0, 13.0, 22.0, 23.0, 30.0, 29.0, 31.0, 45.0, 39.0, 31.0, 38.0, 55.0, 37.0, 42.0, 42.0, 42.0, 45.0, 45.0, 38.0, 30.0, 40.0, 33.0, 29.0, 30.0, 22.0, 20.0, 15.0, 19.0, 12.0, 8.0, 12.0, 9.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007501840591430664, -0.0007274607196450233, -0.0007047373801469803, -0.0006820140406489372, -0.0006592907011508942, -0.0006365673616528511, -0.000613844022154808, -0.000591120682656765, -0.0005683973431587219, -0.0005456740036606789, -0.0005229506641626358, -0.0005002273246645927, -0.0004775039851665497, -0.0004547806456685066, -0.00043205730617046356, -0.0004093339666724205, -0.00038661062717437744, -0.0003638872876763344, -0.0003411639481782913, -0.00031844060868024826, -0.0002957172691822052, -0.00027299392968416214, -0.0002502705901861191, -0.00022754725068807602, -0.00020482391119003296, -0.0001821005716919899, -0.00015937723219394684, -0.00013665389269590378, -0.00011393055319786072, -9.120721369981766e-05, -6.84838742017746e-05, -4.576053470373154e-05, -2.3037195205688477e-05, -3.1385570764541626e-07, 2.2409483790397644e-05, 4.5132823288440704e-05, 6.785616278648376e-05, 9.057950228452682e-05, 0.00011330284178256989, 0.00013602618128061295, 0.000158749520778656, 0.00018147286027669907, 0.00020419619977474213, 0.0002269195392727852, 0.00024964287877082825, 0.0002723662182688713, 0.00029508955776691437, 0.00031781289726495743, 0.0003405362367630005, 0.00036325957626104355, 0.0003859829157590866, 0.00040870625525712967, 0.00043142959475517273, 0.0004541529342532158, 0.00047687627375125885, 0.0004995996132493019, 0.000522322952747345, 0.000545046292245388, 0.0005677696317434311, 0.0005904929712414742, 0.0006132163107395172, 0.0006359396502375603, 0.0006586629897356033, 0.0006813863292336464, 0.0007041096687316895]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 1.0, 4.0, 6.0, 11.0, 12.0, 8.0, 18.0, 13.0, 19.0, 28.0, 38.0, 27.0, 29.0, 36.0, 46.0, 36.0, 45.0, 51.0, 58.0, 40.0, 46.0, 51.0, 38.0, 41.0, 33.0, 34.0, 30.0, 31.0, 37.0, 18.0, 25.0, 18.0, 11.0, 14.0, 7.0, 8.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.4609375, -4.343902587890625, -4.22686767578125, -4.109832763671875, -3.9927978515625, -3.875762939453125, -3.75872802734375, -3.641693115234375, -3.524658203125, -3.407623291015625, -3.29058837890625, -3.173553466796875, -3.0565185546875, -2.939483642578125, -2.82244873046875, -2.705413818359375, -2.58837890625, -2.471343994140625, -2.35430908203125, -2.237274169921875, -2.1202392578125, -2.003204345703125, -1.88616943359375, -1.769134521484375, -1.652099609375, -1.535064697265625, -1.41802978515625, -1.300994873046875, -1.1839599609375, -1.066925048828125, -0.94989013671875, -0.832855224609375, -0.7158203125, -0.598785400390625, -0.48175048828125, -0.364715576171875, -0.2476806640625, -0.130645751953125, -0.01361083984375, 0.103424072265625, 0.220458984375, 0.337493896484375, 0.45452880859375, 0.571563720703125, 0.6885986328125, 0.805633544921875, 0.92266845703125, 1.039703369140625, 1.15673828125, 1.273773193359375, 1.39080810546875, 1.507843017578125, 1.6248779296875, 1.741912841796875, 1.85894775390625, 1.975982666015625, 2.093017578125, 2.210052490234375, 2.32708740234375, 2.444122314453125, 2.5611572265625, 2.678192138671875, 2.79522705078125, 2.912261962890625, 3.029296875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 9.0, 10.0, 13.0, 14.0, 14.0, 32.0, 36.0, 37.0, 61.0, 83.0, 110.0, 162.0, 208.0, 307.0, 594.0, 1921.0, 8857.0, 43044.0, 317043.0, 573486.0, 81744.0, 15361.0, 3288.0, 840.0, 393.0, 233.0, 161.0, 125.0, 98.0, 65.0, 54.0, 34.0, 23.0, 16.0, 25.0, 16.0, 6.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-8.0390625, -7.8284912109375, -7.617919921875, -7.4073486328125, -7.19677734375, -6.9862060546875, -6.775634765625, -6.5650634765625, -6.3544921875, -6.1439208984375, -5.933349609375, -5.7227783203125, -5.51220703125, -5.3016357421875, -5.091064453125, -4.8804931640625, -4.669921875, -4.4593505859375, -4.248779296875, -4.0382080078125, -3.82763671875, -3.6170654296875, -3.406494140625, -3.1959228515625, -2.9853515625, -2.7747802734375, -2.564208984375, -2.3536376953125, -2.14306640625, -1.9324951171875, -1.721923828125, -1.5113525390625, -1.30078125, -1.0902099609375, -0.879638671875, -0.6690673828125, -0.45849609375, -0.2479248046875, -0.037353515625, 0.1732177734375, 0.3837890625, 0.5943603515625, 0.804931640625, 1.0155029296875, 1.22607421875, 1.4366455078125, 1.647216796875, 1.8577880859375, 2.068359375, 2.2789306640625, 2.489501953125, 2.7000732421875, 2.91064453125, 3.1212158203125, 3.331787109375, 3.5423583984375, 3.7529296875, 3.9635009765625, 4.174072265625, 4.3846435546875, 4.59521484375, 4.8057861328125, 5.016357421875, 5.2269287109375, 5.4375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 10.0, 12.0, 12.0, 17.0, 17.0, 21.0, 16.0, 32.0, 30.0, 23.0, 23.0, 32.0, 38.0, 41.0, 56.0, 71.0, 182.0, 1515.0, 353.0, 104.0, 64.0, 37.0, 30.0, 41.0, 32.0, 33.0, 30.0, 29.0, 17.0, 21.0, 23.0, 9.0, 5.0, 8.0, 6.0, 10.0, 10.0, 3.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.6759033203125, -9.328369140625, -8.9808349609375, -8.63330078125, -8.2857666015625, -7.938232421875, -7.5906982421875, -7.2431640625, -6.8956298828125, -6.548095703125, -6.2005615234375, -5.85302734375, -5.5054931640625, -5.157958984375, -4.8104248046875, -4.462890625, -4.1153564453125, -3.767822265625, -3.4202880859375, -3.07275390625, -2.7252197265625, -2.377685546875, -2.0301513671875, -1.6826171875, -1.3350830078125, -0.987548828125, -0.6400146484375, -0.29248046875, 0.0550537109375, 0.402587890625, 0.7501220703125, 1.09765625, 1.4451904296875, 1.792724609375, 2.1402587890625, 2.48779296875, 2.8353271484375, 3.182861328125, 3.5303955078125, 3.8779296875, 4.2254638671875, 4.572998046875, 4.9205322265625, 5.26806640625, 5.6156005859375, 5.963134765625, 6.3106689453125, 6.658203125, 7.0057373046875, 7.353271484375, 7.7008056640625, 8.04833984375, 8.3958740234375, 8.743408203125, 9.0909423828125, 9.4384765625, 9.7860107421875, 10.133544921875, 10.4810791015625, 10.82861328125, 11.1761474609375, 11.523681640625, 11.8712158203125, 12.21875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 10.0, 5.0, 14.0, 13.0, 10.0, 16.0, 15.0, 24.0, 20.0, 41.0, 48.0, 60.0, 73.0, 118.0, 172.0, 240.0, 476.0, 1417.0, 20831.0, 3072607.0, 46033.0, 1879.0, 592.0, 298.0, 165.0, 112.0, 84.0, 50.0, 56.0, 37.0, 36.0, 33.0, 16.0, 21.0, 15.0, 11.0, 14.0, 8.0, 5.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.6875, -24.8740234375, -24.060546875, -23.2470703125, -22.43359375, -21.6201171875, -20.806640625, -19.9931640625, -19.1796875, -18.3662109375, -17.552734375, -16.7392578125, -15.92578125, -15.1123046875, -14.298828125, -13.4853515625, -12.671875, -11.8583984375, -11.044921875, -10.2314453125, -9.41796875, -8.6044921875, -7.791015625, -6.9775390625, -6.1640625, -5.3505859375, -4.537109375, -3.7236328125, -2.91015625, -2.0966796875, -1.283203125, -0.4697265625, 0.34375, 1.1572265625, 1.970703125, 2.7841796875, 3.59765625, 4.4111328125, 5.224609375, 6.0380859375, 6.8515625, 7.6650390625, 8.478515625, 9.2919921875, 10.10546875, 10.9189453125, 11.732421875, 12.5458984375, 13.359375, 14.1728515625, 14.986328125, 15.7998046875, 16.61328125, 17.4267578125, 18.240234375, 19.0537109375, 19.8671875, 20.6806640625, 21.494140625, 22.3076171875, 23.12109375, 23.9345703125, 24.748046875, 25.5615234375, 26.375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 9.0, 24.0, 83.0, 177.0, 253.0, 223.0, 157.0, 54.0, 19.0, 9.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.79281234741211, -38.02808380126953, -37.26335525512695, -36.49863052368164, -35.73390197753906, -34.969173431396484, -34.204444885253906, -33.439720153808594, -32.674991607666016, -31.910263061523438, -31.145536422729492, -30.380807876586914, -29.61608123779297, -28.85135269165039, -28.086626052856445, -27.321897506713867, -26.557170867919922, -25.792442321777344, -25.0277156829834, -24.26298713684082, -23.498260498046875, -22.733531951904297, -21.96880531311035, -21.204076766967773, -20.439348220825195, -19.674619674682617, -18.909893035888672, -18.145164489746094, -17.38043785095215, -16.61570930480957, -15.850982666015625, -15.086254119873047, -14.321528434753418, -13.556800842285156, -12.792073249816895, -12.027345657348633, -11.262618064880371, -10.49789047241211, -9.733161926269531, -8.968435287475586, -8.203706741333008, -7.438979148864746, -6.674251556396484, -5.909523963928223, -5.144796371459961, -4.380068778991699, -3.6153407096862793, -2.8506131172180176, -2.085886001586914, -1.3211584091186523, -0.5564306974411011, 0.2082970142364502, 0.9730246067047119, 1.7377521991729736, 2.5024800300598145, 3.267207622528076, 4.031935214996338, 4.7966628074646, 5.561390399932861, 6.326118469238281, 7.090846061706543, 7.855573654174805, 8.620301246643066, 9.385028839111328, 10.14975643157959]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 3.0, 5.0, 4.0, 11.0, 7.0, 8.0, 9.0, 18.0, 18.0, 20.0, 19.0, 14.0, 22.0, 23.0, 22.0, 32.0, 38.0, 47.0, 26.0, 34.0, 44.0, 49.0, 31.0, 44.0, 45.0, 36.0, 37.0, 37.0, 31.0, 28.0, 31.0, 25.0, 23.0, 20.0, 21.0, 14.0, 24.0, 11.0, 7.0, 9.0, 11.0, 9.0, 10.0, 6.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.435688018798828, -22.652280807495117, -21.868873596191406, -21.085464477539062, -20.30205726623535, -19.51865005493164, -18.73524284362793, -17.95183563232422, -17.168426513671875, -16.385019302368164, -15.601611137390137, -14.818203926086426, -14.034795761108398, -13.251388549804688, -12.467981338500977, -11.684574127197266, -10.901166915893555, -10.117759704589844, -9.334351539611816, -8.550944328308105, -7.767536640167236, -6.984128952026367, -6.200721740722656, -5.417314052581787, -4.633906364440918, -3.850498676300049, -3.067091226577759, -2.2836837768554688, -1.5002760887145996, -0.7168684005737305, 0.06653881072998047, 0.8499464988708496, 1.6333541870117188, 2.416761875152588, 3.200169324874878, 3.983576774597168, 4.766984462738037, 5.550392150878906, 6.333799362182617, 7.117207050323486, 7.9006147384643555, 8.684021949768066, 9.467430114746094, 10.250837326049805, 11.034244537353516, 11.817652702331543, 12.601059913635254, 13.384468078613281, 14.167875289916992, 14.951282501220703, 15.73469066619873, 16.518096923828125, 17.30150604248047, 18.08491325378418, 18.86832046508789, 19.6517276763916, 20.435134887695312, 21.218542098999023, 22.001949310302734, 22.785358428955078, 23.56876564025879, 24.3521728515625, 25.13558006286621, 25.918987274169922, 26.702396392822266]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 3.0, 9.0, 4.0, 13.0, 15.0, 16.0, 17.0, 18.0, 27.0, 39.0, 24.0, 32.0, 45.0, 49.0, 56.0, 52.0, 46.0, 62.0, 48.0, 49.0, 32.0, 43.0, 39.0, 44.0, 42.0, 38.0, 23.0, 26.0, 16.0, 18.0, 13.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9346923828125, -4.795166015625, -4.6556396484375, -4.51611328125, -4.3765869140625, -4.237060546875, -4.0975341796875, -3.9580078125, -3.8184814453125, -3.678955078125, -3.5394287109375, -3.39990234375, -3.2603759765625, -3.120849609375, -2.9813232421875, -2.841796875, -2.7022705078125, -2.562744140625, -2.4232177734375, -2.28369140625, -2.1441650390625, -2.004638671875, -1.8651123046875, -1.7255859375, -1.5860595703125, -1.446533203125, -1.3070068359375, -1.16748046875, -1.0279541015625, -0.888427734375, -0.7489013671875, -0.609375, -0.4698486328125, -0.330322265625, -0.1907958984375, -0.05126953125, 0.0882568359375, 0.227783203125, 0.3673095703125, 0.5068359375, 0.6463623046875, 0.785888671875, 0.9254150390625, 1.06494140625, 1.2044677734375, 1.343994140625, 1.4835205078125, 1.623046875, 1.7625732421875, 1.902099609375, 2.0416259765625, 2.18115234375, 2.3206787109375, 2.460205078125, 2.5997314453125, 2.7392578125, 2.8787841796875, 3.018310546875, 3.1578369140625, 3.29736328125, 3.4368896484375, 3.576416015625, 3.7159423828125, 3.85546875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 9.0, 12.0, 16.0, 10.0, 15.0, 34.0, 31.0, 40.0, 49.0, 65.0, 90.0, 147.0, 368.0, 1603.0, 27088.0, 887211.0, 2946450.0, 319641.0, 9772.0, 882.0, 250.0, 122.0, 87.0, 69.0, 45.0, 42.0, 27.0, 19.0, 21.0, 17.0, 13.0, 11.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.9921875, -10.689697265625, -10.38720703125, -10.084716796875, -9.7822265625, -9.479736328125, -9.17724609375, -8.874755859375, -8.572265625, -8.269775390625, -7.96728515625, -7.664794921875, -7.3623046875, -7.059814453125, -6.75732421875, -6.454833984375, -6.15234375, -5.849853515625, -5.54736328125, -5.244873046875, -4.9423828125, -4.639892578125, -4.33740234375, -4.034912109375, -3.732421875, -3.429931640625, -3.12744140625, -2.824951171875, -2.5224609375, -2.219970703125, -1.91748046875, -1.614990234375, -1.3125, -1.010009765625, -0.70751953125, -0.405029296875, -0.1025390625, 0.199951171875, 0.50244140625, 0.804931640625, 1.107421875, 1.409912109375, 1.71240234375, 2.014892578125, 2.3173828125, 2.619873046875, 2.92236328125, 3.224853515625, 3.52734375, 3.829833984375, 4.13232421875, 4.434814453125, 4.7373046875, 5.039794921875, 5.34228515625, 5.644775390625, 5.947265625, 6.249755859375, 6.55224609375, 6.854736328125, 7.1572265625, 7.459716796875, 7.76220703125, 8.064697265625, 8.3671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 12.0, 11.0, 16.0, 19.0, 27.0, 23.0, 49.0, 66.0, 83.0, 118.0, 139.0, 195.0, 272.0, 308.0, 387.0, 429.0, 418.0, 346.0, 302.0, 190.0, 171.0, 114.0, 93.0, 81.0, 40.0, 50.0, 30.0, 18.0, 9.0, 11.0, 9.0, 11.0, 5.0, 3.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.3359375, -6.16796875, -6.0, -5.83203125, -5.6640625, -5.49609375, -5.328125, -5.16015625, -4.9921875, -4.82421875, -4.65625, -4.48828125, -4.3203125, -4.15234375, -3.984375, -3.81640625, -3.6484375, -3.48046875, -3.3125, -3.14453125, -2.9765625, -2.80859375, -2.640625, -2.47265625, -2.3046875, -2.13671875, -1.96875, -1.80078125, -1.6328125, -1.46484375, -1.296875, -1.12890625, -0.9609375, -0.79296875, -0.625, -0.45703125, -0.2890625, -0.12109375, 0.046875, 0.21484375, 0.3828125, 0.55078125, 0.71875, 0.88671875, 1.0546875, 1.22265625, 1.390625, 1.55859375, 1.7265625, 1.89453125, 2.0625, 2.23046875, 2.3984375, 2.56640625, 2.734375, 2.90234375, 3.0703125, 3.23828125, 3.40625, 3.57421875, 3.7421875, 3.91015625, 4.078125, 4.24609375, 4.4140625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 15.0, 16.0, 23.0, 30.0, 54.0, 71.0, 89.0, 144.0, 183.0, 273.0, 330.0, 597.0, 1472.0, 7947.0, 133455.0, 2928841.0, 1076976.0, 37774.0, 3305.0, 1003.0, 501.0, 331.0, 237.0, 158.0, 112.0, 87.0, 68.0, 46.0, 31.0, 28.0, 20.0, 11.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.3638916015625, -9.962158203125, -9.5604248046875, -9.15869140625, -8.7569580078125, -8.355224609375, -7.9534912109375, -7.5517578125, -7.1500244140625, -6.748291015625, -6.3465576171875, -5.94482421875, -5.5430908203125, -5.141357421875, -4.7396240234375, -4.337890625, -3.9361572265625, -3.534423828125, -3.1326904296875, -2.73095703125, -2.3292236328125, -1.927490234375, -1.5257568359375, -1.1240234375, -0.7222900390625, -0.320556640625, 0.0811767578125, 0.48291015625, 0.8846435546875, 1.286376953125, 1.6881103515625, 2.08984375, 2.4915771484375, 2.893310546875, 3.2950439453125, 3.69677734375, 4.0985107421875, 4.500244140625, 4.9019775390625, 5.3037109375, 5.7054443359375, 6.107177734375, 6.5089111328125, 6.91064453125, 7.3123779296875, 7.714111328125, 8.1158447265625, 8.517578125, 8.9193115234375, 9.321044921875, 9.7227783203125, 10.12451171875, 10.5262451171875, 10.927978515625, 11.3297119140625, 11.7314453125, 12.1331787109375, 12.534912109375, 12.9366455078125, 13.33837890625, 13.7401123046875, 14.141845703125, 14.5435791015625, 14.9453125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 12.0, 37.0, 118.0, 180.0, 223.0, 221.0, 133.0, 57.0, 25.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.236835479736328, -28.908466339111328, -27.580097198486328, -26.251728057861328, -24.923358917236328, -23.594989776611328, -22.266620635986328, -20.938251495361328, -19.609882354736328, -18.281513214111328, -16.953144073486328, -15.624774932861328, -14.296405792236328, -12.968036651611328, -11.639667510986328, -10.311298370361328, -8.982929229736328, -7.654560089111328, -6.326190948486328, -4.997821807861328, -3.669452667236328, -2.341083526611328, -1.0127143859863281, 0.3156547546386719, 1.6440238952636719, 2.972393035888672, 4.300762176513672, 5.629131317138672, 6.957500457763672, 8.285869598388672, 9.614238739013672, 10.942607879638672, 12.270973205566406, 13.599342346191406, 14.927711486816406, 16.256080627441406, 17.584449768066406, 18.912818908691406, 20.241188049316406, 21.569557189941406, 22.897926330566406, 24.226295471191406, 25.554664611816406, 26.883033752441406, 28.211402893066406, 29.539772033691406, 30.868141174316406, 32.196510314941406, 33.524879455566406, 34.853248596191406, 36.181617736816406, 37.509986877441406, 38.838356018066406, 40.166725158691406, 41.495094299316406, 42.823463439941406, 44.151832580566406, 45.480201721191406, 46.808570861816406, 48.136940002441406, 49.465309143066406, 50.793678283691406, 52.122047424316406, 53.450416564941406, 54.778785705566406]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 5.0, 14.0, 21.0, 12.0, 17.0, 25.0, 24.0, 27.0, 35.0, 33.0, 32.0, 38.0, 34.0, 49.0, 46.0, 50.0, 48.0, 46.0, 47.0, 42.0, 42.0, 32.0, 23.0, 38.0, 34.0, 40.0, 35.0, 16.0, 20.0, 13.0, 16.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.979721069335938, -19.31089210510254, -18.64206314086914, -17.973234176635742, -17.304405212402344, -16.635576248168945, -15.966747283935547, -15.297918319702148, -14.62908935546875, -13.960260391235352, -13.291431427001953, -12.622602462768555, -11.953773498535156, -11.284944534301758, -10.61611557006836, -9.947286605834961, -9.278457641601562, -8.609628677368164, -7.940799713134766, -7.271970748901367, -6.603141784667969, -5.93431282043457, -5.265483856201172, -4.596654891967773, -3.927825927734375, -3.2589969635009766, -2.590167999267578, -1.9213390350341797, -1.2525100708007812, -0.5836811065673828, 0.08514785766601562, 0.7539768218994141, 1.4228057861328125, 2.091634750366211, 2.7604637145996094, 3.429292678833008, 4.098121643066406, 4.766950607299805, 5.435779571533203, 6.104608535766602, 6.7734375, 7.442266464233398, 8.111095428466797, 8.779924392700195, 9.448753356933594, 10.117582321166992, 10.78641128540039, 11.455240249633789, 12.124069213867188, 12.792898178100586, 13.461727142333984, 14.130556106567383, 14.799385070800781, 15.46821403503418, 16.137042999267578, 16.805871963500977, 17.474700927734375, 18.143529891967773, 18.812358856201172, 19.48118782043457, 20.15001678466797, 20.818845748901367, 21.487674713134766, 22.156503677368164, 22.825332641601562]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 9.0, 14.0, 13.0, 13.0, 31.0, 14.0, 24.0, 23.0, 25.0, 41.0, 38.0, 28.0, 36.0, 48.0, 33.0, 42.0, 37.0, 49.0, 38.0, 46.0, 37.0, 36.0, 29.0, 45.0, 34.0, 30.0, 25.0, 22.0, 20.0, 22.0, 19.0, 12.0, 13.0, 12.0, 7.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.958984375, -3.84307861328125, -3.7271728515625, -3.61126708984375, -3.495361328125, -3.37945556640625, -3.2635498046875, -3.14764404296875, -3.03173828125, -2.91583251953125, -2.7999267578125, -2.68402099609375, -2.568115234375, -2.45220947265625, -2.3363037109375, -2.22039794921875, -2.1044921875, -1.98858642578125, -1.8726806640625, -1.75677490234375, -1.640869140625, -1.52496337890625, -1.4090576171875, -1.29315185546875, -1.17724609375, -1.06134033203125, -0.9454345703125, -0.82952880859375, -0.713623046875, -0.59771728515625, -0.4818115234375, -0.36590576171875, -0.25, -0.13409423828125, -0.0181884765625, 0.09771728515625, 0.213623046875, 0.32952880859375, 0.4454345703125, 0.56134033203125, 0.67724609375, 0.79315185546875, 0.9090576171875, 1.02496337890625, 1.140869140625, 1.25677490234375, 1.3726806640625, 1.48858642578125, 1.6044921875, 1.72039794921875, 1.8363037109375, 1.95220947265625, 2.068115234375, 2.18402099609375, 2.2999267578125, 2.41583251953125, 2.53173828125, 2.64764404296875, 2.7635498046875, 2.87945556640625, 2.995361328125, 3.11126708984375, 3.2271728515625, 3.34307861328125, 3.458984375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 8.0, 5.0, 8.0, 25.0, 19.0, 27.0, 70.0, 76.0, 108.0, 175.0, 256.0, 360.0, 506.0, 734.0, 1133.0, 1585.0, 2318.0, 3606.0, 5367.0, 7956.0, 12431.0, 19265.0, 30791.0, 50382.0, 86115.0, 151602.0, 224592.0, 181484.0, 105328.0, 60777.0, 36482.0, 22478.0, 14309.0, 9279.0, 6057.0, 4119.0, 2761.0, 1872.0, 1307.0, 865.0, 617.0, 431.0, 250.0, 185.0, 136.0, 94.0, 57.0, 51.0, 33.0, 18.0, 17.0, 13.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.370849609375, -0.3587608337402344, -0.34667205810546875, -0.3345832824707031, -0.3224945068359375, -0.3104057312011719, -0.29831695556640625, -0.2862281799316406, -0.274139404296875, -0.2620506286621094, -0.24996185302734375, -0.23787307739257812, -0.2257843017578125, -0.21369552612304688, -0.20160675048828125, -0.18951797485351562, -0.17742919921875, -0.16534042358398438, -0.15325164794921875, -0.14116287231445312, -0.1290740966796875, -0.11698532104492188, -0.10489654541015625, -0.09280776977539062, -0.080718994140625, -0.06863021850585938, -0.05654144287109375, -0.044452667236328125, -0.0323638916015625, -0.020275115966796875, -0.00818634033203125, 0.003902435302734375, 0.0159912109375, 0.028079986572265625, 0.04016876220703125, 0.052257537841796875, 0.0643463134765625, 0.07643508911132812, 0.08852386474609375, 0.10061264038085938, 0.112701416015625, 0.12479019165039062, 0.13687896728515625, 0.14896774291992188, 0.1610565185546875, 0.17314529418945312, 0.18523406982421875, 0.19732284545898438, 0.20941162109375, 0.22150039672851562, 0.23358917236328125, 0.24567794799804688, 0.2577667236328125, 0.2698554992675781, 0.28194427490234375, 0.2940330505371094, 0.306121826171875, 0.3182106018066406, 0.33029937744140625, 0.3423881530761719, 0.3544769287109375, 0.3665657043457031, 0.37865447998046875, 0.3907432556152344, 0.40283203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 8.0, 8.0, 10.0, 14.0, 19.0, 19.0, 14.0, 23.0, 17.0, 35.0, 28.0, 29.0, 23.0, 42.0, 27.0, 35.0, 39.0, 36.0, 37.0, 1072.0, 40.0, 45.0, 29.0, 32.0, 29.0, 30.0, 30.0, 31.0, 24.0, 35.0, 16.0, 21.0, 20.0, 17.0, 15.0, 9.0, 14.0, 15.0, 4.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.14453125, -2.07452392578125, -2.0045166015625, -1.93450927734375, -1.864501953125, -1.79449462890625, -1.7244873046875, -1.65447998046875, -1.58447265625, -1.51446533203125, -1.4444580078125, -1.37445068359375, -1.304443359375, -1.23443603515625, -1.1644287109375, -1.09442138671875, -1.0244140625, -0.95440673828125, -0.8843994140625, -0.81439208984375, -0.744384765625, -0.67437744140625, -0.6043701171875, -0.53436279296875, -0.46435546875, -0.39434814453125, -0.3243408203125, -0.25433349609375, -0.184326171875, -0.11431884765625, -0.0443115234375, 0.02569580078125, 0.095703125, 0.16571044921875, 0.2357177734375, 0.30572509765625, 0.375732421875, 0.44573974609375, 0.5157470703125, 0.58575439453125, 0.65576171875, 0.72576904296875, 0.7957763671875, 0.86578369140625, 0.935791015625, 1.00579833984375, 1.0758056640625, 1.14581298828125, 1.2158203125, 1.28582763671875, 1.3558349609375, 1.42584228515625, 1.495849609375, 1.56585693359375, 1.6358642578125, 1.70587158203125, 1.77587890625, 1.84588623046875, 1.9158935546875, 1.98590087890625, 2.055908203125, 2.12591552734375, 2.1959228515625, 2.26593017578125, 2.3359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 10.0, 19.0, 20.0, 46.0, 85.0, 89.0, 129.0, 195.0, 325.0, 459.0, 702.0, 1079.0, 1651.0, 2511.0, 3838.0, 6064.0, 9583.0, 15222.0, 25384.0, 43534.0, 76374.0, 139115.0, 1278204.0, 211194.0, 118201.0, 65738.0, 37937.0, 22306.0, 13555.0, 8365.0, 5220.0, 3367.0, 2162.0, 1477.0, 983.0, 626.0, 435.0, 303.0, 210.0, 130.0, 91.0, 53.0, 39.0, 31.0, 21.0, 26.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.376220703125, -0.3651123046875, -0.35400390625, -0.3428955078125, -0.331787109375, -0.3206787109375, -0.3095703125, -0.2984619140625, -0.287353515625, -0.2762451171875, -0.26513671875, -0.2540283203125, -0.242919921875, -0.2318115234375, -0.220703125, -0.2095947265625, -0.198486328125, -0.1873779296875, -0.17626953125, -0.1651611328125, -0.154052734375, -0.1429443359375, -0.1318359375, -0.1207275390625, -0.109619140625, -0.0985107421875, -0.08740234375, -0.0762939453125, -0.065185546875, -0.0540771484375, -0.04296875, -0.0318603515625, -0.020751953125, -0.0096435546875, 0.00146484375, 0.0125732421875, 0.023681640625, 0.0347900390625, 0.0458984375, 0.0570068359375, 0.068115234375, 0.0792236328125, 0.09033203125, 0.1014404296875, 0.112548828125, 0.1236572265625, 0.134765625, 0.1458740234375, 0.156982421875, 0.1680908203125, 0.17919921875, 0.1903076171875, 0.201416015625, 0.2125244140625, 0.2236328125, 0.2347412109375, 0.245849609375, 0.2569580078125, 0.26806640625, 0.2791748046875, 0.290283203125, 0.3013916015625, 0.3125, 0.3236083984375, 0.334716796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 10.0, 11.0, 13.0, 20.0, 18.0, 37.0, 38.0, 47.0, 60.0, 89.0, 84.0, 79.0, 86.0, 71.0, 66.0, 53.0, 43.0, 27.0, 26.0, 18.0, 12.0, 14.0, 14.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013608932495117188, -0.0013131499290466309, -0.001265406608581543, -0.001217663288116455, -0.0011699199676513672, -0.0011221766471862793, -0.0010744333267211914, -0.0010266900062561035, -0.0009789466857910156, -0.0009312033653259277, -0.0008834600448608398, -0.000835716724395752, -0.0007879734039306641, -0.0007402300834655762, -0.0006924867630004883, -0.0006447434425354004, -0.0005970001220703125, -0.0005492568016052246, -0.0005015134811401367, -0.00045377016067504883, -0.00040602684020996094, -0.00035828351974487305, -0.00031054019927978516, -0.00026279687881469727, -0.00021505355834960938, -0.00016731023788452148, -0.0001195669174194336, -7.18235969543457e-05, -2.4080276489257812e-05, 2.3663043975830078e-05, 7.140636444091797e-05, 0.00011914968490600586, 0.00016689300537109375, 0.00021463632583618164, 0.00026237964630126953, 0.0003101229667663574, 0.0003578662872314453, 0.0004056096076965332, 0.0004533529281616211, 0.000501096248626709, 0.0005488395690917969, 0.0005965828895568848, 0.0006443262100219727, 0.0006920695304870605, 0.0007398128509521484, 0.0007875561714172363, 0.0008352994918823242, 0.0008830428123474121, 0.0009307861328125, 0.0009785294532775879, 0.0010262727737426758, 0.0010740160942077637, 0.0011217594146728516, 0.0011695027351379395, 0.0012172460556030273, 0.0012649893760681152, 0.0013127326965332031, 0.001360476016998291, 0.001408219337463379, 0.0014559626579284668, 0.0015037059783935547, 0.0015514492988586426, 0.0015991926193237305, 0.0016469359397888184, 0.0016946792602539062]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 12.0, 10.0, 11.0, 15.0, 31.0, 24.0, 51.0, 47.0, 91.0, 122.0, 202.0, 370.0, 821.0, 26696.0, 1016323.0, 2344.0, 538.0, 278.0, 164.0, 111.0, 75.0, 40.0, 28.0, 31.0, 26.0, 11.0, 11.0, 8.0, 11.0, 6.0, 6.0, 8.0, 1.0, 5.0, 4.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.034088134765625, -0.03312230110168457, -0.03215646743774414, -0.03119063377380371, -0.03022480010986328, -0.02925896644592285, -0.028293132781982422, -0.027327299118041992, -0.026361465454101562, -0.025395631790161133, -0.024429798126220703, -0.023463964462280273, -0.022498130798339844, -0.021532297134399414, -0.020566463470458984, -0.019600629806518555, -0.018634796142578125, -0.017668962478637695, -0.016703128814697266, -0.015737295150756836, -0.014771461486816406, -0.013805627822875977, -0.012839794158935547, -0.011873960494995117, -0.010908126831054688, -0.009942293167114258, -0.008976459503173828, -0.008010625839233398, -0.007044792175292969, -0.006078958511352539, -0.005113124847412109, -0.00414729118347168, -0.00318145751953125, -0.0022156238555908203, -0.0012497901916503906, -0.00028395652770996094, 0.0006818771362304688, 0.0016477108001708984, 0.002613544464111328, 0.003579378128051758, 0.0045452117919921875, 0.005511045455932617, 0.006476879119873047, 0.0074427127838134766, 0.008408546447753906, 0.009374380111694336, 0.010340213775634766, 0.011306047439575195, 0.012271881103515625, 0.013237714767456055, 0.014203548431396484, 0.015169382095336914, 0.016135215759277344, 0.017101049423217773, 0.018066883087158203, 0.019032716751098633, 0.019998550415039062, 0.020964384078979492, 0.021930217742919922, 0.02289605140686035, 0.02386188507080078, 0.02482771873474121, 0.02579355239868164, 0.02675938606262207, 0.0277252197265625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 159.0, 706.0, 142.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.00998278521001339, -0.00981210544705391, -0.009641426615417004, -0.009470746852457523, -0.009300067089498043, -0.009129387326538563, -0.008958708494901657, -0.008788028731942177, -0.008617348968982697, -0.008446669206023216, -0.00827599037438631, -0.00810531061142683, -0.00793463084846735, -0.007763951551169157, -0.007593271788209677, -0.007422592490911484, -0.0072519127279520035, -0.0070812334306538105, -0.00691055366769433, -0.006739874370396137, -0.006569194607436657, -0.006398515310138464, -0.006227835547178984, -0.006057156249880791, -0.005886476952582598, -0.005715797655284405, -0.0055451178923249245, -0.0053744385950267315, -0.005203758832067251, -0.005033079534769058, -0.004862399771809578, -0.004691720474511385, -0.004521040245890617, -0.004350360948592424, -0.004179681185632944, -0.004009001888334751, -0.003838322125375271, -0.003667642595246434, -0.0034969630651175976, -0.0033262837678194046, -0.0031556044705212116, -0.002984924940392375, -0.0028142454102635384, -0.0026435658801347017, -0.002472886350005865, -0.0023022068198770285, -0.002131527289748192, -0.001960847992449999, -0.0017901682294905186, -0.001619488699361682, -0.0014488091692328453, -0.0012781296391040087, -0.001107450108975172, -0.0009367706370539963, -0.0007660911651328206, -0.000595411635003984, -0.00042473210487514734, -0.0002540525747463107, -8.337307372130454e-05, 8.730642730370164e-05, 0.00025798595743253827, 0.0004286654875613749, 0.0005993449594825506, 0.0007700244896113873, 0.0009407040197402239]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 4.0, 3.0, 8.0, 8.0, 9.0, 12.0, 11.0, 19.0, 20.0, 23.0, 24.0, 20.0, 23.0, 35.0, 24.0, 42.0, 37.0, 38.0, 38.0, 45.0, 33.0, 48.0, 37.0, 38.0, 49.0, 32.0, 40.0, 35.0, 26.0, 26.0, 29.0, 18.0, 20.0, 18.0, 16.0, 17.0, 15.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0006582736968994141, -0.0006378619000315666, -0.0006174501031637192, -0.0005970383062958717, -0.0005766265094280243, -0.0005562147125601768, -0.0005358029156923294, -0.000515391118824482, -0.0004949793219566345, -0.0004745675250887871, -0.00045415572822093964, -0.0004337439313530922, -0.00041333213448524475, -0.0003929203376173973, -0.00037250854074954987, -0.0003520967438817024, -0.000331684947013855, -0.00031127315014600754, -0.0002908613532781601, -0.00027044955641031265, -0.0002500377595424652, -0.00022962596267461777, -0.00020921416580677032, -0.00018880236893892288, -0.00016839057207107544, -0.000147978775203228, -0.00012756697833538055, -0.00010715518146753311, -8.674338459968567e-05, -6.633158773183823e-05, -4.5919790863990784e-05, -2.550799399614334e-05, -5.0961971282958984e-06, 1.5315599739551544e-05, 3.572739660739899e-05, 5.613919347524643e-05, 7.655099034309387e-05, 9.696278721094131e-05, 0.00011737458407878876, 0.0001377863809466362, 0.00015819817781448364, 0.00017860997468233109, 0.00019902177155017853, 0.00021943356841802597, 0.0002398453652858734, 0.00026025716215372086, 0.0002806689590215683, 0.00030108075588941574, 0.0003214925527572632, 0.0003419043496251106, 0.00036231614649295807, 0.0003827279433608055, 0.00040313974022865295, 0.0004235515370965004, 0.00044396333396434784, 0.0004643751308321953, 0.0004847869277000427, 0.0005051987245678902, 0.0005256105214357376, 0.000546022318303585, 0.0005664341151714325, 0.0005868459120392799, 0.0006072577089071274, 0.0006276695057749748, 0.0006480813026428223]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 8.0, 1.0, 9.0, 14.0, 13.0, 13.0, 31.0, 14.0, 24.0, 23.0, 25.0, 41.0, 38.0, 28.0, 36.0, 48.0, 33.0, 42.0, 37.0, 49.0, 38.0, 45.0, 38.0, 36.0, 29.0, 45.0, 34.0, 30.0, 25.0, 22.0, 20.0, 22.0, 19.0, 12.0, 13.0, 12.0, 7.0, 4.0, 10.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.958984375, -3.84307861328125, -3.7271728515625, -3.61126708984375, -3.495361328125, -3.37945556640625, -3.2635498046875, -3.14764404296875, -3.03173828125, -2.91583251953125, -2.7999267578125, -2.68402099609375, -2.568115234375, -2.45220947265625, -2.3363037109375, -2.22039794921875, -2.1044921875, -1.98858642578125, -1.8726806640625, -1.75677490234375, -1.640869140625, -1.52496337890625, -1.4090576171875, -1.29315185546875, -1.17724609375, -1.06134033203125, -0.9454345703125, -0.82952880859375, -0.713623046875, -0.59771728515625, -0.4818115234375, -0.36590576171875, -0.25, -0.13409423828125, -0.0181884765625, 0.09771728515625, 0.213623046875, 0.32952880859375, 0.4454345703125, 0.56134033203125, 0.67724609375, 0.79315185546875, 0.9090576171875, 1.02496337890625, 1.140869140625, 1.25677490234375, 1.3726806640625, 1.48858642578125, 1.6044921875, 1.72039794921875, 1.8363037109375, 1.95220947265625, 2.068115234375, 2.18402099609375, 2.2999267578125, 2.41583251953125, 2.53173828125, 2.64764404296875, 2.7635498046875, 2.87945556640625, 2.995361328125, 3.11126708984375, 3.2271728515625, 3.34307861328125, 3.458984375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 6.0, 10.0, 11.0, 12.0, 18.0, 29.0, 39.0, 65.0, 66.0, 101.0, 118.0, 176.0, 249.0, 344.0, 434.0, 675.0, 1351.0, 4172.0, 20602.0, 155244.0, 764980.0, 80845.0, 12870.0, 2876.0, 1091.0, 584.0, 441.0, 292.0, 233.0, 134.0, 110.0, 93.0, 65.0, 51.0, 46.0, 28.0, 22.0, 18.0, 11.0, 4.0, 11.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.0, -9.708984375, -9.41796875, -9.126953125, -8.8359375, -8.544921875, -8.25390625, -7.962890625, -7.671875, -7.380859375, -7.08984375, -6.798828125, -6.5078125, -6.216796875, -5.92578125, -5.634765625, -5.34375, -5.052734375, -4.76171875, -4.470703125, -4.1796875, -3.888671875, -3.59765625, -3.306640625, -3.015625, -2.724609375, -2.43359375, -2.142578125, -1.8515625, -1.560546875, -1.26953125, -0.978515625, -0.6875, -0.396484375, -0.10546875, 0.185546875, 0.4765625, 0.767578125, 1.05859375, 1.349609375, 1.640625, 1.931640625, 2.22265625, 2.513671875, 2.8046875, 3.095703125, 3.38671875, 3.677734375, 3.96875, 4.259765625, 4.55078125, 4.841796875, 5.1328125, 5.423828125, 5.71484375, 6.005859375, 6.296875, 6.587890625, 6.87890625, 7.169921875, 7.4609375, 7.751953125, 8.04296875, 8.333984375, 8.625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 3.0, 14.0, 16.0, 15.0, 18.0, 22.0, 16.0, 29.0, 32.0, 32.0, 42.0, 44.0, 50.0, 46.0, 64.0, 129.0, 367.0, 1508.0, 151.0, 79.0, 56.0, 49.0, 47.0, 37.0, 27.0, 31.0, 22.0, 16.0, 18.0, 11.0, 12.0, 10.0, 9.0, 10.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.4364013671875, -12.036865234375, -11.6373291015625, -11.23779296875, -10.8382568359375, -10.438720703125, -10.0391845703125, -9.6396484375, -9.2401123046875, -8.840576171875, -8.4410400390625, -8.04150390625, -7.6419677734375, -7.242431640625, -6.8428955078125, -6.443359375, -6.0438232421875, -5.644287109375, -5.2447509765625, -4.84521484375, -4.4456787109375, -4.046142578125, -3.6466064453125, -3.2470703125, -2.8475341796875, -2.447998046875, -2.0484619140625, -1.64892578125, -1.2493896484375, -0.849853515625, -0.4503173828125, -0.05078125, 0.3487548828125, 0.748291015625, 1.1478271484375, 1.54736328125, 1.9468994140625, 2.346435546875, 2.7459716796875, 3.1455078125, 3.5450439453125, 3.944580078125, 4.3441162109375, 4.74365234375, 5.1431884765625, 5.542724609375, 5.9422607421875, 6.341796875, 6.7413330078125, 7.140869140625, 7.5404052734375, 7.93994140625, 8.3394775390625, 8.739013671875, 9.1385498046875, 9.5380859375, 9.9376220703125, 10.337158203125, 10.7366943359375, 11.13623046875, 11.5357666015625, 11.935302734375, 12.3348388671875, 12.734375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 6.0, 13.0, 11.0, 17.0, 17.0, 17.0, 23.0, 29.0, 43.0, 50.0, 75.0, 106.0, 173.0, 287.0, 588.0, 2416.0, 90797.0, 3039312.0, 9318.0, 1192.0, 406.0, 211.0, 146.0, 100.0, 72.0, 43.0, 42.0, 36.0, 31.0, 20.0, 15.0, 15.0, 20.0, 18.0, 10.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.09912109375, -32.0732421875, -31.04736328125, -30.021484375, -28.99560546875, -27.9697265625, -26.94384765625, -25.91796875, -24.89208984375, -23.8662109375, -22.84033203125, -21.814453125, -20.78857421875, -19.7626953125, -18.73681640625, -17.7109375, -16.68505859375, -15.6591796875, -14.63330078125, -13.607421875, -12.58154296875, -11.5556640625, -10.52978515625, -9.50390625, -8.47802734375, -7.4521484375, -6.42626953125, -5.400390625, -4.37451171875, -3.3486328125, -2.32275390625, -1.296875, -0.27099609375, 0.7548828125, 1.78076171875, 2.806640625, 3.83251953125, 4.8583984375, 5.88427734375, 6.91015625, 7.93603515625, 8.9619140625, 9.98779296875, 11.013671875, 12.03955078125, 13.0654296875, 14.09130859375, 15.1171875, 16.14306640625, 17.1689453125, 18.19482421875, 19.220703125, 20.24658203125, 21.2724609375, 22.29833984375, 23.32421875, 24.35009765625, 25.3759765625, 26.40185546875, 27.427734375, 28.45361328125, 29.4794921875, 30.50537109375, 31.53125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 61.0, 278.0, 421.0, 200.0, 41.0, 7.0], "bins": [-79.4412612915039, -78.12487030029297, -76.80847930908203, -75.4920883178711, -74.17569732666016, -72.85929870605469, -71.54290771484375, -70.22651672363281, -68.91012573242188, -67.59373474121094, -66.27734375, -64.96095275878906, -63.64455795288086, -62.32816696166992, -61.011775970458984, -59.69538497924805, -58.37899398803711, -57.06260299682617, -55.746212005615234, -54.42981719970703, -53.113426208496094, -51.797035217285156, -50.48064422607422, -49.16425323486328, -47.847862243652344, -46.531471252441406, -45.21508026123047, -43.898685455322266, -42.58229446411133, -41.26590347290039, -39.94951248168945, -38.633121490478516, -37.31672668457031, -36.000335693359375, -34.68394470214844, -33.367549896240234, -32.0511589050293, -30.73476791381836, -29.418376922607422, -28.101985931396484, -26.785593032836914, -25.469202041625977, -24.152809143066406, -22.83641815185547, -21.52002716064453, -20.20363426208496, -18.887243270874023, -17.570850372314453, -16.254459381103516, -14.938067436218262, -13.621675491333008, -12.30528450012207, -10.988892555236816, -9.672500610351562, -8.356109619140625, -7.039717674255371, -5.723326206207275, -4.40693473815918, -3.090542793273926, -1.774151086807251, -0.45775938034057617, 0.8586325645446777, 2.1750240325927734, 3.491415500640869, 4.807807445526123]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 8.0, 4.0, 6.0, 9.0, 7.0, 11.0, 11.0, 12.0, 19.0, 18.0, 19.0, 24.0, 29.0, 31.0, 38.0, 40.0, 35.0, 40.0, 40.0, 42.0, 39.0, 39.0, 45.0, 42.0, 35.0, 44.0, 44.0, 30.0, 30.0, 42.0, 28.0, 18.0, 17.0, 19.0, 15.0, 20.0, 14.0, 10.0, 8.0, 11.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.759864807128906, -26.878202438354492, -25.996538162231445, -25.11487579345703, -24.233213424682617, -23.351551055908203, -22.469886779785156, -21.588224411010742, -20.706562042236328, -19.824899673461914, -18.943235397338867, -18.061573028564453, -17.17991065979004, -16.298248291015625, -15.416584014892578, -14.534921646118164, -13.653257369995117, -12.771594047546387, -11.889931678771973, -11.008268356323242, -10.126605987548828, -9.244942665100098, -8.363279342651367, -7.481616497039795, -6.599953651428223, -5.71829080581665, -4.836627960205078, -3.9549646377563477, -3.0733017921447754, -2.191638946533203, -1.3099756240844727, -0.4283127784729004, 0.4533500671386719, 1.3350130319595337, 2.2166759967803955, 3.098339080810547, 3.980001926422119, 4.861664772033691, 5.743328094482422, 6.624990940093994, 7.506653785705566, 8.388317108154297, 9.269979476928711, 10.151642799377441, 11.033306121826172, 11.914968490600586, 12.796631813049316, 13.678295135498047, 14.559957504272461, 15.441620826721191, 16.323284149169922, 17.204946517944336, 18.08660888671875, 18.968273162841797, 19.84993553161621, 20.731597900390625, 21.613262176513672, 22.494924545288086, 23.376588821411133, 24.258251190185547, 25.13991355895996, 26.021575927734375, 26.903240203857422, 27.784902572631836, 28.66656494140625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 5.0, 4.0, 11.0, 8.0, 14.0, 12.0, 8.0, 23.0, 28.0, 22.0, 26.0, 30.0, 32.0, 41.0, 39.0, 37.0, 40.0, 35.0, 49.0, 41.0, 43.0, 42.0, 36.0, 49.0, 33.0, 41.0, 31.0, 27.0, 31.0, 28.0, 15.0, 19.0, 19.0, 16.0, 9.0, 10.0, 17.0, 11.0, 6.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.876953125, -3.75433349609375, -3.6317138671875, -3.50909423828125, -3.386474609375, -3.26385498046875, -3.1412353515625, -3.01861572265625, -2.89599609375, -2.77337646484375, -2.6507568359375, -2.52813720703125, -2.405517578125, -2.28289794921875, -2.1602783203125, -2.03765869140625, -1.9150390625, -1.79241943359375, -1.6697998046875, -1.54718017578125, -1.424560546875, -1.30194091796875, -1.1793212890625, -1.05670166015625, -0.93408203125, -0.81146240234375, -0.6888427734375, -0.56622314453125, -0.443603515625, -0.32098388671875, -0.1983642578125, -0.07574462890625, 0.046875, 0.16949462890625, 0.2921142578125, 0.41473388671875, 0.537353515625, 0.65997314453125, 0.7825927734375, 0.90521240234375, 1.02783203125, 1.15045166015625, 1.2730712890625, 1.39569091796875, 1.518310546875, 1.64093017578125, 1.7635498046875, 1.88616943359375, 2.0087890625, 2.13140869140625, 2.2540283203125, 2.37664794921875, 2.499267578125, 2.62188720703125, 2.7445068359375, 2.86712646484375, 2.98974609375, 3.11236572265625, 3.2349853515625, 3.35760498046875, 3.480224609375, 3.60284423828125, 3.7254638671875, 3.84808349609375, 3.970703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 10.0, 10.0, 6.0, 10.0, 12.0, 19.0, 25.0, 27.0, 35.0, 44.0, 54.0, 75.0, 81.0, 120.0, 186.0, 252.0, 459.0, 1038.0, 5100.0, 53703.0, 606519.0, 2326709.0, 1072038.0, 114698.0, 9853.0, 1568.0, 570.0, 288.0, 182.0, 152.0, 92.0, 64.0, 64.0, 59.0, 42.0, 25.0, 27.0, 20.0, 11.0, 16.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.77801513671875, -6.5638427734375, -6.34967041015625, -6.135498046875, -5.92132568359375, -5.7071533203125, -5.49298095703125, -5.27880859375, -5.06463623046875, -4.8504638671875, -4.63629150390625, -4.422119140625, -4.20794677734375, -3.9937744140625, -3.77960205078125, -3.5654296875, -3.35125732421875, -3.1370849609375, -2.92291259765625, -2.708740234375, -2.49456787109375, -2.2803955078125, -2.06622314453125, -1.85205078125, -1.63787841796875, -1.4237060546875, -1.20953369140625, -0.995361328125, -0.78118896484375, -0.5670166015625, -0.35284423828125, -0.138671875, 0.07550048828125, 0.2896728515625, 0.50384521484375, 0.718017578125, 0.93218994140625, 1.1463623046875, 1.36053466796875, 1.57470703125, 1.78887939453125, 2.0030517578125, 2.21722412109375, 2.431396484375, 2.64556884765625, 2.8597412109375, 3.07391357421875, 3.2880859375, 3.50225830078125, 3.7164306640625, 3.93060302734375, 4.144775390625, 4.35894775390625, 4.5731201171875, 4.78729248046875, 5.00146484375, 5.21563720703125, 5.4298095703125, 5.64398193359375, 5.858154296875, 6.07232666015625, 6.2864990234375, 6.50067138671875, 6.71484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 14.0, 11.0, 23.0, 22.0, 31.0, 44.0, 69.0, 94.0, 108.0, 175.0, 244.0, 319.0, 372.0, 408.0, 427.0, 385.0, 344.0, 247.0, 211.0, 136.0, 108.0, 78.0, 60.0, 24.0, 23.0, 24.0, 16.0, 13.0, 6.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.6953125, -6.5205078125, -6.345703125, -6.1708984375, -5.99609375, -5.8212890625, -5.646484375, -5.4716796875, -5.296875, -5.1220703125, -4.947265625, -4.7724609375, -4.59765625, -4.4228515625, -4.248046875, -4.0732421875, -3.8984375, -3.7236328125, -3.548828125, -3.3740234375, -3.19921875, -3.0244140625, -2.849609375, -2.6748046875, -2.5, -2.3251953125, -2.150390625, -1.9755859375, -1.80078125, -1.6259765625, -1.451171875, -1.2763671875, -1.1015625, -0.9267578125, -0.751953125, -0.5771484375, -0.40234375, -0.2275390625, -0.052734375, 0.1220703125, 0.296875, 0.4716796875, 0.646484375, 0.8212890625, 0.99609375, 1.1708984375, 1.345703125, 1.5205078125, 1.6953125, 1.8701171875, 2.044921875, 2.2197265625, 2.39453125, 2.5693359375, 2.744140625, 2.9189453125, 3.09375, 3.2685546875, 3.443359375, 3.6181640625, 3.79296875, 3.9677734375, 4.142578125, 4.3173828125, 4.4921875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 3.0, 9.0, 17.0, 13.0, 27.0, 35.0, 53.0, 65.0, 119.0, 185.0, 289.0, 499.0, 1047.0, 3012.0, 29619.0, 1121585.0, 2940172.0, 89081.0, 5464.0, 1334.0, 617.0, 373.0, 200.0, 141.0, 106.0, 52.0, 44.0, 40.0, 25.0, 14.0, 12.0, 3.0, 7.0, 6.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4609375, -12.0023193359375, -11.543701171875, -11.0850830078125, -10.62646484375, -10.1678466796875, -9.709228515625, -9.2506103515625, -8.7919921875, -8.3333740234375, -7.874755859375, -7.4161376953125, -6.95751953125, -6.4989013671875, -6.040283203125, -5.5816650390625, -5.123046875, -4.6644287109375, -4.205810546875, -3.7471923828125, -3.28857421875, -2.8299560546875, -2.371337890625, -1.9127197265625, -1.4541015625, -0.9954833984375, -0.536865234375, -0.0782470703125, 0.38037109375, 0.8389892578125, 1.297607421875, 1.7562255859375, 2.21484375, 2.6734619140625, 3.132080078125, 3.5906982421875, 4.04931640625, 4.5079345703125, 4.966552734375, 5.4251708984375, 5.8837890625, 6.3424072265625, 6.801025390625, 7.2596435546875, 7.71826171875, 8.1768798828125, 8.635498046875, 9.0941162109375, 9.552734375, 10.0113525390625, 10.469970703125, 10.9285888671875, 11.38720703125, 11.8458251953125, 12.304443359375, 12.7630615234375, 13.2216796875, 13.6802978515625, 14.138916015625, 14.5975341796875, 15.05615234375, 15.5147705078125, 15.973388671875, 16.4320068359375, 16.890625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 70.0, 939.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-425.3030090332031, -416.13153076171875, -406.9600524902344, -397.78857421875, -388.6170959472656, -379.44561767578125, -370.2741394042969, -361.1026611328125, -351.9311828613281, -342.75970458984375, -333.5882263183594, -324.416748046875, -315.2452697753906, -306.07379150390625, -296.9023132324219, -287.7308349609375, -278.5593566894531, -269.38787841796875, -260.2164001464844, -251.044921875, -241.87344360351562, -232.70196533203125, -223.53048706054688, -214.3590087890625, -205.18753051757812, -196.01605224609375, -186.84457397460938, -177.673095703125, -168.50161743164062, -159.33013916015625, -150.15866088867188, -140.9871826171875, -131.815673828125, -122.64419555664062, -113.47271728515625, -104.30123901367188, -95.1297607421875, -85.95828247070312, -76.78680419921875, -67.61532592773438, -58.44384765625, -49.272369384765625, -40.10089111328125, -30.929412841796875, -21.7579345703125, -12.586456298828125, -3.41497802734375, 5.756500244140625, 14.927978515625, 24.099456787109375, 33.27093505859375, 42.442413330078125, 51.6138916015625, 60.785369873046875, 69.95684814453125, 79.12832641601562, 88.2998046875, 97.47128295898438, 106.64276123046875, 115.81423950195312, 124.9857177734375, 134.15719604492188, 143.32867431640625, 152.50015258789062, 161.671630859375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 11.0, 20.0, 8.0, 20.0, 22.0, 18.0, 32.0, 32.0, 38.0, 38.0, 26.0, 43.0, 41.0, 49.0, 57.0, 49.0, 50.0, 50.0, 58.0, 44.0, 34.0, 35.0, 39.0, 34.0, 25.0, 30.0, 13.0, 21.0, 17.0, 12.0, 7.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.179353713989258, -20.442554473876953, -19.70575523376465, -18.968955993652344, -18.23215675354004, -17.495357513427734, -16.75855827331543, -16.021759033203125, -15.28495979309082, -14.548160552978516, -13.811361312866211, -13.074562072753906, -12.337762832641602, -11.600963592529297, -10.864164352416992, -10.127365112304688, -9.390565872192383, -8.653766632080078, -7.916967391967773, -7.180168151855469, -6.443368911743164, -5.706569671630859, -4.969770431518555, -4.23297119140625, -3.4961719512939453, -2.7593727111816406, -2.022573471069336, -1.2857742309570312, -0.5489749908447266, 0.18782424926757812, 0.9246234893798828, 1.6614227294921875, 2.398223876953125, 3.1350231170654297, 3.8718223571777344, 4.608621597290039, 5.345420837402344, 6.082220077514648, 6.819019317626953, 7.555818557739258, 8.292617797851562, 9.029417037963867, 9.766216278076172, 10.503015518188477, 11.239814758300781, 11.976613998413086, 12.71341323852539, 13.450212478637695, 14.18701171875, 14.923810958862305, 15.66061019897461, 16.397409439086914, 17.13420867919922, 17.871007919311523, 18.607807159423828, 19.344606399536133, 20.081405639648438, 20.818204879760742, 21.555004119873047, 22.29180335998535, 23.028602600097656, 23.76540184020996, 24.502201080322266, 25.23900032043457, 25.975799560546875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 13.0, 16.0, 9.0, 21.0, 20.0, 22.0, 26.0, 38.0, 33.0, 35.0, 31.0, 29.0, 43.0, 32.0, 56.0, 42.0, 45.0, 42.0, 49.0, 38.0, 31.0, 41.0, 27.0, 24.0, 21.0, 33.0, 27.0, 25.0, 28.0, 19.0, 13.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.634765625, -3.513580322265625, -3.39239501953125, -3.271209716796875, -3.1500244140625, -3.028839111328125, -2.90765380859375, -2.786468505859375, -2.665283203125, -2.544097900390625, -2.42291259765625, -2.301727294921875, -2.1805419921875, -2.059356689453125, -1.93817138671875, -1.816986083984375, -1.69580078125, -1.574615478515625, -1.45343017578125, -1.332244873046875, -1.2110595703125, -1.089874267578125, -0.96868896484375, -0.847503662109375, -0.726318359375, -0.605133056640625, -0.48394775390625, -0.362762451171875, -0.2415771484375, -0.120391845703125, 0.00079345703125, 0.121978759765625, 0.2431640625, 0.364349365234375, 0.48553466796875, 0.606719970703125, 0.7279052734375, 0.849090576171875, 0.97027587890625, 1.091461181640625, 1.212646484375, 1.333831787109375, 1.45501708984375, 1.576202392578125, 1.6973876953125, 1.818572998046875, 1.93975830078125, 2.060943603515625, 2.18212890625, 2.303314208984375, 2.42449951171875, 2.545684814453125, 2.6668701171875, 2.788055419921875, 2.90924072265625, 3.030426025390625, 3.151611328125, 3.272796630859375, 3.39398193359375, 3.515167236328125, 3.6363525390625, 3.757537841796875, 3.87872314453125, 3.999908447265625, 4.12109375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 9.0, 22.0, 23.0, 56.0, 79.0, 81.0, 170.0, 268.0, 384.0, 680.0, 1040.0, 1692.0, 2773.0, 4503.0, 7607.0, 12930.0, 22494.0, 39809.0, 73337.0, 142832.0, 261754.0, 222556.0, 114686.0, 59715.0, 32911.0, 18773.0, 10863.0, 6522.0, 3784.0, 2360.0, 1431.0, 880.0, 569.0, 356.0, 216.0, 130.0, 93.0, 56.0, 42.0, 25.0, 20.0, 9.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4775390625, -0.4625396728515625, -0.447540283203125, -0.4325408935546875, -0.41754150390625, -0.4025421142578125, -0.387542724609375, -0.3725433349609375, -0.3575439453125, -0.3425445556640625, -0.327545166015625, -0.3125457763671875, -0.29754638671875, -0.2825469970703125, -0.267547607421875, -0.2525482177734375, -0.237548828125, -0.2225494384765625, -0.207550048828125, -0.1925506591796875, -0.17755126953125, -0.1625518798828125, -0.147552490234375, -0.1325531005859375, -0.1175537109375, -0.1025543212890625, -0.087554931640625, -0.0725555419921875, -0.05755615234375, -0.0425567626953125, -0.027557373046875, -0.0125579833984375, 0.00244140625, 0.0174407958984375, 0.032440185546875, 0.0474395751953125, 0.06243896484375, 0.0774383544921875, 0.092437744140625, 0.1074371337890625, 0.1224365234375, 0.1374359130859375, 0.152435302734375, 0.1674346923828125, 0.18243408203125, 0.1974334716796875, 0.212432861328125, 0.2274322509765625, 0.242431640625, 0.2574310302734375, 0.272430419921875, 0.2874298095703125, 0.30242919921875, 0.3174285888671875, 0.332427978515625, 0.3474273681640625, 0.3624267578125, 0.3774261474609375, 0.392425537109375, 0.4074249267578125, 0.42242431640625, 0.4374237060546875, 0.452423095703125, 0.4674224853515625, 0.482421875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 4.0, 11.0, 7.0, 16.0, 16.0, 18.0, 24.0, 26.0, 17.0, 24.0, 28.0, 42.0, 34.0, 38.0, 41.0, 40.0, 39.0, 44.0, 1071.0, 27.0, 47.0, 37.0, 43.0, 48.0, 36.0, 40.0, 28.0, 24.0, 32.0, 13.0, 18.0, 16.0, 12.0, 9.0, 6.0, 8.0, 4.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.576171875, -2.498870849609375, -2.42156982421875, -2.344268798828125, -2.2669677734375, -2.189666748046875, -2.11236572265625, -2.035064697265625, -1.957763671875, -1.880462646484375, -1.80316162109375, -1.725860595703125, -1.6485595703125, -1.571258544921875, -1.49395751953125, -1.416656494140625, -1.33935546875, -1.262054443359375, -1.18475341796875, -1.107452392578125, -1.0301513671875, -0.952850341796875, -0.87554931640625, -0.798248291015625, -0.720947265625, -0.643646240234375, -0.56634521484375, -0.489044189453125, -0.4117431640625, -0.334442138671875, -0.25714111328125, -0.179840087890625, -0.1025390625, -0.025238037109375, 0.05206298828125, 0.129364013671875, 0.2066650390625, 0.283966064453125, 0.36126708984375, 0.438568115234375, 0.515869140625, 0.593170166015625, 0.67047119140625, 0.747772216796875, 0.8250732421875, 0.902374267578125, 0.97967529296875, 1.056976318359375, 1.13427734375, 1.211578369140625, 1.28887939453125, 1.366180419921875, 1.4434814453125, 1.520782470703125, 1.59808349609375, 1.675384521484375, 1.752685546875, 1.829986572265625, 1.90728759765625, 1.984588623046875, 2.0618896484375, 2.139190673828125, 2.21649169921875, 2.293792724609375, 2.37109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 10.0, 10.0, 14.0, 11.0, 30.0, 49.0, 75.0, 90.0, 134.0, 178.0, 285.0, 445.0, 546.0, 841.0, 1210.0, 1668.0, 2529.0, 3754.0, 5523.0, 8190.0, 12372.0, 19052.0, 29228.0, 45948.0, 74117.0, 121006.0, 237182.0, 1189389.0, 126964.0, 77771.0, 48236.0, 30836.0, 20049.0, 12876.0, 8679.0, 5654.0, 3780.0, 2586.0, 1894.0, 1190.0, 857.0, 573.0, 382.0, 265.0, 185.0, 173.0, 112.0, 68.0, 32.0, 36.0, 16.0, 13.0, 13.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.28173828125, -0.27236175537109375, -0.2629852294921875, -0.25360870361328125, -0.244232177734375, -0.23485565185546875, -0.2254791259765625, -0.21610260009765625, -0.20672607421875, -0.19734954833984375, -0.1879730224609375, -0.17859649658203125, -0.169219970703125, -0.15984344482421875, -0.1504669189453125, -0.14109039306640625, -0.1317138671875, -0.12233734130859375, -0.1129608154296875, -0.10358428955078125, -0.094207763671875, -0.08483123779296875, -0.0754547119140625, -0.06607818603515625, -0.05670166015625, -0.04732513427734375, -0.0379486083984375, -0.02857208251953125, -0.019195556640625, -0.00981903076171875, -0.0004425048828125, 0.00893402099609375, 0.018310546875, 0.02768707275390625, 0.0370635986328125, 0.04644012451171875, 0.055816650390625, 0.06519317626953125, 0.0745697021484375, 0.08394622802734375, 0.09332275390625, 0.10269927978515625, 0.1120758056640625, 0.12145233154296875, 0.130828857421875, 0.14020538330078125, 0.1495819091796875, 0.15895843505859375, 0.1683349609375, 0.17771148681640625, 0.1870880126953125, 0.19646453857421875, 0.205841064453125, 0.21521759033203125, 0.2245941162109375, 0.23397064208984375, 0.24334716796875, 0.25272369384765625, 0.2621002197265625, 0.27147674560546875, 0.280853271484375, 0.29022979736328125, 0.2996063232421875, 0.30898284912109375, 0.318359375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 4.0, 7.0, 9.0, 12.0, 24.0, 30.0, 26.0, 39.0, 54.0, 86.0, 92.0, 84.0, 87.0, 87.0, 68.0, 48.0, 48.0, 39.0, 31.0, 22.0, 16.0, 14.0, 15.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 2.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0019969940185546875, -0.0019449293613433838, -0.00189286470413208, -0.0018408000469207764, -0.0017887353897094727, -0.001736670732498169, -0.0016846060752868652, -0.0016325414180755615, -0.0015804767608642578, -0.001528412103652954, -0.0014763474464416504, -0.0014242827892303467, -0.001372218132019043, -0.0013201534748077393, -0.0012680888175964355, -0.0012160241603851318, -0.0011639595031738281, -0.0011118948459625244, -0.0010598301887512207, -0.001007765531539917, -0.0009557008743286133, -0.0009036362171173096, -0.0008515715599060059, -0.0007995069026947021, -0.0007474422454833984, -0.0006953775882720947, -0.000643312931060791, -0.0005912482738494873, -0.0005391836166381836, -0.0004871189594268799, -0.00043505430221557617, -0.00038298964500427246, -0.00033092498779296875, -0.00027886033058166504, -0.00022679567337036133, -0.00017473101615905762, -0.0001226663589477539, -7.06017017364502e-05, -1.8537044525146484e-05, 3.3527612686157227e-05, 8.559226989746094e-05, 0.00013765692710876465, 0.00018972158432006836, 0.00024178624153137207, 0.0002938508987426758, 0.0003459155559539795, 0.0003979802131652832, 0.0004500448703765869, 0.0005021095275878906, 0.0005541741847991943, 0.000606238842010498, 0.0006583034992218018, 0.0007103681564331055, 0.0007624328136444092, 0.0008144974708557129, 0.0008665621280670166, 0.0009186267852783203, 0.000970691442489624, 0.0010227560997009277, 0.0010748207569122314, 0.0011268854141235352, 0.0011789500713348389, 0.0012310147285461426, 0.0012830793857574463, 0.00133514404296875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 11.0, 7.0, 9.0, 14.0, 16.0, 20.0, 35.0, 29.0, 53.0, 62.0, 106.0, 143.0, 246.0, 464.0, 1309.0, 636225.0, 407332.0, 1233.0, 478.0, 253.0, 150.0, 89.0, 69.0, 50.0, 39.0, 18.0, 18.0, 16.0, 9.0, 8.0, 6.0, 6.0, 2.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.025115966796875, -0.024148941040039062, -0.023181915283203125, -0.022214889526367188, -0.02124786376953125, -0.020280838012695312, -0.019313812255859375, -0.018346786499023438, -0.0173797607421875, -0.016412734985351562, -0.015445709228515625, -0.014478683471679688, -0.01351165771484375, -0.012544631958007812, -0.011577606201171875, -0.010610580444335938, -0.0096435546875, -0.008676528930664062, -0.007709503173828125, -0.0067424774169921875, -0.00577545166015625, -0.0048084259033203125, -0.003841400146484375, -0.0028743743896484375, -0.0019073486328125, -0.0009403228759765625, 2.6702880859375e-05, 0.0009937286376953125, 0.00196075439453125, 0.0029277801513671875, 0.003894805908203125, 0.0048618316650390625, 0.005828857421875, 0.0067958831787109375, 0.007762908935546875, 0.008729934692382812, 0.00969696044921875, 0.010663986206054688, 0.011631011962890625, 0.012598037719726562, 0.0135650634765625, 0.014532089233398438, 0.015499114990234375, 0.016466140747070312, 0.01743316650390625, 0.018400192260742188, 0.019367218017578125, 0.020334243774414062, 0.02130126953125, 0.022268295288085938, 0.023235321044921875, 0.024202346801757812, 0.02516937255859375, 0.026136398315429688, 0.027103424072265625, 0.028070449829101562, 0.0290374755859375, 0.030004501342773438, 0.030971527099609375, 0.03193855285644531, 0.03290557861328125, 0.03387260437011719, 0.034839630126953125, 0.03580665588378906, 0.036773681640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 502.0, 514.0, 1.0, 0.0, 1.0], "bins": [-0.024783875793218613, -0.024370895698666573, -0.023957915604114532, -0.02354493737220764, -0.0231319572776556, -0.02271897718310356, -0.02230599708855152, -0.02189301699399948, -0.02148003876209259, -0.02106705866754055, -0.02065407857298851, -0.02024110034108162, -0.01982812024652958, -0.01941514015197754, -0.0190021600574255, -0.01858917996287346, -0.018176201730966568, -0.017763221636414528, -0.017350241541862488, -0.016937263309955597, -0.016524283215403557, -0.016111303120851517, -0.015698323026299477, -0.015285343863070011, -0.014872362837195396, -0.014459382742643356, -0.01404640357941389, -0.01363342348486185, -0.013220444321632385, -0.012807464227080345, -0.012394484132528305, -0.01198150496929884, -0.011568525806069374, -0.011155545711517334, -0.010742566548287868, -0.010329586453735828, -0.009916607290506363, -0.009503627195954323, -0.009090647101402283, -0.008677667938172817, -0.008264688774943352, -0.007851708680391312, -0.007438729517161846, -0.007025749422609806, -0.006612770259380341, -0.0061997901648283005, -0.005786810535937548, -0.005373830907046795, -0.004960850812494755, -0.004547871183604002, -0.004134891554713249, -0.0037219116929918528, -0.0033089320641011, -0.002895952435210347, -0.0024829725734889507, -0.002069992944598198, -0.0016570135485380888, -0.001244033919647336, -0.0008310541743412614, -0.00041807442903518677, -5.094800144433975e-06, 0.0004078848287463188, 0.0008208646904677153, 0.001233844319358468, 0.0016468239482492208]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 17.0, 21.0, 27.0, 24.0, 40.0, 36.0, 39.0, 55.0, 60.0, 52.0, 58.0, 58.0, 55.0, 65.0, 50.0, 54.0, 43.0, 44.0, 38.0, 38.0, 16.0, 19.0, 14.0, 14.0, 12.0, 9.0, 8.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007422566413879395, -0.0007111327722668648, -0.0006800089031457901, -0.0006488850340247154, -0.0006177611649036407, -0.0005866372957825661, -0.0005555134266614914, -0.0005243895575404167, -0.000493265688419342, -0.00046214181929826736, -0.0004310179501771927, -0.000399894081056118, -0.00036877021193504333, -0.00033764634281396866, -0.000306522473692894, -0.0002753986045718193, -0.00024427473545074463, -0.00021315086632966995, -0.00018202699720859528, -0.0001509031280875206, -0.00011977925896644592, -8.865538984537125e-05, -5.753152072429657e-05, -2.6407651603221893e-05, 4.716217517852783e-06, 3.584008663892746e-05, 6.696395576000214e-05, 9.808782488107681e-05, 0.0001292116940021515, 0.00016033556312322617, 0.00019145943224430084, 0.00022258330136537552, 0.0002537071704864502, 0.00028483103960752487, 0.00031595490872859955, 0.0003470787778496742, 0.0003782026469707489, 0.0004093265160918236, 0.00044045038521289825, 0.00047157425433397293, 0.0005026981234550476, 0.0005338219925761223, 0.000564945861697197, 0.0005960697308182716, 0.0006271935999393463, 0.000658317469060421, 0.0006894413381814957, 0.0007205652073025703, 0.000751689076423645, 0.0007828129455447197, 0.0008139368146657944, 0.000845060683786869, 0.0008761845529079437, 0.0009073084220290184, 0.0009384322911500931, 0.0009695561602711678, 0.0010006800293922424, 0.001031803898513317, 0.0010629277676343918, 0.0010940516367554665, 0.0011251755058765411, 0.0011562993749976158, 0.0011874232441186905, 0.0012185471132397652, 0.0012496709823608398]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 13.0, 16.0, 9.0, 21.0, 20.0, 23.0, 25.0, 38.0, 33.0, 35.0, 31.0, 29.0, 43.0, 32.0, 56.0, 42.0, 45.0, 42.0, 49.0, 38.0, 31.0, 41.0, 27.0, 24.0, 21.0, 33.0, 27.0, 25.0, 28.0, 19.0, 13.0, 8.0, 5.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.634765625, -3.513580322265625, -3.39239501953125, -3.271209716796875, -3.1500244140625, -3.028839111328125, -2.90765380859375, -2.786468505859375, -2.665283203125, -2.544097900390625, -2.42291259765625, -2.301727294921875, -2.1805419921875, -2.059356689453125, -1.93817138671875, -1.816986083984375, -1.69580078125, -1.574615478515625, -1.45343017578125, -1.332244873046875, -1.2110595703125, -1.089874267578125, -0.96868896484375, -0.847503662109375, -0.726318359375, -0.605133056640625, -0.48394775390625, -0.362762451171875, -0.2415771484375, -0.120391845703125, 0.00079345703125, 0.121978759765625, 0.2431640625, 0.364349365234375, 0.48553466796875, 0.606719970703125, 0.7279052734375, 0.849090576171875, 0.97027587890625, 1.091461181640625, 1.212646484375, 1.333831787109375, 1.45501708984375, 1.576202392578125, 1.6973876953125, 1.818572998046875, 1.93975830078125, 2.060943603515625, 2.18212890625, 2.303314208984375, 2.42449951171875, 2.545684814453125, 2.6668701171875, 2.788055419921875, 2.90924072265625, 3.030426025390625, 3.151611328125, 3.272796630859375, 3.39398193359375, 3.515167236328125, 3.6363525390625, 3.757537841796875, 3.87872314453125, 3.999908447265625, 4.12109375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 5.0, 19.0, 18.0, 16.0, 32.0, 40.0, 43.0, 53.0, 79.0, 125.0, 155.0, 250.0, 370.0, 654.0, 1318.0, 2651.0, 6146.0, 16214.0, 44478.0, 124309.0, 357191.0, 321648.0, 108313.0, 39231.0, 14285.0, 5495.0, 2393.0, 1169.0, 625.0, 349.0, 250.0, 193.0, 107.0, 87.0, 65.0, 44.0, 27.0, 26.0, 19.0, 11.0, 14.0, 3.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.3836669921875, -4.232177734375, -4.0806884765625, -3.92919921875, -3.7777099609375, -3.626220703125, -3.4747314453125, -3.3232421875, -3.1717529296875, -3.020263671875, -2.8687744140625, -2.71728515625, -2.5657958984375, -2.414306640625, -2.2628173828125, -2.111328125, -1.9598388671875, -1.808349609375, -1.6568603515625, -1.50537109375, -1.3538818359375, -1.202392578125, -1.0509033203125, -0.8994140625, -0.7479248046875, -0.596435546875, -0.4449462890625, -0.29345703125, -0.1419677734375, 0.009521484375, 0.1610107421875, 0.3125, 0.4639892578125, 0.615478515625, 0.7669677734375, 0.91845703125, 1.0699462890625, 1.221435546875, 1.3729248046875, 1.5244140625, 1.6759033203125, 1.827392578125, 1.9788818359375, 2.13037109375, 2.2818603515625, 2.433349609375, 2.5848388671875, 2.736328125, 2.8878173828125, 3.039306640625, 3.1907958984375, 3.34228515625, 3.4937744140625, 3.645263671875, 3.7967529296875, 3.9482421875, 4.0997314453125, 4.251220703125, 4.4027099609375, 4.55419921875, 4.7056884765625, 4.857177734375, 5.0086669921875, 5.16015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 11.0, 3.0, 4.0, 14.0, 12.0, 23.0, 25.0, 14.0, 30.0, 26.0, 29.0, 34.0, 35.0, 38.0, 57.0, 60.0, 79.0, 139.0, 325.0, 1380.0, 160.0, 98.0, 84.0, 42.0, 41.0, 32.0, 35.0, 28.0, 30.0, 25.0, 15.0, 13.0, 17.0, 14.0, 14.0, 9.0, 6.0, 6.0, 5.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.953125, -10.6112060546875, -10.269287109375, -9.9273681640625, -9.58544921875, -9.2435302734375, -8.901611328125, -8.5596923828125, -8.2177734375, -7.8758544921875, -7.533935546875, -7.1920166015625, -6.85009765625, -6.5081787109375, -6.166259765625, -5.8243408203125, -5.482421875, -5.1405029296875, -4.798583984375, -4.4566650390625, -4.11474609375, -3.7728271484375, -3.430908203125, -3.0889892578125, -2.7470703125, -2.4051513671875, -2.063232421875, -1.7213134765625, -1.37939453125, -1.0374755859375, -0.695556640625, -0.3536376953125, -0.01171875, 0.3302001953125, 0.672119140625, 1.0140380859375, 1.35595703125, 1.6978759765625, 2.039794921875, 2.3817138671875, 2.7236328125, 3.0655517578125, 3.407470703125, 3.7493896484375, 4.09130859375, 4.4332275390625, 4.775146484375, 5.1170654296875, 5.458984375, 5.8009033203125, 6.142822265625, 6.4847412109375, 6.82666015625, 7.1685791015625, 7.510498046875, 7.8524169921875, 8.1943359375, 8.5362548828125, 8.878173828125, 9.2200927734375, 9.56201171875, 9.9039306640625, 10.245849609375, 10.5877685546875, 10.9296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 3.0, 8.0, 16.0, 10.0, 14.0, 14.0, 20.0, 32.0, 46.0, 69.0, 100.0, 156.0, 242.0, 343.0, 617.0, 1314.0, 12657.0, 2546385.0, 575466.0, 5600.0, 1070.0, 532.0, 335.0, 204.0, 125.0, 81.0, 67.0, 44.0, 28.0, 20.0, 19.0, 16.0, 9.0, 7.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.734375, -24.00439453125, -23.2744140625, -22.54443359375, -21.814453125, -21.08447265625, -20.3544921875, -19.62451171875, -18.89453125, -18.16455078125, -17.4345703125, -16.70458984375, -15.974609375, -15.24462890625, -14.5146484375, -13.78466796875, -13.0546875, -12.32470703125, -11.5947265625, -10.86474609375, -10.134765625, -9.40478515625, -8.6748046875, -7.94482421875, -7.21484375, -6.48486328125, -5.7548828125, -5.02490234375, -4.294921875, -3.56494140625, -2.8349609375, -2.10498046875, -1.375, -0.64501953125, 0.0849609375, 0.81494140625, 1.544921875, 2.27490234375, 3.0048828125, 3.73486328125, 4.46484375, 5.19482421875, 5.9248046875, 6.65478515625, 7.384765625, 8.11474609375, 8.8447265625, 9.57470703125, 10.3046875, 11.03466796875, 11.7646484375, 12.49462890625, 13.224609375, 13.95458984375, 14.6845703125, 15.41455078125, 16.14453125, 16.87451171875, 17.6044921875, 18.33447265625, 19.064453125, 19.79443359375, 20.5244140625, 21.25439453125, 21.984375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 866.0, 147.0, 0.0, 1.0], "bins": [-409.0158996582031, -402.2823486328125, -395.548828125, -388.8152770996094, -382.08172607421875, -375.34820556640625, -368.6146545410156, -361.881103515625, -355.1475830078125, -348.4140319824219, -341.6805114746094, -334.94696044921875, -328.2134094238281, -321.4798889160156, -314.746337890625, -308.0127868652344, -301.27923583984375, -294.5456848144531, -287.8121643066406, -281.07861328125, -274.3450622558594, -267.6115417480469, -260.87799072265625, -254.14443969726562, -247.41091918945312, -240.67738342285156, -233.94383239746094, -227.21029663085938, -220.4767608642578, -213.7432098388672, -207.00967407226562, -200.276123046875, -193.5426025390625, -186.80906677246094, -180.0755157470703, -173.34197998046875, -166.6084442138672, -159.87489318847656, -153.141357421875, -146.40780639648438, -139.6742706298828, -132.94073486328125, -126.20719146728516, -119.47364807128906, -112.74010467529297, -106.00656127929688, -99.27302551269531, -92.53948211669922, -85.80593872070312, -79.07239532470703, -72.33885955810547, -65.60531616210938, -58.87177276611328, -52.13823318481445, -45.404693603515625, -38.67115020751953, -31.937610626220703, -25.204069137573242, -18.47052764892578, -11.736988067626953, -5.003446578979492, 1.7300949096679688, 8.463634490966797, 15.19717788696289, 21.93071746826172]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 4.0, 8.0, 6.0, 8.0, 9.0, 17.0, 21.0, 22.0, 16.0, 18.0, 29.0, 34.0, 27.0, 45.0, 52.0, 42.0, 40.0, 36.0, 47.0, 33.0, 35.0, 34.0, 47.0, 49.0, 37.0, 37.0, 31.0, 34.0, 31.0, 24.0, 19.0, 23.0, 9.0, 15.0, 9.0, 13.0, 9.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.19073486328125, -21.389434814453125, -20.588134765625, -19.786834716796875, -18.98553466796875, -18.184234619140625, -17.3829345703125, -16.581634521484375, -15.78033447265625, -14.979034423828125, -14.177734375, -13.376434326171875, -12.57513427734375, -11.773834228515625, -10.9725341796875, -10.171234130859375, -9.369935035705566, -8.568634986877441, -7.767334938049316, -6.966034889221191, -6.164734840393066, -5.3634352684021, -4.562135219573975, -3.7608351707458496, -2.9595351219177246, -2.1582350730895996, -1.3569351434707642, -0.5556352138519287, 0.2456648349761963, 1.0469646453857422, 1.8482646942138672, 2.649564743041992, 3.450864791870117, 4.252164840698242, 5.053464889526367, 5.854764938354492, 6.656064987182617, 7.457364559173584, 8.258665084838867, 9.059965133666992, 9.861265182495117, 10.662565231323242, 11.463865280151367, 12.265165328979492, 13.066465377807617, 13.867765426635742, 14.669065475463867, 15.470365524291992, 16.271663665771484, 17.07296371459961, 17.874263763427734, 18.67556381225586, 19.476863861083984, 20.27816390991211, 21.079463958740234, 21.88076400756836, 22.682064056396484, 23.48336410522461, 24.284664154052734, 25.08596420288086, 25.887264251708984, 26.68856430053711, 27.489864349365234, 28.29116439819336, 29.092464447021484]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 3.0, 7.0, 9.0, 7.0, 8.0, 17.0, 8.0, 17.0, 22.0, 24.0, 29.0, 32.0, 26.0, 32.0, 31.0, 25.0, 24.0, 32.0, 36.0, 39.0, 38.0, 52.0, 46.0, 39.0, 46.0, 34.0, 37.0, 34.0, 32.0, 25.0, 26.0, 30.0, 20.0, 11.0, 17.0, 12.0, 12.0, 20.0, 8.0, 4.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.6953125, -3.58001708984375, -3.4647216796875, -3.34942626953125, -3.234130859375, -3.11883544921875, -3.0035400390625, -2.88824462890625, -2.77294921875, -2.65765380859375, -2.5423583984375, -2.42706298828125, -2.311767578125, -2.19647216796875, -2.0811767578125, -1.96588134765625, -1.8505859375, -1.73529052734375, -1.6199951171875, -1.50469970703125, -1.389404296875, -1.27410888671875, -1.1588134765625, -1.04351806640625, -0.92822265625, -0.81292724609375, -0.6976318359375, -0.58233642578125, -0.467041015625, -0.35174560546875, -0.2364501953125, -0.12115478515625, -0.005859375, 0.10943603515625, 0.2247314453125, 0.34002685546875, 0.455322265625, 0.57061767578125, 0.6859130859375, 0.80120849609375, 0.91650390625, 1.03179931640625, 1.1470947265625, 1.26239013671875, 1.377685546875, 1.49298095703125, 1.6082763671875, 1.72357177734375, 1.8388671875, 1.95416259765625, 2.0694580078125, 2.18475341796875, 2.300048828125, 2.41534423828125, 2.5306396484375, 2.64593505859375, 2.76123046875, 2.87652587890625, 2.9918212890625, 3.10711669921875, 3.222412109375, 3.33770751953125, 3.4530029296875, 3.56829833984375, 3.68359375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 1.0, 5.0, 9.0, 15.0, 17.0, 7.0, 14.0, 19.0, 24.0, 17.0, 46.0, 70.0, 85.0, 111.0, 178.0, 300.0, 540.0, 1125.0, 3056.0, 9378.0, 34499.0, 137553.0, 499112.0, 1257892.0, 1379562.0, 624721.0, 181679.0, 45762.0, 11850.0, 3692.0, 1393.0, 616.0, 313.0, 177.0, 115.0, 86.0, 59.0, 46.0, 37.0, 20.0, 15.0, 12.0, 17.0, 8.0, 11.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.29632568359375, -3.1746826171875, -3.05303955078125, -2.931396484375, -2.80975341796875, -2.6881103515625, -2.56646728515625, -2.44482421875, -2.32318115234375, -2.2015380859375, -2.07989501953125, -1.958251953125, -1.83660888671875, -1.7149658203125, -1.59332275390625, -1.4716796875, -1.35003662109375, -1.2283935546875, -1.10675048828125, -0.985107421875, -0.86346435546875, -0.7418212890625, -0.62017822265625, -0.49853515625, -0.37689208984375, -0.2552490234375, -0.13360595703125, -0.011962890625, 0.10968017578125, 0.2313232421875, 0.35296630859375, 0.474609375, 0.59625244140625, 0.7178955078125, 0.83953857421875, 0.961181640625, 1.08282470703125, 1.2044677734375, 1.32611083984375, 1.44775390625, 1.56939697265625, 1.6910400390625, 1.81268310546875, 1.934326171875, 2.05596923828125, 2.1776123046875, 2.29925537109375, 2.4208984375, 2.54254150390625, 2.6641845703125, 2.78582763671875, 2.907470703125, 3.02911376953125, 3.1507568359375, 3.27239990234375, 3.39404296875, 3.51568603515625, 3.6373291015625, 3.75897216796875, 3.880615234375, 4.00225830078125, 4.1239013671875, 4.24554443359375, 4.3671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 6.0, 13.0, 23.0, 34.0, 32.0, 48.0, 70.0, 97.0, 154.0, 204.0, 340.0, 399.0, 488.0, 491.0, 445.0, 354.0, 265.0, 157.0, 127.0, 73.0, 69.0, 46.0, 27.0, 23.0, 18.0, 13.0, 8.0, 15.0, 4.0, 2.0, 2.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.27239990234375, -5.0916748046875, -4.91094970703125, -4.730224609375, -4.54949951171875, -4.3687744140625, -4.18804931640625, -4.00732421875, -3.82659912109375, -3.6458740234375, -3.46514892578125, -3.284423828125, -3.10369873046875, -2.9229736328125, -2.74224853515625, -2.5615234375, -2.38079833984375, -2.2000732421875, -2.01934814453125, -1.838623046875, -1.65789794921875, -1.4771728515625, -1.29644775390625, -1.11572265625, -0.93499755859375, -0.7542724609375, -0.57354736328125, -0.392822265625, -0.21209716796875, -0.0313720703125, 0.14935302734375, 0.330078125, 0.51080322265625, 0.6915283203125, 0.87225341796875, 1.052978515625, 1.23370361328125, 1.4144287109375, 1.59515380859375, 1.77587890625, 1.95660400390625, 2.1373291015625, 2.31805419921875, 2.498779296875, 2.67950439453125, 2.8602294921875, 3.04095458984375, 3.2216796875, 3.40240478515625, 3.5831298828125, 3.76385498046875, 3.944580078125, 4.12530517578125, 4.3060302734375, 4.48675537109375, 4.66748046875, 4.84820556640625, 5.0289306640625, 5.20965576171875, 5.390380859375, 5.57110595703125, 5.7518310546875, 5.93255615234375, 6.11328125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 11.0, 16.0, 11.0, 16.0, 20.0, 32.0, 34.0, 44.0, 75.0, 120.0, 146.0, 243.0, 510.0, 1101.0, 3298.0, 13664.0, 75624.0, 629399.0, 2748834.0, 625096.0, 76205.0, 13946.0, 3560.0, 1030.0, 487.0, 264.0, 144.0, 103.0, 71.0, 55.0, 35.0, 21.0, 14.0, 15.0, 11.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.10546875, -6.85614013671875, -6.6068115234375, -6.35748291015625, -6.108154296875, -5.85882568359375, -5.6094970703125, -5.36016845703125, -5.11083984375, -4.86151123046875, -4.6121826171875, -4.36285400390625, -4.113525390625, -3.86419677734375, -3.6148681640625, -3.36553955078125, -3.1162109375, -2.86688232421875, -2.6175537109375, -2.36822509765625, -2.118896484375, -1.86956787109375, -1.6202392578125, -1.37091064453125, -1.12158203125, -0.87225341796875, -0.6229248046875, -0.37359619140625, -0.124267578125, 0.12506103515625, 0.3743896484375, 0.62371826171875, 0.873046875, 1.12237548828125, 1.3717041015625, 1.62103271484375, 1.870361328125, 2.11968994140625, 2.3690185546875, 2.61834716796875, 2.86767578125, 3.11700439453125, 3.3663330078125, 3.61566162109375, 3.864990234375, 4.11431884765625, 4.3636474609375, 4.61297607421875, 4.8623046875, 5.11163330078125, 5.3609619140625, 5.61029052734375, 5.859619140625, 6.10894775390625, 6.3582763671875, 6.60760498046875, 6.85693359375, 7.10626220703125, 7.3555908203125, 7.60491943359375, 7.854248046875, 8.10357666015625, 8.3529052734375, 8.60223388671875, 8.8515625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 17.0, 62.0, 174.0, 331.0, 286.0, 109.0, 25.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.522146224975586, -18.76357650756836, -17.0050048828125, -15.246435165405273, -13.487865447998047, -11.729294776916504, -9.970724105834961, -8.212154388427734, -6.453583717346191, -4.695013523101807, -2.9364430904388428, -1.177872657775879, 0.5806975364685059, 2.3392677307128906, 4.097838401794434, 5.85640811920166, 7.614978790283203, 9.373549461364746, 11.132119178771973, 12.890689849853516, 14.649259567260742, 16.40782928466797, 18.166400909423828, 19.924970626831055, 21.68354034423828, 23.442110061645508, 25.200681686401367, 26.959251403808594, 28.71782112121582, 30.476390838623047, 32.234962463378906, 33.9935302734375, 35.75210189819336, 37.51067352294922, 39.26924133300781, 41.02781295776367, 42.78638458251953, 44.544952392578125, 46.303524017333984, 48.062095642089844, 49.82066345214844, 51.5792350769043, 53.33780288696289, 55.09637451171875, 56.85494613647461, 58.6135139465332, 60.37208557128906, 62.130653381347656, 63.88922882080078, 65.64779663085938, 67.4063720703125, 69.1649398803711, 70.92350769042969, 72.68208312988281, 74.4406509399414, 76.19921875, 77.9577865600586, 79.71635437011719, 81.47492980957031, 83.2334976196289, 84.9920654296875, 86.75064086914062, 88.50920867919922, 90.26777648925781, 92.02635192871094]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 12.0, 11.0, 14.0, 13.0, 16.0, 11.0, 25.0, 25.0, 35.0, 30.0, 36.0, 30.0, 35.0, 33.0, 40.0, 32.0, 39.0, 38.0, 43.0, 36.0, 35.0, 41.0, 40.0, 28.0, 26.0, 25.0, 24.0, 20.0, 26.0, 22.0, 18.0, 15.0, 13.0, 10.0, 5.0, 13.0, 13.0, 7.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-16.554866790771484, -16.042278289794922, -15.529691696166992, -15.01710319519043, -14.504515647888184, -13.991928100585938, -13.479340553283691, -12.966753005981445, -12.454164505004883, -11.941576957702637, -11.42898941040039, -10.916400909423828, -10.403813362121582, -9.891225814819336, -9.37863826751709, -8.866050720214844, -8.353463172912598, -7.840875625610352, -7.328287601470947, -6.815700054168701, -6.303112030029297, -5.790524482727051, -5.277936935424805, -4.765349388122559, -4.252761363983154, -3.740173578262329, -3.227585792541504, -2.714998245239258, -2.2024104595184326, -1.6898226737976074, -1.1772351264953613, -0.6646473407745361, -0.15205955505371094, 0.3605281710624695, 0.8731158971786499, 1.3857035636901855, 1.8982913494110107, 2.410879135131836, 2.923466682434082, 3.4360544681549072, 3.9486422538757324, 4.4612298011779785, 4.973817825317383, 5.486405372619629, 5.998992919921875, 6.511580944061279, 7.024168491363525, 7.53675651550293, 8.049344062805176, 8.561931610107422, 9.074519157409668, 9.587106704711914, 10.099695205688477, 10.612282752990723, 11.124870300292969, 11.637457847595215, 12.150045394897461, 12.662632942199707, 13.175220489501953, 13.687808990478516, 14.200396537780762, 14.712984085083008, 15.225571632385254, 15.7381591796875, 16.250747680664062]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 9.0, 11.0, 10.0, 19.0, 11.0, 19.0, 22.0, 16.0, 18.0, 30.0, 26.0, 32.0, 28.0, 27.0, 49.0, 28.0, 36.0, 48.0, 46.0, 44.0, 41.0, 39.0, 34.0, 46.0, 29.0, 32.0, 26.0, 26.0, 22.0, 24.0, 27.0, 21.0, 25.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.931640625, -3.819183349609375, -3.70672607421875, -3.594268798828125, -3.4818115234375, -3.369354248046875, -3.25689697265625, -3.144439697265625, -3.031982421875, -2.919525146484375, -2.80706787109375, -2.694610595703125, -2.5821533203125, -2.469696044921875, -2.35723876953125, -2.244781494140625, -2.13232421875, -2.019866943359375, -1.90740966796875, -1.794952392578125, -1.6824951171875, -1.570037841796875, -1.45758056640625, -1.345123291015625, -1.232666015625, -1.120208740234375, -1.00775146484375, -0.895294189453125, -0.7828369140625, -0.670379638671875, -0.55792236328125, -0.445465087890625, -0.3330078125, -0.220550537109375, -0.10809326171875, 0.004364013671875, 0.1168212890625, 0.229278564453125, 0.34173583984375, 0.454193115234375, 0.566650390625, 0.679107666015625, 0.79156494140625, 0.904022216796875, 1.0164794921875, 1.128936767578125, 1.24139404296875, 1.353851318359375, 1.46630859375, 1.578765869140625, 1.69122314453125, 1.803680419921875, 1.9161376953125, 2.028594970703125, 2.14105224609375, 2.253509521484375, 2.365966796875, 2.478424072265625, 2.59088134765625, 2.703338623046875, 2.8157958984375, 2.928253173828125, 3.04071044921875, 3.153167724609375, 3.265625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 9.0, 21.0, 33.0, 33.0, 52.0, 62.0, 85.0, 138.0, 201.0, 282.0, 462.0, 685.0, 996.0, 1428.0, 2222.0, 3274.0, 4930.0, 7561.0, 11269.0, 17392.0, 26774.0, 41979.0, 66920.0, 109831.0, 175003.0, 203299.0, 139047.0, 85698.0, 52881.0, 33208.0, 21415.0, 14000.0, 9116.0, 5970.0, 4026.0, 2638.0, 1816.0, 1206.0, 839.0, 598.0, 330.0, 297.0, 180.0, 110.0, 77.0, 53.0, 30.0, 28.0, 18.0, 17.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.3671875, -0.3558006286621094, -0.34441375732421875, -0.3330268859863281, -0.3216400146484375, -0.3102531433105469, -0.29886627197265625, -0.2874794006347656, -0.276092529296875, -0.2647056579589844, -0.25331878662109375, -0.24193191528320312, -0.2305450439453125, -0.21915817260742188, -0.20777130126953125, -0.19638442993164062, -0.18499755859375, -0.17361068725585938, -0.16222381591796875, -0.15083694458007812, -0.1394500732421875, -0.12806320190429688, -0.11667633056640625, -0.10528945922851562, -0.093902587890625, -0.08251571655273438, -0.07112884521484375, -0.059741973876953125, -0.0483551025390625, -0.036968231201171875, -0.02558135986328125, -0.014194488525390625, -0.0028076171875, 0.008579254150390625, 0.01996612548828125, 0.031352996826171875, 0.0427398681640625, 0.054126739501953125, 0.06551361083984375, 0.07690048217773438, 0.088287353515625, 0.09967422485351562, 0.11106109619140625, 0.12244796752929688, 0.1338348388671875, 0.14522171020507812, 0.15660858154296875, 0.16799545288085938, 0.17938232421875, 0.19076919555664062, 0.20215606689453125, 0.21354293823242188, 0.2249298095703125, 0.23631668090820312, 0.24770355224609375, 0.2590904235839844, 0.270477294921875, 0.2818641662597656, 0.29325103759765625, 0.3046379089355469, 0.3160247802734375, 0.3274116516113281, 0.33879852294921875, 0.3501853942871094, 0.361572265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 2.0, 2.0, 6.0, 2.0, 6.0, 4.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 13.0, 25.0, 22.0, 16.0, 32.0, 22.0, 18.0, 32.0, 32.0, 24.0, 42.0, 31.0, 43.0, 48.0, 37.0, 1053.0, 41.0, 35.0, 36.0, 32.0, 43.0, 42.0, 28.0, 30.0, 14.0, 23.0, 22.0, 23.0, 14.0, 17.0, 21.0, 14.0, 9.0, 6.0, 11.0, 10.0, 7.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.171875, -2.103302001953125, -2.03472900390625, -1.966156005859375, -1.8975830078125, -1.829010009765625, -1.76043701171875, -1.691864013671875, -1.623291015625, -1.554718017578125, -1.48614501953125, -1.417572021484375, -1.3489990234375, -1.280426025390625, -1.21185302734375, -1.143280029296875, -1.07470703125, -1.006134033203125, -0.93756103515625, -0.868988037109375, -0.8004150390625, -0.731842041015625, -0.66326904296875, -0.594696044921875, -0.526123046875, -0.457550048828125, -0.38897705078125, -0.320404052734375, -0.2518310546875, -0.183258056640625, -0.11468505859375, -0.046112060546875, 0.0224609375, 0.091033935546875, 0.15960693359375, 0.228179931640625, 0.2967529296875, 0.365325927734375, 0.43389892578125, 0.502471923828125, 0.571044921875, 0.639617919921875, 0.70819091796875, 0.776763916015625, 0.8453369140625, 0.913909912109375, 0.98248291015625, 1.051055908203125, 1.11962890625, 1.188201904296875, 1.25677490234375, 1.325347900390625, 1.3939208984375, 1.462493896484375, 1.53106689453125, 1.599639892578125, 1.668212890625, 1.736785888671875, 1.80535888671875, 1.873931884765625, 1.9425048828125, 2.011077880859375, 2.07965087890625, 2.148223876953125, 2.216796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 4.0, 16.0, 19.0, 30.0, 36.0, 61.0, 82.0, 152.0, 199.0, 270.0, 404.0, 574.0, 894.0, 1239.0, 1896.0, 2771.0, 3919.0, 5859.0, 8866.0, 13365.0, 20080.0, 30572.0, 47548.0, 76707.0, 127398.0, 1220707.0, 213047.0, 118933.0, 71664.0, 44847.0, 28792.0, 18385.0, 12168.0, 8187.0, 5470.0, 3714.0, 2541.0, 1694.0, 1217.0, 872.0, 590.0, 418.0, 323.0, 189.0, 116.0, 99.0, 64.0, 47.0, 29.0, 19.0, 11.0, 9.0, 9.0, 2.0, 3.0, 1.0, 6.0], "bins": [-0.31591796875, -0.3063240051269531, -0.29673004150390625, -0.2871360778808594, -0.2775421142578125, -0.2679481506347656, -0.25835418701171875, -0.24876022338867188, -0.239166259765625, -0.22957229614257812, -0.21997833251953125, -0.21038436889648438, -0.2007904052734375, -0.19119644165039062, -0.18160247802734375, -0.17200851440429688, -0.16241455078125, -0.15282058715820312, -0.14322662353515625, -0.13363265991210938, -0.1240386962890625, -0.11444473266601562, -0.10485076904296875, -0.09525680541992188, -0.085662841796875, -0.07606887817382812, -0.06647491455078125, -0.056880950927734375, -0.0472869873046875, -0.037693023681640625, -0.02809906005859375, -0.018505096435546875, -0.0089111328125, 0.000682830810546875, 0.01027679443359375, 0.019870758056640625, 0.0294647216796875, 0.039058685302734375, 0.04865264892578125, 0.058246612548828125, 0.067840576171875, 0.07743453979492188, 0.08702850341796875, 0.09662246704101562, 0.1062164306640625, 0.11581039428710938, 0.12540435791015625, 0.13499832153320312, 0.14459228515625, 0.15418624877929688, 0.16378021240234375, 0.17337417602539062, 0.1829681396484375, 0.19256210327148438, 0.20215606689453125, 0.21175003051757812, 0.221343994140625, 0.23093795776367188, 0.24053192138671875, 0.2501258850097656, 0.2597198486328125, 0.2693138122558594, 0.27890777587890625, 0.2885017395019531, 0.298095703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 9.0, 11.0, 14.0, 15.0, 28.0, 20.0, 24.0, 53.0, 51.0, 66.0, 88.0, 99.0, 87.0, 80.0, 86.0, 53.0, 51.0, 29.0, 30.0, 24.0, 17.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018062591552734375, -0.0017526894807815552, -0.0016991198062896729, -0.0016455501317977905, -0.0015919804573059082, -0.0015384107828140259, -0.0014848411083221436, -0.0014312714338302612, -0.001377701759338379, -0.0013241320848464966, -0.0012705624103546143, -0.001216992735862732, -0.0011634230613708496, -0.0011098533868789673, -0.001056283712387085, -0.0010027140378952026, -0.0009491443634033203, -0.000895574688911438, -0.0008420050144195557, -0.0007884353399276733, -0.000734865665435791, -0.0006812959909439087, -0.0006277263164520264, -0.000574156641960144, -0.0005205869674682617, -0.0004670172929763794, -0.00041344761848449707, -0.00035987794399261475, -0.0003063082695007324, -0.0002527385950088501, -0.00019916892051696777, -0.00014559924602508545, -9.202957153320312e-05, -3.84598970413208e-05, 1.5109777450561523e-05, 6.867945194244385e-05, 0.00012224912643432617, 0.0001758188009262085, 0.00022938847541809082, 0.00028295814990997314, 0.00033652782440185547, 0.0003900974988937378, 0.0004436671733856201, 0.0004972368478775024, 0.0005508065223693848, 0.0006043761968612671, 0.0006579458713531494, 0.0007115155458450317, 0.0007650852203369141, 0.0008186548948287964, 0.0008722245693206787, 0.000925794243812561, 0.0009793639183044434, 0.0010329335927963257, 0.001086503267288208, 0.0011400729417800903, 0.0011936426162719727, 0.001247212290763855, 0.0013007819652557373, 0.0013543516397476196, 0.001407921314239502, 0.0014614909887313843, 0.0015150606632232666, 0.001568630337715149, 0.0016222000122070312]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 9.0, 6.0, 3.0, 9.0, 10.0, 4.0, 12.0, 21.0, 31.0, 46.0, 78.0, 87.0, 123.0, 188.0, 325.0, 622.0, 3442.0, 1014472.0, 27127.0, 862.0, 350.0, 221.0, 139.0, 86.0, 62.0, 48.0, 36.0, 27.0, 29.0, 12.0, 4.0, 9.0, 3.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281524658203125, -0.027170896530151367, -0.026189327239990234, -0.0252077579498291, -0.02422618865966797, -0.023244619369506836, -0.022263050079345703, -0.02128148078918457, -0.020299911499023438, -0.019318342208862305, -0.018336772918701172, -0.01735520362854004, -0.016373634338378906, -0.015392065048217773, -0.01441049575805664, -0.013428926467895508, -0.012447357177734375, -0.011465787887573242, -0.01048421859741211, -0.009502649307250977, -0.008521080017089844, -0.007539510726928711, -0.006557941436767578, -0.005576372146606445, -0.0045948028564453125, -0.0036132335662841797, -0.002631664276123047, -0.001650094985961914, -0.0006685256958007812, 0.00031304359436035156, 0.0012946128845214844, 0.002276182174682617, 0.00325775146484375, 0.004239320755004883, 0.005220890045166016, 0.0062024593353271484, 0.007184028625488281, 0.008165597915649414, 0.009147167205810547, 0.01012873649597168, 0.011110305786132812, 0.012091875076293945, 0.013073444366455078, 0.014055013656616211, 0.015036582946777344, 0.016018152236938477, 0.01699972152709961, 0.017981290817260742, 0.018962860107421875, 0.019944429397583008, 0.02092599868774414, 0.021907567977905273, 0.022889137268066406, 0.02387070655822754, 0.024852275848388672, 0.025833845138549805, 0.026815414428710938, 0.02779698371887207, 0.028778553009033203, 0.029760122299194336, 0.03074169158935547, 0.0317232608795166, 0.032704830169677734, 0.03368639945983887, 0.03466796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 34.0, 964.0, 20.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.022569013759493828, -0.022176243364810944, -0.02178347110748291, -0.021390700712800026, -0.02099793031811714, -0.02060515806078911, -0.020212387666106224, -0.01981961727142334, -0.019426845014095306, -0.019034074619412422, -0.01864130236208439, -0.018248531967401505, -0.01785576157271862, -0.017462989315390587, -0.017070218920707703, -0.01667744852602482, -0.016284678131341934, -0.01589190773665905, -0.015499136410653591, -0.015106365084648132, -0.014713593758642673, -0.01432082336395979, -0.01392805203795433, -0.013535281643271446, -0.013142509385943413, -0.012749738059937954, -0.01235696766525507, -0.011964196339249611, -0.011571425013244152, -0.011178654618561268, -0.010785883292555809, -0.010393112897872925, -0.010000341571867466, -0.009607570245862007, -0.009214799851179123, -0.008822028525173664, -0.008429257199168205, -0.008036486804485321, -0.007643715478479862, -0.007250944618135691, -0.006858173292130232, -0.00646540243178606, -0.0060726311057806015, -0.00567986024543643, -0.0052870893850922585, -0.0048943180590868, -0.004501547198742628, -0.004108776338398457, -0.0037160052452236414, -0.0033232341520488262, -0.0029304632917046547, -0.0025376921985298395, -0.0021449211053550243, -0.0017521502450108528, -0.0013593791518360376, -0.0009666082914918661, -0.0005738371983170509, -0.00018106619245372713, 0.00021170481340959668, 0.000604475848376751, 0.0009972468251362443, 0.0013900178018957376, 0.0017827888950705528, 0.0021755597554147243, 0.0025683308485895395]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 8.0, 9.0, 14.0, 15.0, 18.0, 24.0, 24.0, 27.0, 27.0, 37.0, 47.0, 47.0, 49.0, 61.0, 55.0, 54.0, 55.0, 45.0, 50.0, 46.0, 51.0, 42.0, 36.0, 35.0, 16.0, 19.0, 18.0, 15.0, 13.0, 8.0, 12.0, 2.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007165670394897461, -0.0006863139569759369, -0.0006560608744621277, -0.0006258077919483185, -0.0005955547094345093, -0.0005653016269207001, -0.0005350485444068909, -0.0005047954618930817, -0.00047454237937927246, -0.00044428929686546326, -0.00041403621435165405, -0.00038378313183784485, -0.00035353004932403564, -0.00032327696681022644, -0.00029302388429641724, -0.00026277080178260803, -0.00023251771926879883, -0.00020226463675498962, -0.00017201155424118042, -0.00014175847172737122, -0.00011150538921356201, -8.125230669975281e-05, -5.0999224185943604e-05, -2.07461416721344e-05, 9.506940841674805e-06, 3.976002335548401e-05, 7.001310586929321e-05, 0.00010026618838310242, 0.00013051927089691162, 0.00016077235341072083, 0.00019102543592453003, 0.00022127851843833923, 0.00025153160095214844, 0.00028178468346595764, 0.00031203776597976685, 0.00034229084849357605, 0.00037254393100738525, 0.00040279701352119446, 0.00043305009603500366, 0.00046330317854881287, 0.0004935562610626221, 0.0005238093435764313, 0.0005540624260902405, 0.0005843155086040497, 0.0006145685911178589, 0.0006448216736316681, 0.0006750747561454773, 0.0007053278386592865, 0.0007355809211730957, 0.0007658340036869049, 0.0007960870862007141, 0.0008263401687145233, 0.0008565932512283325, 0.0008868463337421417, 0.0009170994162559509, 0.0009473524987697601, 0.0009776055812835693, 0.0010078586637973785, 0.0010381117463111877, 0.001068364828824997, 0.0010986179113388062, 0.0011288709938526154, 0.0011591240763664246, 0.0011893771588802338, 0.001219630241394043]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 9.0, 11.0, 10.0, 19.0, 11.0, 19.0, 22.0, 16.0, 18.0, 30.0, 26.0, 32.0, 28.0, 27.0, 49.0, 28.0, 36.0, 48.0, 46.0, 44.0, 41.0, 39.0, 34.0, 46.0, 29.0, 32.0, 26.0, 26.0, 22.0, 24.0, 27.0, 21.0, 25.0, 12.0, 13.0, 10.0, 6.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0], "bins": [-3.931640625, -3.819183349609375, -3.70672607421875, -3.594268798828125, -3.4818115234375, -3.369354248046875, -3.25689697265625, -3.144439697265625, -3.031982421875, -2.919525146484375, -2.80706787109375, -2.694610595703125, -2.5821533203125, -2.469696044921875, -2.35723876953125, -2.244781494140625, -2.13232421875, -2.019866943359375, -1.90740966796875, -1.794952392578125, -1.6824951171875, -1.570037841796875, -1.45758056640625, -1.345123291015625, -1.232666015625, -1.120208740234375, -1.00775146484375, -0.895294189453125, -0.7828369140625, -0.670379638671875, -0.55792236328125, -0.445465087890625, -0.3330078125, -0.220550537109375, -0.10809326171875, 0.004364013671875, 0.1168212890625, 0.229278564453125, 0.34173583984375, 0.454193115234375, 0.566650390625, 0.679107666015625, 0.79156494140625, 0.904022216796875, 1.0164794921875, 1.128936767578125, 1.24139404296875, 1.353851318359375, 1.46630859375, 1.578765869140625, 1.69122314453125, 1.803680419921875, 1.9161376953125, 2.028594970703125, 2.14105224609375, 2.253509521484375, 2.365966796875, 2.478424072265625, 2.59088134765625, 2.703338623046875, 2.8157958984375, 2.928253173828125, 3.04071044921875, 3.153167724609375, 3.265625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 10.0, 4.0, 5.0, 6.0, 8.0, 19.0, 22.0, 30.0, 38.0, 52.0, 91.0, 109.0, 112.0, 198.0, 226.0, 370.0, 602.0, 881.0, 1691.0, 3680.0, 9505.0, 28119.0, 88644.0, 253098.0, 374371.0, 190155.0, 62864.0, 19993.0, 6944.0, 2870.0, 1372.0, 808.0, 480.0, 293.0, 237.0, 169.0, 120.0, 91.0, 68.0, 58.0, 33.0, 27.0, 26.0, 16.0, 16.0, 10.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.22821044921875, -4.0736083984375, -3.91900634765625, -3.764404296875, -3.60980224609375, -3.4552001953125, -3.30059814453125, -3.14599609375, -2.99139404296875, -2.8367919921875, -2.68218994140625, -2.527587890625, -2.37298583984375, -2.2183837890625, -2.06378173828125, -1.9091796875, -1.75457763671875, -1.5999755859375, -1.44537353515625, -1.290771484375, -1.13616943359375, -0.9815673828125, -0.82696533203125, -0.67236328125, -0.51776123046875, -0.3631591796875, -0.20855712890625, -0.053955078125, 0.10064697265625, 0.2552490234375, 0.40985107421875, 0.564453125, 0.71905517578125, 0.8736572265625, 1.02825927734375, 1.182861328125, 1.33746337890625, 1.4920654296875, 1.64666748046875, 1.80126953125, 1.95587158203125, 2.1104736328125, 2.26507568359375, 2.419677734375, 2.57427978515625, 2.7288818359375, 2.88348388671875, 3.0380859375, 3.19268798828125, 3.3472900390625, 3.50189208984375, 3.656494140625, 3.81109619140625, 3.9656982421875, 4.12030029296875, 4.27490234375, 4.42950439453125, 4.5841064453125, 4.73870849609375, 4.893310546875, 5.04791259765625, 5.2025146484375, 5.35711669921875, 5.51171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 17.0, 10.0, 18.0, 11.0, 16.0, 25.0, 27.0, 30.0, 40.0, 50.0, 46.0, 70.0, 91.0, 131.0, 267.0, 1384.0, 223.0, 122.0, 86.0, 55.0, 45.0, 42.0, 35.0, 31.0, 36.0, 18.0, 24.0, 14.0, 15.0, 8.0, 11.0, 8.0, 16.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.1875, -9.85107421875, -9.5146484375, -9.17822265625, -8.841796875, -8.50537109375, -8.1689453125, -7.83251953125, -7.49609375, -7.15966796875, -6.8232421875, -6.48681640625, -6.150390625, -5.81396484375, -5.4775390625, -5.14111328125, -4.8046875, -4.46826171875, -4.1318359375, -3.79541015625, -3.458984375, -3.12255859375, -2.7861328125, -2.44970703125, -2.11328125, -1.77685546875, -1.4404296875, -1.10400390625, -0.767578125, -0.43115234375, -0.0947265625, 0.24169921875, 0.578125, 0.91455078125, 1.2509765625, 1.58740234375, 1.923828125, 2.26025390625, 2.5966796875, 2.93310546875, 3.26953125, 3.60595703125, 3.9423828125, 4.27880859375, 4.615234375, 4.95166015625, 5.2880859375, 5.62451171875, 5.9609375, 6.29736328125, 6.6337890625, 6.97021484375, 7.306640625, 7.64306640625, 7.9794921875, 8.31591796875, 8.65234375, 8.98876953125, 9.3251953125, 9.66162109375, 9.998046875, 10.33447265625, 10.6708984375, 11.00732421875, 11.34375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 4.0, 7.0, 12.0, 13.0, 16.0, 16.0, 22.0, 39.0, 43.0, 52.0, 87.0, 93.0, 131.0, 208.0, 307.0, 455.0, 816.0, 1640.0, 14688.0, 2214064.0, 900653.0, 8863.0, 1447.0, 649.0, 395.0, 272.0, 185.0, 129.0, 90.0, 81.0, 57.0, 48.0, 27.0, 29.0, 17.0, 14.0, 9.0, 1.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.6875, -21.083740234375, -20.47998046875, -19.876220703125, -19.2724609375, -18.668701171875, -18.06494140625, -17.461181640625, -16.857421875, -16.253662109375, -15.64990234375, -15.046142578125, -14.4423828125, -13.838623046875, -13.23486328125, -12.631103515625, -12.02734375, -11.423583984375, -10.81982421875, -10.216064453125, -9.6123046875, -9.008544921875, -8.40478515625, -7.801025390625, -7.197265625, -6.593505859375, -5.98974609375, -5.385986328125, -4.7822265625, -4.178466796875, -3.57470703125, -2.970947265625, -2.3671875, -1.763427734375, -1.15966796875, -0.555908203125, 0.0478515625, 0.651611328125, 1.25537109375, 1.859130859375, 2.462890625, 3.066650390625, 3.67041015625, 4.274169921875, 4.8779296875, 5.481689453125, 6.08544921875, 6.689208984375, 7.29296875, 7.896728515625, 8.50048828125, 9.104248046875, 9.7080078125, 10.311767578125, 10.91552734375, 11.519287109375, 12.123046875, 12.726806640625, 13.33056640625, 13.934326171875, 14.5380859375, 15.141845703125, 15.74560546875, 16.349365234375, 16.953125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [5.0, 24.0, 87.0, 299.0, 373.0, 176.0, 42.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.076804161071777, -4.662458896636963, -3.2481138706207275, -1.8337688446044922, -0.41942358016967773, 0.9949216842651367, 2.409266471862793, 3.8236122131347656, 5.237957000732422, 6.652302265167236, 8.06664752960205, 9.480992317199707, 10.89533805847168, 12.309682846069336, 13.724027633666992, 15.138373374938965, 16.552719116210938, 17.967063903808594, 19.38140869140625, 20.795753479003906, 22.210100173950195, 23.62444496154785, 25.038789749145508, 26.453136444091797, 27.86747932434082, 29.281824111938477, 30.696168899536133, 32.11051559448242, 33.52486038208008, 34.939205169677734, 36.35354995727539, 37.76789474487305, 39.1822395324707, 40.59658432006836, 42.010929107666016, 43.42527389526367, 44.83961868286133, 46.25396728515625, 47.668312072753906, 49.08265686035156, 50.49700164794922, 51.911346435546875, 53.32569122314453, 54.74003601074219, 56.154380798339844, 57.5687255859375, 58.983070373535156, 60.39741897583008, 61.81175994873047, 63.226104736328125, 64.64044952392578, 66.05479431152344, 67.4691390991211, 68.88348388671875, 70.2978286743164, 71.71217346191406, 73.12652587890625, 74.5408706665039, 75.95521545410156, 77.36956024169922, 78.78390502929688, 80.19824981689453, 81.61259460449219, 83.02693939208984, 84.4412841796875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 6.0, 12.0, 15.0, 11.0, 10.0, 14.0, 24.0, 21.0, 24.0, 26.0, 34.0, 33.0, 32.0, 39.0, 41.0, 48.0, 45.0, 41.0, 51.0, 40.0, 39.0, 39.0, 45.0, 29.0, 30.0, 29.0, 26.0, 32.0, 34.0, 18.0, 21.0, 16.0, 13.0, 13.0, 13.0, 11.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.459896087646484, -18.735986709594727, -18.01207733154297, -17.288166046142578, -16.56425666809082, -15.840347290039062, -15.116437911987305, -14.392528533935547, -13.668618202209473, -12.944708824157715, -12.22079849243164, -11.496889114379883, -10.772979736328125, -10.04906940460205, -9.325160026550293, -8.601249694824219, -7.877340316772461, -7.153430461883545, -6.429520606994629, -5.705611228942871, -4.981701374053955, -4.257791519165039, -3.5338821411132812, -2.8099722862243652, -2.086062431335449, -1.3621526956558228, -0.6382429599761963, 0.08566665649414062, 0.8095765113830566, 1.5334863662719727, 2.2573957443237305, 2.9813055992126465, 3.7052154541015625, 4.4291253089904785, 5.1530351638793945, 5.876944541931152, 6.600854396820068, 7.324764251708984, 8.048673629760742, 8.7725830078125, 9.496493339538574, 10.220402717590332, 10.944313049316406, 11.668222427368164, 12.392131805419922, 13.116042137145996, 13.839951515197754, 14.563861846923828, 15.287771224975586, 16.011680603027344, 16.7355899810791, 17.45949935913086, 18.18341064453125, 18.907320022583008, 19.631229400634766, 20.355138778686523, 21.07904815673828, 21.80295753479004, 22.526866912841797, 23.250778198242188, 23.974687576293945, 24.698596954345703, 25.42250633239746, 26.14641571044922, 26.87032699584961]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 8.0, 9.0, 6.0, 9.0, 12.0, 14.0, 18.0, 24.0, 30.0, 21.0, 22.0, 27.0, 27.0, 26.0, 39.0, 35.0, 47.0, 45.0, 46.0, 40.0, 36.0, 33.0, 41.0, 36.0, 40.0, 30.0, 35.0, 33.0, 34.0, 31.0, 20.0, 18.0, 20.0, 12.0, 7.0, 13.0, 11.0, 8.0, 4.0, 8.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.7734375, -3.66082763671875, -3.5482177734375, -3.43560791015625, -3.322998046875, -3.21038818359375, -3.0977783203125, -2.98516845703125, -2.87255859375, -2.75994873046875, -2.6473388671875, -2.53472900390625, -2.422119140625, -2.30950927734375, -2.1968994140625, -2.08428955078125, -1.9716796875, -1.85906982421875, -1.7464599609375, -1.63385009765625, -1.521240234375, -1.40863037109375, -1.2960205078125, -1.18341064453125, -1.07080078125, -0.95819091796875, -0.8455810546875, -0.73297119140625, -0.620361328125, -0.50775146484375, -0.3951416015625, -0.28253173828125, -0.169921875, -0.05731201171875, 0.0552978515625, 0.16790771484375, 0.280517578125, 0.39312744140625, 0.5057373046875, 0.61834716796875, 0.73095703125, 0.84356689453125, 0.9561767578125, 1.06878662109375, 1.181396484375, 1.29400634765625, 1.4066162109375, 1.51922607421875, 1.6318359375, 1.74444580078125, 1.8570556640625, 1.96966552734375, 2.082275390625, 2.19488525390625, 2.3074951171875, 2.42010498046875, 2.53271484375, 2.64532470703125, 2.7579345703125, 2.87054443359375, 2.983154296875, 3.09576416015625, 3.2083740234375, 3.32098388671875, 3.43359375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 14.0, 7.0, 5.0, 10.0, 19.0, 19.0, 23.0, 34.0, 37.0, 34.0, 51.0, 82.0, 110.0, 139.0, 177.0, 257.0, 305.0, 398.0, 2056.0, 3478874.0, 709041.0, 977.0, 353.0, 306.0, 236.0, 141.0, 139.0, 104.0, 65.0, 37.0, 42.0, 48.0, 33.0, 18.0, 17.0, 11.0, 8.0, 8.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.155517578125, -27.10791015625, -26.060302734375, -25.0126953125, -23.965087890625, -22.91748046875, -21.869873046875, -20.822265625, -19.774658203125, -18.72705078125, -17.679443359375, -16.6318359375, -15.584228515625, -14.53662109375, -13.489013671875, -12.44140625, -11.393798828125, -10.34619140625, -9.298583984375, -8.2509765625, -7.203369140625, -6.15576171875, -5.108154296875, -4.060546875, -3.012939453125, -1.96533203125, -0.917724609375, 0.1298828125, 1.177490234375, 2.22509765625, 3.272705078125, 4.3203125, 5.367919921875, 6.41552734375, 7.463134765625, 8.5107421875, 9.558349609375, 10.60595703125, 11.653564453125, 12.701171875, 13.748779296875, 14.79638671875, 15.843994140625, 16.8916015625, 17.939208984375, 18.98681640625, 20.034423828125, 21.08203125, 22.129638671875, 23.17724609375, 24.224853515625, 25.2724609375, 26.320068359375, 27.36767578125, 28.415283203125, 29.462890625, 30.510498046875, 31.55810546875, 32.605712890625, 33.6533203125, 34.700927734375, 35.74853515625, 36.796142578125, 37.84375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 7.0, 19.0, 19.0, 31.0, 26.0, 52.0, 64.0, 81.0, 120.0, 183.0, 270.0, 324.0, 451.0, 536.0, 516.0, 343.0, 272.0, 178.0, 152.0, 101.0, 77.0, 61.0, 44.0, 31.0, 13.0, 17.0, 18.0, 13.0, 11.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.4337158203125, -4.254150390625, -4.0745849609375, -3.89501953125, -3.7154541015625, -3.535888671875, -3.3563232421875, -3.1767578125, -2.9971923828125, -2.817626953125, -2.6380615234375, -2.45849609375, -2.2789306640625, -2.099365234375, -1.9197998046875, -1.740234375, -1.5606689453125, -1.381103515625, -1.2015380859375, -1.02197265625, -0.8424072265625, -0.662841796875, -0.4832763671875, -0.3037109375, -0.1241455078125, 0.055419921875, 0.2349853515625, 0.41455078125, 0.5941162109375, 0.773681640625, 0.9532470703125, 1.1328125, 1.3123779296875, 1.491943359375, 1.6715087890625, 1.85107421875, 2.0306396484375, 2.210205078125, 2.3897705078125, 2.5693359375, 2.7489013671875, 2.928466796875, 3.1080322265625, 3.28759765625, 3.4671630859375, 3.646728515625, 3.8262939453125, 4.005859375, 4.1854248046875, 4.364990234375, 4.5445556640625, 4.72412109375, 4.9036865234375, 5.083251953125, 5.2628173828125, 5.4423828125, 5.6219482421875, 5.801513671875, 5.9810791015625, 6.16064453125, 6.3402099609375, 6.519775390625, 6.6993408203125, 6.87890625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 3.0, 6.0, 9.0, 15.0, 20.0, 27.0, 33.0, 49.0, 71.0, 113.0, 224.0, 537.0, 3630.0, 321413.0, 3832417.0, 33664.0, 1268.0, 335.0, 150.0, 68.0, 55.0, 30.0, 37.0, 23.0, 14.0, 20.0, 9.0, 10.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.71875, -24.968505859375, -24.21826171875, -23.468017578125, -22.7177734375, -21.967529296875, -21.21728515625, -20.467041015625, -19.716796875, -18.966552734375, -18.21630859375, -17.466064453125, -16.7158203125, -15.965576171875, -15.21533203125, -14.465087890625, -13.71484375, -12.964599609375, -12.21435546875, -11.464111328125, -10.7138671875, -9.963623046875, -9.21337890625, -8.463134765625, -7.712890625, -6.962646484375, -6.21240234375, -5.462158203125, -4.7119140625, -3.961669921875, -3.21142578125, -2.461181640625, -1.7109375, -0.960693359375, -0.21044921875, 0.539794921875, 1.2900390625, 2.040283203125, 2.79052734375, 3.540771484375, 4.291015625, 5.041259765625, 5.79150390625, 6.541748046875, 7.2919921875, 8.042236328125, 8.79248046875, 9.542724609375, 10.29296875, 11.043212890625, 11.79345703125, 12.543701171875, 13.2939453125, 14.044189453125, 14.79443359375, 15.544677734375, 16.294921875, 17.045166015625, 17.79541015625, 18.545654296875, 19.2958984375, 20.046142578125, 20.79638671875, 21.546630859375, 22.296875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 77.0, 442.0, 407.0, 75.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.29013061523438, -128.30751037597656, -125.32489013671875, -122.34226989746094, -119.35964965820312, -116.37702941894531, -113.3944091796875, -110.41178894042969, -107.42916870117188, -104.44654846191406, -101.46392822265625, -98.48130798339844, -95.49868774414062, -92.51606750488281, -89.533447265625, -86.55082702636719, -83.5682144165039, -80.5855941772461, -77.60297393798828, -74.62035369873047, -71.63773345947266, -68.65511322021484, -65.67250061035156, -62.689876556396484, -59.70725631713867, -56.72463607788086, -53.74201583862305, -50.7593994140625, -47.77677917480469, -44.794158935546875, -41.81153869628906, -38.82891845703125, -35.84629821777344, -32.863677978515625, -29.881057739257812, -26.898439407348633, -23.91581916809082, -20.933198928833008, -17.950580596923828, -14.967960357666016, -11.985340118408203, -9.00271987915039, -6.0201005935668945, -3.0374813079833984, -0.05486106872558594, 2.9277591705322266, 5.910377502441406, 8.892997741699219, 11.875617980957031, 14.858238220214844, 17.840858459472656, 20.823476791381836, 23.80609703063965, 26.78871726989746, 29.77133560180664, 32.75395584106445, 35.736576080322266, 38.71919631958008, 41.70181655883789, 44.68443298339844, 47.66705322265625, 50.64967346191406, 53.632293701171875, 56.61491394042969, 59.5975341796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 12.0, 10.0, 8.0, 12.0, 7.0, 15.0, 16.0, 22.0, 22.0, 25.0, 29.0, 37.0, 38.0, 43.0, 41.0, 49.0, 48.0, 57.0, 37.0, 44.0, 42.0, 43.0, 51.0, 37.0, 40.0, 31.0, 34.0, 17.0, 18.0, 22.0, 20.0, 20.0, 9.0, 5.0, 10.0, 9.0, 2.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.43429183959961, -19.788476943969727, -19.142662048339844, -18.49684715270996, -17.851032257080078, -17.205215454101562, -16.55940055847168, -15.913585662841797, -15.267770767211914, -14.621955871582031, -13.976140975952148, -13.33032512664795, -12.684510231018066, -12.038695335388184, -11.392879486083984, -10.747064590454102, -10.101249694824219, -9.455434799194336, -8.809619903564453, -8.163804054260254, -7.517989158630371, -6.872174263000488, -6.226358890533447, -5.580543518066406, -4.934728622436523, -4.288913726806641, -3.6430983543395996, -2.9972832202911377, -2.351468086242676, -1.7056529521942139, -1.059837818145752, -0.41402244567871094, 0.2317943572998047, 0.8776094913482666, 1.5234246253967285, 2.1692397594451904, 2.8150548934936523, 3.4608700275421143, 4.106685161590576, 4.752500534057617, 5.3983154296875, 6.044130325317383, 6.689945697784424, 7.335761070251465, 7.981575965881348, 8.62739086151123, 9.27320671081543, 9.919021606445312, 10.564836502075195, 11.210651397705078, 11.856466293334961, 12.50228214263916, 13.148097038269043, 13.793911933898926, 14.439727783203125, 15.085542678833008, 15.73135757446289, 16.377172470092773, 17.022987365722656, 17.66880226135254, 18.314617156982422, 18.960433959960938, 19.60624885559082, 20.252063751220703, 20.897878646850586]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 12.0, 16.0, 25.0, 21.0, 26.0, 28.0, 33.0, 29.0, 34.0, 25.0, 41.0, 40.0, 41.0, 46.0, 44.0, 43.0, 59.0, 40.0, 38.0, 32.0, 42.0, 25.0, 37.0, 39.0, 31.0, 15.0, 7.0, 21.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.80859375, -3.695465087890625, -3.58233642578125, -3.469207763671875, -3.3560791015625, -3.242950439453125, -3.12982177734375, -3.016693115234375, -2.903564453125, -2.790435791015625, -2.67730712890625, -2.564178466796875, -2.4510498046875, -2.337921142578125, -2.22479248046875, -2.111663818359375, -1.99853515625, -1.885406494140625, -1.77227783203125, -1.659149169921875, -1.5460205078125, -1.432891845703125, -1.31976318359375, -1.206634521484375, -1.093505859375, -0.980377197265625, -0.86724853515625, -0.754119873046875, -0.6409912109375, -0.527862548828125, -0.41473388671875, -0.301605224609375, -0.1884765625, -0.075347900390625, 0.03778076171875, 0.150909423828125, 0.2640380859375, 0.377166748046875, 0.49029541015625, 0.603424072265625, 0.716552734375, 0.829681396484375, 0.94281005859375, 1.055938720703125, 1.1690673828125, 1.282196044921875, 1.39532470703125, 1.508453369140625, 1.62158203125, 1.734710693359375, 1.84783935546875, 1.960968017578125, 2.0740966796875, 2.187225341796875, 2.30035400390625, 2.413482666015625, 2.526611328125, 2.639739990234375, 2.75286865234375, 2.865997314453125, 2.9791259765625, 3.092254638671875, 3.20538330078125, 3.318511962890625, 3.431640625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 8.0, 10.0, 8.0, 9.0, 30.0, 39.0, 67.0, 88.0, 124.0, 188.0, 295.0, 385.0, 620.0, 817.0, 1237.0, 1815.0, 2569.0, 3780.0, 5494.0, 8141.0, 12232.0, 18936.0, 29631.0, 48111.0, 81166.0, 140437.0, 220015.0, 187181.0, 110483.0, 64327.0, 38628.0, 24286.0, 15310.0, 10251.0, 6876.0, 4626.0, 3180.0, 2167.0, 1513.0, 1044.0, 745.0, 549.0, 336.0, 254.0, 159.0, 140.0, 87.0, 49.0, 40.0, 19.0, 26.0, 16.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.34716796875, -0.33551025390625, -0.3238525390625, -0.31219482421875, -0.300537109375, -0.28887939453125, -0.2772216796875, -0.26556396484375, -0.25390625, -0.24224853515625, -0.2305908203125, -0.21893310546875, -0.207275390625, -0.19561767578125, -0.1839599609375, -0.17230224609375, -0.16064453125, -0.14898681640625, -0.1373291015625, -0.12567138671875, -0.114013671875, -0.10235595703125, -0.0906982421875, -0.07904052734375, -0.0673828125, -0.05572509765625, -0.0440673828125, -0.03240966796875, -0.020751953125, -0.00909423828125, 0.0025634765625, 0.01422119140625, 0.02587890625, 0.03753662109375, 0.0491943359375, 0.06085205078125, 0.072509765625, 0.08416748046875, 0.0958251953125, 0.10748291015625, 0.119140625, 0.13079833984375, 0.1424560546875, 0.15411376953125, 0.165771484375, 0.17742919921875, 0.1890869140625, 0.20074462890625, 0.21240234375, 0.22406005859375, 0.2357177734375, 0.24737548828125, 0.259033203125, 0.27069091796875, 0.2823486328125, 0.29400634765625, 0.3056640625, 0.31732177734375, 0.3289794921875, 0.34063720703125, 0.352294921875, 0.36395263671875, 0.3756103515625, 0.38726806640625, 0.39892578125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 2.0, 4.0, 3.0, 8.0, 10.0, 11.0, 9.0, 18.0, 15.0, 18.0, 30.0, 21.0, 24.0, 36.0, 29.0, 32.0, 34.0, 28.0, 41.0, 60.0, 49.0, 1056.0, 49.0, 37.0, 41.0, 43.0, 21.0, 28.0, 39.0, 33.0, 32.0, 28.0, 7.0, 25.0, 16.0, 15.0, 12.0, 8.0, 17.0, 9.0, 7.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.19921875, -2.12896728515625, -2.0587158203125, -1.98846435546875, -1.918212890625, -1.84796142578125, -1.7777099609375, -1.70745849609375, -1.63720703125, -1.56695556640625, -1.4967041015625, -1.42645263671875, -1.356201171875, -1.28594970703125, -1.2156982421875, -1.14544677734375, -1.0751953125, -1.00494384765625, -0.9346923828125, -0.86444091796875, -0.794189453125, -0.72393798828125, -0.6536865234375, -0.58343505859375, -0.51318359375, -0.44293212890625, -0.3726806640625, -0.30242919921875, -0.232177734375, -0.16192626953125, -0.0916748046875, -0.02142333984375, 0.048828125, 0.11907958984375, 0.1893310546875, 0.25958251953125, 0.329833984375, 0.40008544921875, 0.4703369140625, 0.54058837890625, 0.61083984375, 0.68109130859375, 0.7513427734375, 0.82159423828125, 0.891845703125, 0.96209716796875, 1.0323486328125, 1.10260009765625, 1.1728515625, 1.24310302734375, 1.3133544921875, 1.38360595703125, 1.453857421875, 1.52410888671875, 1.5943603515625, 1.66461181640625, 1.73486328125, 1.80511474609375, 1.8753662109375, 1.94561767578125, 2.015869140625, 2.08612060546875, 2.1563720703125, 2.22662353515625, 2.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 9.0, 6.0, 12.0, 25.0, 24.0, 45.0, 62.0, 83.0, 125.0, 163.0, 253.0, 339.0, 507.0, 770.0, 1094.0, 1448.0, 2148.0, 3190.0, 4640.0, 6966.0, 10436.0, 15590.0, 24344.0, 38033.0, 61305.0, 99602.0, 160775.0, 1253228.0, 153178.0, 94840.0, 58552.0, 36414.0, 22974.0, 15127.0, 9871.0, 6435.0, 4345.0, 3134.0, 2087.0, 1443.0, 1007.0, 727.0, 537.0, 367.0, 264.0, 181.0, 141.0, 90.0, 76.0, 45.0, 23.0, 16.0, 19.0, 11.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.2939453125, -0.28459930419921875, -0.2752532958984375, -0.26590728759765625, -0.256561279296875, -0.24721527099609375, -0.2378692626953125, -0.22852325439453125, -0.21917724609375, -0.20983123779296875, -0.2004852294921875, -0.19113922119140625, -0.181793212890625, -0.17244720458984375, -0.1631011962890625, -0.15375518798828125, -0.1444091796875, -0.13506317138671875, -0.1257171630859375, -0.11637115478515625, -0.107025146484375, -0.09767913818359375, -0.0883331298828125, -0.07898712158203125, -0.06964111328125, -0.06029510498046875, -0.0509490966796875, -0.04160308837890625, -0.032257080078125, -0.02291107177734375, -0.0135650634765625, -0.00421905517578125, 0.005126953125, 0.01447296142578125, 0.0238189697265625, 0.03316497802734375, 0.042510986328125, 0.05185699462890625, 0.0612030029296875, 0.07054901123046875, 0.07989501953125, 0.08924102783203125, 0.0985870361328125, 0.10793304443359375, 0.117279052734375, 0.12662506103515625, 0.1359710693359375, 0.14531707763671875, 0.1546630859375, 0.16400909423828125, 0.1733551025390625, 0.18270111083984375, 0.192047119140625, 0.20139312744140625, 0.2107391357421875, 0.22008514404296875, 0.22943115234375, 0.23877716064453125, 0.2481231689453125, 0.25746917724609375, 0.266815185546875, 0.27616119384765625, 0.2855072021484375, 0.29485321044921875, 0.30419921875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 6.0, 13.0, 9.0, 9.0, 21.0, 9.0, 30.0, 32.0, 51.0, 57.0, 53.0, 86.0, 110.0, 85.0, 79.0, 96.0, 43.0, 41.0, 30.0, 31.0, 19.0, 16.0, 6.0, 18.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020904541015625, -0.0020271241664886475, -0.001963794231414795, -0.0019004642963409424, -0.0018371343612670898, -0.0017738044261932373, -0.0017104744911193848, -0.0016471445560455322, -0.0015838146209716797, -0.0015204846858978271, -0.0014571547508239746, -0.001393824815750122, -0.0013304948806762695, -0.001267164945602417, -0.0012038350105285645, -0.001140505075454712, -0.0010771751403808594, -0.0010138452053070068, -0.0009505152702331543, -0.0008871853351593018, -0.0008238554000854492, -0.0007605254650115967, -0.0006971955299377441, -0.0006338655948638916, -0.0005705356597900391, -0.0005072057247161865, -0.000443875789642334, -0.00038054585456848145, -0.0003172159194946289, -0.00025388598442077637, -0.00019055604934692383, -0.0001272261142730713, -6.389617919921875e-05, -5.662441253662109e-07, 6.276369094848633e-05, 0.00012609362602233887, 0.0001894235610961914, 0.00025275349617004395, 0.0003160834312438965, 0.000379413366317749, 0.00044274330139160156, 0.0005060732364654541, 0.0005694031715393066, 0.0006327331066131592, 0.0006960630416870117, 0.0007593929767608643, 0.0008227229118347168, 0.0008860528469085693, 0.0009493827819824219, 0.0010127127170562744, 0.001076042652130127, 0.0011393725872039795, 0.001202702522277832, 0.0012660324573516846, 0.0013293623924255371, 0.0013926923274993896, 0.0014560222625732422, 0.0015193521976470947, 0.0015826821327209473, 0.0016460120677947998, 0.0017093420028686523, 0.0017726719379425049, 0.0018360018730163574, 0.00189933180809021, 0.0019626617431640625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 12.0, 2.0, 4.0, 3.0, 6.0, 9.0, 11.0, 19.0, 29.0, 31.0, 31.0, 63.0, 74.0, 107.0, 164.0, 270.0, 583.0, 1673.0, 970045.0, 73236.0, 1006.0, 393.0, 258.0, 162.0, 89.0, 71.0, 36.0, 40.0, 30.0, 25.0, 16.0, 9.0, 17.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.036285400390625, -0.03510856628417969, -0.033931732177734375, -0.03275489807128906, -0.03157806396484375, -0.030401229858398438, -0.029224395751953125, -0.028047561645507812, -0.0268707275390625, -0.025693893432617188, -0.024517059326171875, -0.023340225219726562, -0.02216339111328125, -0.020986557006835938, -0.019809722900390625, -0.018632888793945312, -0.0174560546875, -0.016279220581054688, -0.015102386474609375, -0.013925552368164062, -0.01274871826171875, -0.011571884155273438, -0.010395050048828125, -0.009218215942382812, -0.0080413818359375, -0.0068645477294921875, -0.005687713623046875, -0.0045108795166015625, -0.00333404541015625, -0.0021572113037109375, -0.000980377197265625, 0.0001964569091796875, 0.001373291015625, 0.0025501251220703125, 0.003726959228515625, 0.0049037933349609375, 0.00608062744140625, 0.0072574615478515625, 0.008434295654296875, 0.009611129760742188, 0.0107879638671875, 0.011964797973632812, 0.013141632080078125, 0.014318466186523438, 0.01549530029296875, 0.016672134399414062, 0.017848968505859375, 0.019025802612304688, 0.02020263671875, 0.021379470825195312, 0.022556304931640625, 0.023733139038085938, 0.02490997314453125, 0.026086807250976562, 0.027263641357421875, 0.028440475463867188, 0.0296173095703125, 0.030794143676757812, 0.031970977783203125, 0.03314781188964844, 0.03432464599609375, 0.03550148010253906, 0.036678314208984375, 0.03785514831542969, 0.039031982421875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 15.0, 70.0, 248.0, 370.0, 215.0, 75.0, 11.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031177103519439697, -0.0030344061087816954, -0.002951101865619421, -0.0028677978552877903, -0.002784493612125516, -0.0027011893689632416, -0.002617885125800967, -0.002534580882638693, -0.002451276872307062, -0.002367972629144788, -0.0022846683859825134, -0.0022013643756508827, -0.0021180601324886084, -0.002034755889326334, -0.0019514516461640596, -0.0018681474030017853, -0.001784843159839511, -0.0017015389166772366, -0.001618234789930284, -0.0015349305467680097, -0.0014516264200210571, -0.0013683221768587828, -0.0012850179336965084, -0.001201713690534234, -0.0011184095637872815, -0.0010351053206250072, -0.0009518011938780546, -0.0008684969507157803, -0.0007851927657611668, -0.0007018885808065534, -0.000618584337644279, -0.0005352801526896656, -0.0004519759677350521, -0.00036867178278043866, -0.00028536756872199476, -0.00020206335466355085, -0.0001187591697089374, -3.545498475432396e-05, 4.78492584079504e-05, 0.00013115344336256385, 0.0002144576283171773, 0.00029776181327179074, 0.00038106602733023465, 0.00046437024138867855, 0.000547674426343292, 0.0006309786112979054, 0.0007142828544601798, 0.0007975870394147933, 0.0008808912243694067, 0.0009641954093240201, 0.0010474995942786336, 0.001130803837440908, 0.0012141079641878605, 0.0012974122073501348, 0.0013807164505124092, 0.0014640206936746836, 0.001547324820421636, 0.0016306290635839105, 0.001713933190330863, 0.0017972374334931374, 0.0018805416766554117, 0.001963845919817686, 0.002047149930149317, 0.002130454173311591, 0.0022137584164738655]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 5.0, 11.0, 11.0, 7.0, 9.0, 14.0, 16.0, 20.0, 26.0, 25.0, 34.0, 28.0, 40.0, 39.0, 43.0, 44.0, 43.0, 44.0, 41.0, 45.0, 43.0, 45.0, 36.0, 34.0, 42.0, 45.0, 35.0, 31.0, 17.0, 22.0, 19.0, 19.0, 14.0, 12.0, 6.0, 5.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008981227874755859, -0.0008695870637893677, -0.0008410513401031494, -0.0008125156164169312, -0.0007839798927307129, -0.0007554441690444946, -0.0007269084453582764, -0.0006983727216720581, -0.0006698369979858398, -0.0006413012742996216, -0.0006127655506134033, -0.0005842298269271851, -0.0005556941032409668, -0.0005271583795547485, -0.0004986226558685303, -0.000470086932182312, -0.00044155120849609375, -0.0004130154848098755, -0.0003844797611236572, -0.00035594403743743896, -0.0003274083137512207, -0.00029887259006500244, -0.0002703368663787842, -0.00024180114269256592, -0.00021326541900634766, -0.0001847296953201294, -0.00015619397163391113, -0.00012765824794769287, -9.912252426147461e-05, -7.058680057525635e-05, -4.2051076889038086e-05, -1.3515353202819824e-05, 1.5020370483398438e-05, 4.35560941696167e-05, 7.209181785583496e-05, 0.00010062754154205322, 0.00012916326522827148, 0.00015769898891448975, 0.000186234712600708, 0.00021477043628692627, 0.00024330615997314453, 0.0002718418836593628, 0.00030037760734558105, 0.0003289133310317993, 0.0003574490547180176, 0.00038598477840423584, 0.0004145205020904541, 0.00044305622577667236, 0.0004715919494628906, 0.0005001276731491089, 0.0005286633968353271, 0.0005571991205215454, 0.0005857348442077637, 0.0006142705678939819, 0.0006428062915802002, 0.0006713420152664185, 0.0006998777389526367, 0.000728413462638855, 0.0007569491863250732, 0.0007854849100112915, 0.0008140206336975098, 0.000842556357383728, 0.0008710920810699463, 0.0008996278047561646, 0.0009281635284423828]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 12.0, 16.0, 25.0, 21.0, 26.0, 28.0, 33.0, 29.0, 34.0, 25.0, 41.0, 40.0, 41.0, 46.0, 44.0, 43.0, 59.0, 40.0, 38.0, 32.0, 42.0, 25.0, 37.0, 39.0, 31.0, 15.0, 7.0, 21.0, 10.0, 15.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.80859375, -3.695465087890625, -3.58233642578125, -3.469207763671875, -3.3560791015625, -3.242950439453125, -3.12982177734375, -3.016693115234375, -2.903564453125, -2.790435791015625, -2.67730712890625, -2.564178466796875, -2.4510498046875, -2.337921142578125, -2.22479248046875, -2.111663818359375, -1.99853515625, -1.885406494140625, -1.77227783203125, -1.659149169921875, -1.5460205078125, -1.432891845703125, -1.31976318359375, -1.206634521484375, -1.093505859375, -0.980377197265625, -0.86724853515625, -0.754119873046875, -0.6409912109375, -0.527862548828125, -0.41473388671875, -0.301605224609375, -0.1884765625, -0.075347900390625, 0.03778076171875, 0.150909423828125, 0.2640380859375, 0.377166748046875, 0.49029541015625, 0.603424072265625, 0.716552734375, 0.829681396484375, 0.94281005859375, 1.055938720703125, 1.1690673828125, 1.282196044921875, 1.39532470703125, 1.508453369140625, 1.62158203125, 1.734710693359375, 1.84783935546875, 1.960968017578125, 2.0740966796875, 2.187225341796875, 2.30035400390625, 2.413482666015625, 2.526611328125, 2.639739990234375, 2.75286865234375, 2.865997314453125, 2.9791259765625, 3.092254638671875, 3.20538330078125, 3.318511962890625, 3.431640625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 9.0, 19.0, 29.0, 29.0, 47.0, 44.0, 69.0, 73.0, 102.0, 160.0, 202.0, 270.0, 323.0, 469.0, 643.0, 897.0, 1199.0, 1959.0, 5248.0, 28376.0, 163862.0, 534123.0, 250260.0, 44924.0, 7830.0, 2365.0, 1364.0, 909.0, 658.0, 516.0, 385.0, 298.0, 228.0, 169.0, 124.0, 91.0, 68.0, 55.0, 31.0, 23.0, 25.0, 19.0, 15.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0], "bins": [-7.01953125, -6.797607421875, -6.57568359375, -6.353759765625, -6.1318359375, -5.909912109375, -5.68798828125, -5.466064453125, -5.244140625, -5.022216796875, -4.80029296875, -4.578369140625, -4.3564453125, -4.134521484375, -3.91259765625, -3.690673828125, -3.46875, -3.246826171875, -3.02490234375, -2.802978515625, -2.5810546875, -2.359130859375, -2.13720703125, -1.915283203125, -1.693359375, -1.471435546875, -1.24951171875, -1.027587890625, -0.8056640625, -0.583740234375, -0.36181640625, -0.139892578125, 0.08203125, 0.303955078125, 0.52587890625, 0.747802734375, 0.9697265625, 1.191650390625, 1.41357421875, 1.635498046875, 1.857421875, 2.079345703125, 2.30126953125, 2.523193359375, 2.7451171875, 2.967041015625, 3.18896484375, 3.410888671875, 3.6328125, 3.854736328125, 4.07666015625, 4.298583984375, 4.5205078125, 4.742431640625, 4.96435546875, 5.186279296875, 5.408203125, 5.630126953125, 5.85205078125, 6.073974609375, 6.2958984375, 6.517822265625, 6.73974609375, 6.961669921875, 7.18359375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 7.0, 10.0, 12.0, 17.0, 21.0, 32.0, 40.0, 35.0, 27.0, 47.0, 65.0, 53.0, 110.0, 186.0, 1353.0, 318.0, 172.0, 93.0, 82.0, 51.0, 37.0, 33.0, 24.0, 35.0, 35.0, 19.0, 26.0, 17.0, 17.0, 15.0, 6.0, 6.0, 13.0, 3.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.71875, -8.4461669921875, -8.173583984375, -7.9010009765625, -7.62841796875, -7.3558349609375, -7.083251953125, -6.8106689453125, -6.5380859375, -6.2655029296875, -5.992919921875, -5.7203369140625, -5.44775390625, -5.1751708984375, -4.902587890625, -4.6300048828125, -4.357421875, -4.0848388671875, -3.812255859375, -3.5396728515625, -3.26708984375, -2.9945068359375, -2.721923828125, -2.4493408203125, -2.1767578125, -1.9041748046875, -1.631591796875, -1.3590087890625, -1.08642578125, -0.8138427734375, -0.541259765625, -0.2686767578125, 0.00390625, 0.2764892578125, 0.549072265625, 0.8216552734375, 1.09423828125, 1.3668212890625, 1.639404296875, 1.9119873046875, 2.1845703125, 2.4571533203125, 2.729736328125, 3.0023193359375, 3.27490234375, 3.5474853515625, 3.820068359375, 4.0926513671875, 4.365234375, 4.6378173828125, 4.910400390625, 5.1829833984375, 5.45556640625, 5.7281494140625, 6.000732421875, 6.2733154296875, 6.5458984375, 6.8184814453125, 7.091064453125, 7.3636474609375, 7.63623046875, 7.9088134765625, 8.181396484375, 8.4539794921875, 8.7265625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 2.0, 14.0, 10.0, 16.0, 19.0, 25.0, 28.0, 47.0, 57.0, 87.0, 107.0, 160.0, 242.0, 366.0, 645.0, 1253.0, 5115.0, 3129565.0, 4941.0, 1232.0, 619.0, 345.0, 229.0, 164.0, 114.0, 68.0, 62.0, 36.0, 30.0, 24.0, 14.0, 12.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.4951171875, -33.240234375, -31.9853515625, -30.73046875, -29.4755859375, -28.220703125, -26.9658203125, -25.7109375, -24.4560546875, -23.201171875, -21.9462890625, -20.69140625, -19.4365234375, -18.181640625, -16.9267578125, -15.671875, -14.4169921875, -13.162109375, -11.9072265625, -10.65234375, -9.3974609375, -8.142578125, -6.8876953125, -5.6328125, -4.3779296875, -3.123046875, -1.8681640625, -0.61328125, 0.6416015625, 1.896484375, 3.1513671875, 4.40625, 5.6611328125, 6.916015625, 8.1708984375, 9.42578125, 10.6806640625, 11.935546875, 13.1904296875, 14.4453125, 15.7001953125, 16.955078125, 18.2099609375, 19.46484375, 20.7197265625, 21.974609375, 23.2294921875, 24.484375, 25.7392578125, 26.994140625, 28.2490234375, 29.50390625, 30.7587890625, 32.013671875, 33.2685546875, 34.5234375, 35.7783203125, 37.033203125, 38.2880859375, 39.54296875, 40.7978515625, 42.052734375, 43.3076171875, 44.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 120.0, 611.0, 261.0, 20.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-119.82560729980469, -117.14168548583984, -114.45775604248047, -111.77383422851562, -109.08990478515625, -106.4059829711914, -103.72206115722656, -101.03813171386719, -98.35420989990234, -95.6702880859375, -92.98635864257812, -90.30243682861328, -87.61851501464844, -84.93458557128906, -82.25066375732422, -79.56674194335938, -76.8828125, -74.19889068603516, -71.51496124267578, -68.83103942871094, -66.14710998535156, -63.46318817138672, -60.779266357421875, -58.095340728759766, -55.411415100097656, -52.72748947143555, -50.04356384277344, -47.359642028808594, -44.675716400146484, -41.991790771484375, -39.30786895751953, -36.62394332885742, -33.94001007080078, -31.256084442138672, -28.572160720825195, -25.88823699951172, -23.20431137084961, -20.5203857421875, -17.836462020874023, -15.152538299560547, -12.468612670898438, -9.784687995910645, -7.100763320922852, -4.416838645935059, -1.7329139709472656, 0.9510107040405273, 3.6349353790283203, 6.318859100341797, 9.002784729003906, 11.6867094039917, 14.370634078979492, 17.05455780029297, 19.738483428955078, 22.422409057617188, 25.106332778930664, 27.79025650024414, 30.47418212890625, 33.15810775756836, 35.84203338623047, 38.52595520019531, 41.20988082885742, 43.89380645751953, 46.577728271484375, 49.261653900146484, 51.945579528808594]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 12.0, 7.0, 10.0, 12.0, 13.0, 16.0, 16.0, 19.0, 21.0, 23.0, 25.0, 24.0, 31.0, 29.0, 27.0, 35.0, 32.0, 28.0, 42.0, 39.0, 41.0, 49.0, 46.0, 34.0, 40.0, 33.0, 41.0, 32.0, 25.0, 24.0, 21.0, 21.0, 18.0, 15.0, 19.0, 14.0, 21.0, 5.0, 5.0, 8.0, 10.0, 1.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-21.61600112915039, -20.964628219604492, -20.313257217407227, -19.661884307861328, -19.01051139831543, -18.35913848876953, -17.707767486572266, -17.056394577026367, -16.40502166748047, -15.753649711608887, -15.102276802062988, -14.450904846191406, -13.799531936645508, -13.148159980773926, -12.496788024902344, -11.845415115356445, -11.19404411315918, -10.542672157287598, -9.8912992477417, -9.239927291870117, -8.588554382324219, -7.937182426452637, -7.285810470581055, -6.6344380378723145, -5.983065605163574, -5.331693172454834, -4.680320739746094, -4.028948783874512, -3.3775763511657715, -2.7262039184570312, -2.07483172416687, -1.423459529876709, -0.7720870971679688, -0.12071478366851807, 0.5306575298309326, 1.1820298433303833, 1.833402156829834, 2.484774589538574, 3.1361467838287354, 3.7875189781188965, 4.438891410827637, 5.090263843536377, 5.741636276245117, 6.393008232116699, 7.0443806648254395, 7.69575309753418, 8.347125053405762, 8.998497009277344, 9.649869918823242, 10.301241874694824, 10.952614784240723, 11.603986740112305, 12.255359649658203, 12.906731605529785, 13.558103561401367, 14.209476470947266, 14.860848426818848, 15.51222038269043, 16.163593292236328, 16.814966201782227, 17.466337203979492, 18.11771011352539, 18.76908302307129, 19.420454025268555, 20.071826934814453]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 11.0, 11.0, 14.0, 14.0, 16.0, 25.0, 25.0, 20.0, 28.0, 36.0, 29.0, 41.0, 36.0, 41.0, 34.0, 53.0, 45.0, 42.0, 39.0, 33.0, 52.0, 61.0, 30.0, 33.0, 34.0, 18.0, 21.0, 23.0, 22.0, 16.0, 14.0, 10.0, 12.0, 9.0, 3.0, 9.0, 5.0, 4.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41015625, -3.29620361328125, -3.1822509765625, -3.06829833984375, -2.954345703125, -2.84039306640625, -2.7264404296875, -2.61248779296875, -2.49853515625, -2.38458251953125, -2.2706298828125, -2.15667724609375, -2.042724609375, -1.92877197265625, -1.8148193359375, -1.70086669921875, -1.5869140625, -1.47296142578125, -1.3590087890625, -1.24505615234375, -1.131103515625, -1.01715087890625, -0.9031982421875, -0.78924560546875, -0.67529296875, -0.56134033203125, -0.4473876953125, -0.33343505859375, -0.219482421875, -0.10552978515625, 0.0084228515625, 0.12237548828125, 0.236328125, 0.35028076171875, 0.4642333984375, 0.57818603515625, 0.692138671875, 0.80609130859375, 0.9200439453125, 1.03399658203125, 1.14794921875, 1.26190185546875, 1.3758544921875, 1.48980712890625, 1.603759765625, 1.71771240234375, 1.8316650390625, 1.94561767578125, 2.0595703125, 2.17352294921875, 2.2874755859375, 2.40142822265625, 2.515380859375, 2.62933349609375, 2.7432861328125, 2.85723876953125, 2.97119140625, 3.08514404296875, 3.1990966796875, 3.31304931640625, 3.427001953125, 3.54095458984375, 3.6549072265625, 3.76885986328125, 3.8828125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 5.0, 14.0, 21.0, 18.0, 31.0, 32.0, 58.0, 95.0, 131.0, 190.0, 338.0, 556.0, 1000.0, 1859.0, 3999.0, 9374.0, 26073.0, 85366.0, 294996.0, 873904.0, 1582842.0, 885385.0, 298695.0, 85412.0, 25974.0, 9562.0, 3951.0, 1934.0, 977.0, 503.0, 317.0, 211.0, 127.0, 72.0, 68.0, 55.0, 27.0, 22.0, 24.0, 15.0, 5.0, 8.0, 12.0, 3.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.506378173828125, -3.37408447265625, -3.241790771484375, -3.1094970703125, -2.977203369140625, -2.84490966796875, -2.712615966796875, -2.580322265625, -2.448028564453125, -2.31573486328125, -2.183441162109375, -2.0511474609375, -1.918853759765625, -1.78656005859375, -1.654266357421875, -1.52197265625, -1.389678955078125, -1.25738525390625, -1.125091552734375, -0.9927978515625, -0.860504150390625, -0.72821044921875, -0.595916748046875, -0.463623046875, -0.331329345703125, -0.19903564453125, -0.066741943359375, 0.0655517578125, 0.197845458984375, 0.33013916015625, 0.462432861328125, 0.5947265625, 0.727020263671875, 0.85931396484375, 0.991607666015625, 1.1239013671875, 1.256195068359375, 1.38848876953125, 1.520782470703125, 1.653076171875, 1.785369873046875, 1.91766357421875, 2.049957275390625, 2.1822509765625, 2.314544677734375, 2.44683837890625, 2.579132080078125, 2.71142578125, 2.843719482421875, 2.97601318359375, 3.108306884765625, 3.2406005859375, 3.372894287109375, 3.50518798828125, 3.637481689453125, 3.769775390625, 3.902069091796875, 4.03436279296875, 4.166656494140625, 4.2989501953125, 4.431243896484375, 4.56353759765625, 4.695831298828125, 4.828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 6.0, 8.0, 14.0, 16.0, 31.0, 29.0, 36.0, 52.0, 71.0, 101.0, 123.0, 183.0, 238.0, 363.0, 463.0, 546.0, 448.0, 342.0, 237.0, 182.0, 139.0, 100.0, 100.0, 51.0, 51.0, 33.0, 31.0, 20.0, 20.0, 7.0, 7.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.23046875, -7.02032470703125, -6.8101806640625, -6.60003662109375, -6.389892578125, -6.17974853515625, -5.9696044921875, -5.75946044921875, -5.54931640625, -5.33917236328125, -5.1290283203125, -4.91888427734375, -4.708740234375, -4.49859619140625, -4.2884521484375, -4.07830810546875, -3.8681640625, -3.65802001953125, -3.4478759765625, -3.23773193359375, -3.027587890625, -2.81744384765625, -2.6072998046875, -2.39715576171875, -2.18701171875, -1.97686767578125, -1.7667236328125, -1.55657958984375, -1.346435546875, -1.13629150390625, -0.9261474609375, -0.71600341796875, -0.505859375, -0.29571533203125, -0.0855712890625, 0.12457275390625, 0.334716796875, 0.54486083984375, 0.7550048828125, 0.96514892578125, 1.17529296875, 1.38543701171875, 1.5955810546875, 1.80572509765625, 2.015869140625, 2.22601318359375, 2.4361572265625, 2.64630126953125, 2.8564453125, 3.06658935546875, 3.2767333984375, 3.48687744140625, 3.697021484375, 3.90716552734375, 4.1173095703125, 4.32745361328125, 4.53759765625, 4.74774169921875, 4.9578857421875, 5.16802978515625, 5.378173828125, 5.58831787109375, 5.7984619140625, 6.00860595703125, 6.21875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 9.0, 14.0, 29.0, 26.0, 55.0, 117.0, 182.0, 326.0, 595.0, 1473.0, 4966.0, 86031.0, 3227877.0, 847236.0, 20827.0, 2621.0, 919.0, 447.0, 223.0, 128.0, 67.0, 51.0, 22.0, 13.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.71875, -20.234619140625, -19.75048828125, -19.266357421875, -18.7822265625, -18.298095703125, -17.81396484375, -17.329833984375, -16.845703125, -16.361572265625, -15.87744140625, -15.393310546875, -14.9091796875, -14.425048828125, -13.94091796875, -13.456787109375, -12.97265625, -12.488525390625, -12.00439453125, -11.520263671875, -11.0361328125, -10.552001953125, -10.06787109375, -9.583740234375, -9.099609375, -8.615478515625, -8.13134765625, -7.647216796875, -7.1630859375, -6.678955078125, -6.19482421875, -5.710693359375, -5.2265625, -4.742431640625, -4.25830078125, -3.774169921875, -3.2900390625, -2.805908203125, -2.32177734375, -1.837646484375, -1.353515625, -0.869384765625, -0.38525390625, 0.098876953125, 0.5830078125, 1.067138671875, 1.55126953125, 2.035400390625, 2.51953125, 3.003662109375, 3.48779296875, 3.971923828125, 4.4560546875, 4.940185546875, 5.42431640625, 5.908447265625, 6.392578125, 6.876708984375, 7.36083984375, 7.844970703125, 8.3291015625, 8.813232421875, 9.29736328125, 9.781494140625, 10.265625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 9.0, 122.0, 636.0, 241.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.91302490234375, -168.05313110351562, -163.19322204589844, -158.3333282470703, -153.4734344482422, -148.613525390625, -143.75363159179688, -138.89373779296875, -134.03382873535156, -129.17393493652344, -124.31403350830078, -119.45413208007812, -114.59423065185547, -109.73432922363281, -104.87443542480469, -100.01453399658203, -95.1546401977539, -90.29473876953125, -85.43484497070312, -80.57494354248047, -75.71504211425781, -70.85514831542969, -65.99524688720703, -61.135345458984375, -56.275447845458984, -51.415550231933594, -46.55564880371094, -41.69575119018555, -36.835853576660156, -31.9759521484375, -27.11605453491211, -22.256153106689453, -17.396255493164062, -12.536355972290039, -7.676457405090332, -2.816558837890625, 2.0433406829833984, 6.903240203857422, 11.763137817382812, 16.62303924560547, 21.48293685913086, 26.342836380004883, 31.202735900878906, 36.0626335144043, 40.92253112792969, 45.782432556152344, 50.642330169677734, 55.50223159790039, 60.36212921142578, 65.22203063964844, 70.08192443847656, 74.94182586669922, 79.80172729492188, 84.66162109375, 89.52152252197266, 94.38142395019531, 99.24131774902344, 104.1012191772461, 108.96111297607422, 113.82101440429688, 118.68091583251953, 123.54081726074219, 128.4007110595703, 133.2606201171875, 138.12051391601562]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 6.0, 8.0, 7.0, 7.0, 8.0, 12.0, 19.0, 25.0, 22.0, 19.0, 20.0, 24.0, 28.0, 36.0, 31.0, 33.0, 42.0, 41.0, 32.0, 36.0, 40.0, 35.0, 38.0, 25.0, 33.0, 44.0, 37.0, 23.0, 29.0, 36.0, 31.0, 25.0, 14.0, 20.0, 19.0, 23.0, 14.0, 9.0, 11.0, 14.0, 4.0, 5.0, 0.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.626014709472656, -24.84342384338379, -24.06083106994629, -23.278240203857422, -22.495647430419922, -21.713056564331055, -20.930465698242188, -20.147872924804688, -19.36528205871582, -18.582691192626953, -17.800098419189453, -17.017507553100586, -16.23491668701172, -15.452323913574219, -14.669733047485352, -13.887141227722168, -13.104549407958984, -12.3219575881958, -11.539365768432617, -10.75677490234375, -9.974183082580566, -9.191591262817383, -8.409000396728516, -7.626408576965332, -6.843816757202148, -6.061224937438965, -5.2786335945129395, -4.496042251586914, -3.7134504318237305, -2.930858850479126, -2.1482672691345215, -1.365675926208496, -0.5830821990966797, 0.1995093822479248, 0.9821009635925293, 1.7646925449371338, 2.5472841262817383, 3.3298757076263428, 4.112467288970947, 4.895058631896973, 5.677650451660156, 6.46024227142334, 7.242833614349365, 8.02542495727539, 8.808016777038574, 9.590608596801758, 10.373199462890625, 11.155791282653809, 11.938383102416992, 12.720974922180176, 13.50356674194336, 14.286157608032227, 15.06874942779541, 15.851341247558594, 16.63393211364746, 17.416522979736328, 18.199115753173828, 18.981706619262695, 19.764299392700195, 20.546890258789062, 21.329483032226562, 22.11207389831543, 22.894664764404297, 23.677257537841797, 24.459848403930664]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 12.0, 6.0, 9.0, 8.0, 10.0, 26.0, 19.0, 23.0, 18.0, 22.0, 36.0, 35.0, 25.0, 28.0, 49.0, 42.0, 47.0, 41.0, 48.0, 34.0, 42.0, 40.0, 43.0, 37.0, 33.0, 32.0, 25.0, 28.0, 30.0, 31.0, 23.0, 15.0, 8.0, 19.0, 13.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.070343017578125, -2.97467041015625, -2.878997802734375, -2.7833251953125, -2.687652587890625, -2.59197998046875, -2.496307373046875, -2.400634765625, -2.304962158203125, -2.20928955078125, -2.113616943359375, -2.0179443359375, -1.922271728515625, -1.82659912109375, -1.730926513671875, -1.63525390625, -1.539581298828125, -1.44390869140625, -1.348236083984375, -1.2525634765625, -1.156890869140625, -1.06121826171875, -0.965545654296875, -0.869873046875, -0.774200439453125, -0.67852783203125, -0.582855224609375, -0.4871826171875, -0.391510009765625, -0.29583740234375, -0.200164794921875, -0.1044921875, -0.008819580078125, 0.08685302734375, 0.182525634765625, 0.2781982421875, 0.373870849609375, 0.46954345703125, 0.565216064453125, 0.660888671875, 0.756561279296875, 0.85223388671875, 0.947906494140625, 1.0435791015625, 1.139251708984375, 1.23492431640625, 1.330596923828125, 1.42626953125, 1.521942138671875, 1.61761474609375, 1.713287353515625, 1.8089599609375, 1.904632568359375, 2.00030517578125, 2.095977783203125, 2.191650390625, 2.287322998046875, 2.38299560546875, 2.478668212890625, 2.5743408203125, 2.670013427734375, 2.76568603515625, 2.861358642578125, 2.95703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 12.0, 21.0, 34.0, 35.0, 58.0, 80.0, 124.0, 166.0, 250.0, 387.0, 581.0, 799.0, 1160.0, 1800.0, 2686.0, 4038.0, 5910.0, 9126.0, 14069.0, 21845.0, 34605.0, 57239.0, 99709.0, 177797.0, 233800.0, 156189.0, 87383.0, 50617.0, 31098.0, 19574.0, 12577.0, 8210.0, 5437.0, 3617.0, 2409.0, 1642.0, 1105.0, 741.0, 479.0, 352.0, 251.0, 156.0, 125.0, 86.0, 55.0, 39.0, 31.0, 14.0, 8.0, 9.0, 6.0, 2.0, 2.0, 3.0], "bins": [-0.341796875, -0.33185577392578125, -0.3219146728515625, -0.31197357177734375, -0.302032470703125, -0.29209136962890625, -0.2821502685546875, -0.27220916748046875, -0.26226806640625, -0.25232696533203125, -0.2423858642578125, -0.23244476318359375, -0.222503662109375, -0.21256256103515625, -0.2026214599609375, -0.19268035888671875, -0.1827392578125, -0.17279815673828125, -0.1628570556640625, -0.15291595458984375, -0.142974853515625, -0.13303375244140625, -0.1230926513671875, -0.11315155029296875, -0.10321044921875, -0.09326934814453125, -0.0833282470703125, -0.07338714599609375, -0.063446044921875, -0.05350494384765625, -0.0435638427734375, -0.03362274169921875, -0.023681640625, -0.01374053955078125, -0.0037994384765625, 0.00614166259765625, 0.016082763671875, 0.02602386474609375, 0.0359649658203125, 0.04590606689453125, 0.05584716796875, 0.06578826904296875, 0.0757293701171875, 0.08567047119140625, 0.095611572265625, 0.10555267333984375, 0.1154937744140625, 0.12543487548828125, 0.1353759765625, 0.14531707763671875, 0.1552581787109375, 0.16519927978515625, 0.175140380859375, 0.18508148193359375, 0.1950225830078125, 0.20496368408203125, 0.21490478515625, 0.22484588623046875, 0.2347869873046875, 0.24472808837890625, 0.254669189453125, 0.26461029052734375, 0.2745513916015625, 0.28449249267578125, 0.29443359375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 3.0, 4.0, 10.0, 11.0, 10.0, 11.0, 23.0, 18.0, 23.0, 29.0, 24.0, 33.0, 26.0, 23.0, 31.0, 30.0, 43.0, 35.0, 47.0, 41.0, 1059.0, 43.0, 39.0, 41.0, 26.0, 25.0, 44.0, 26.0, 28.0, 30.0, 26.0, 24.0, 23.0, 13.0, 18.0, 11.0, 9.0, 9.0, 16.0, 6.0, 3.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-1.8505859375, -1.7937774658203125, -1.736968994140625, -1.6801605224609375, -1.62335205078125, -1.5665435791015625, -1.509735107421875, -1.4529266357421875, -1.3961181640625, -1.3393096923828125, -1.282501220703125, -1.2256927490234375, -1.16888427734375, -1.1120758056640625, -1.055267333984375, -0.9984588623046875, -0.941650390625, -0.8848419189453125, -0.828033447265625, -0.7712249755859375, -0.71441650390625, -0.6576080322265625, -0.600799560546875, -0.5439910888671875, -0.4871826171875, -0.4303741455078125, -0.373565673828125, -0.3167572021484375, -0.25994873046875, -0.2031402587890625, -0.146331787109375, -0.0895233154296875, -0.03271484375, 0.0240936279296875, 0.080902099609375, 0.1377105712890625, 0.19451904296875, 0.2513275146484375, 0.308135986328125, 0.3649444580078125, 0.4217529296875, 0.4785614013671875, 0.535369873046875, 0.5921783447265625, 0.64898681640625, 0.7057952880859375, 0.762603759765625, 0.8194122314453125, 0.876220703125, 0.9330291748046875, 0.989837646484375, 1.0466461181640625, 1.10345458984375, 1.1602630615234375, 1.217071533203125, 1.2738800048828125, 1.3306884765625, 1.3874969482421875, 1.444305419921875, 1.5011138916015625, 1.55792236328125, 1.6147308349609375, 1.671539306640625, 1.7283477783203125, 1.78515625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 6.0, 9.0, 7.0, 23.0, 24.0, 33.0, 52.0, 84.0, 108.0, 147.0, 250.0, 336.0, 421.0, 633.0, 881.0, 1342.0, 1884.0, 2734.0, 4132.0, 5933.0, 8821.0, 13258.0, 19920.0, 31303.0, 49177.0, 80120.0, 133621.0, 1254202.0, 184911.0, 113242.0, 68101.0, 41934.0, 26252.0, 17156.0, 11336.0, 7606.0, 5270.0, 3701.0, 2471.0, 1674.0, 1216.0, 854.0, 655.0, 379.0, 278.0, 178.0, 144.0, 122.0, 62.0, 46.0, 31.0, 26.0, 9.0, 8.0, 8.0, 4.0, 6.0, 1.0], "bins": [-0.26806640625, -0.2601432800292969, -0.25222015380859375, -0.24429702758789062, -0.2363739013671875, -0.22845077514648438, -0.22052764892578125, -0.21260452270507812, -0.204681396484375, -0.19675827026367188, -0.18883514404296875, -0.18091201782226562, -0.1729888916015625, -0.16506576538085938, -0.15714263916015625, -0.14921951293945312, -0.14129638671875, -0.13337326049804688, -0.12545013427734375, -0.11752700805664062, -0.1096038818359375, -0.10168075561523438, -0.09375762939453125, -0.08583450317382812, -0.077911376953125, -0.06998825073242188, -0.06206512451171875, -0.054141998291015625, -0.0462188720703125, -0.038295745849609375, -0.03037261962890625, -0.022449493408203125, -0.0145263671875, -0.006603240966796875, 0.00131988525390625, 0.009243011474609375, 0.0171661376953125, 0.025089263916015625, 0.03301239013671875, 0.040935516357421875, 0.048858642578125, 0.056781768798828125, 0.06470489501953125, 0.07262802124023438, 0.0805511474609375, 0.08847427368164062, 0.09639739990234375, 0.10432052612304688, 0.11224365234375, 0.12016677856445312, 0.12808990478515625, 0.13601303100585938, 0.1439361572265625, 0.15185928344726562, 0.15978240966796875, 0.16770553588867188, 0.175628662109375, 0.18355178833007812, 0.19147491455078125, 0.19939804077148438, 0.2073211669921875, 0.21524429321289062, 0.22316741943359375, 0.23109054565429688, 0.239013671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 10.0, 12.0, 7.0, 25.0, 22.0, 21.0, 10.0, 22.0, 39.0, 32.0, 41.0, 37.0, 48.0, 55.0, 61.0, 58.0, 58.0, 45.0, 44.0, 52.0, 37.0, 40.0, 43.0, 28.0, 28.0, 17.0, 19.0, 17.0, 8.0, 10.0, 12.0, 3.0, 5.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006933212280273438, -0.0006702244281768799, -0.000647127628326416, -0.0006240308284759521, -0.0006009340286254883, -0.0005778372287750244, -0.0005547404289245605, -0.0005316436290740967, -0.0005085468292236328, -0.00048545002937316895, -0.0004623532295227051, -0.0004392564296722412, -0.00041615962982177734, -0.0003930628299713135, -0.0003699660301208496, -0.00034686923027038574, -0.0003237724304199219, -0.000300675630569458, -0.00027757883071899414, -0.0002544820308685303, -0.0002313852310180664, -0.00020828843116760254, -0.00018519163131713867, -0.0001620948314666748, -0.00013899803161621094, -0.00011590123176574707, -9.28044319152832e-05, -6.970763206481934e-05, -4.661083221435547e-05, -2.35140323638916e-05, -4.172325134277344e-07, 2.2679567337036133e-05, 4.57763671875e-05, 6.887316703796387e-05, 9.196996688842773e-05, 0.0001150667667388916, 0.00013816356658935547, 0.00016126036643981934, 0.0001843571662902832, 0.00020745396614074707, 0.00023055076599121094, 0.0002536475658416748, 0.00027674436569213867, 0.00029984116554260254, 0.0003229379653930664, 0.0003460347652435303, 0.00036913156509399414, 0.000392228364944458, 0.0004153251647949219, 0.00043842196464538574, 0.0004615187644958496, 0.0004846155643463135, 0.0005077123641967773, 0.0005308091640472412, 0.0005539059638977051, 0.0005770027637481689, 0.0006000995635986328, 0.0006231963634490967, 0.0006462931632995605, 0.0006693899631500244, 0.0006924867630004883, 0.0007155835628509521, 0.000738680362701416, 0.0007617771625518799, 0.0007848739624023438]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 10.0, 3.0, 9.0, 13.0, 14.0, 20.0, 23.0, 34.0, 40.0, 41.0, 62.0, 90.0, 122.0, 171.0, 248.0, 333.0, 628.0, 1511.0, 63391.0, 964120.0, 14856.0, 1074.0, 547.0, 325.0, 221.0, 130.0, 101.0, 84.0, 39.0, 46.0, 48.0, 44.0, 39.0, 21.0, 15.0, 17.0, 14.0, 10.0, 6.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0139617919921875, -0.013543248176574707, -0.013124704360961914, -0.012706160545349121, -0.012287616729736328, -0.011869072914123535, -0.011450529098510742, -0.01103198528289795, -0.010613441467285156, -0.010194897651672363, -0.00977635383605957, -0.009357810020446777, -0.008939266204833984, -0.008520722389221191, -0.008102178573608398, -0.0076836347579956055, -0.0072650909423828125, -0.0068465471267700195, -0.0064280033111572266, -0.006009459495544434, -0.005590915679931641, -0.005172371864318848, -0.004753828048706055, -0.004335284233093262, -0.003916740417480469, -0.0034981966018676758, -0.003079652786254883, -0.00266110897064209, -0.002242565155029297, -0.001824021339416504, -0.001405477523803711, -0.000986933708190918, -0.000568389892578125, -0.00014984607696533203, 0.00026869773864746094, 0.0006872415542602539, 0.0011057853698730469, 0.0015243291854858398, 0.0019428730010986328, 0.0023614168167114258, 0.0027799606323242188, 0.0031985044479370117, 0.0036170482635498047, 0.004035592079162598, 0.004454135894775391, 0.004872679710388184, 0.0052912235260009766, 0.0057097673416137695, 0.0061283111572265625, 0.0065468549728393555, 0.0069653987884521484, 0.007383942604064941, 0.007802486419677734, 0.008221030235290527, 0.00863957405090332, 0.009058117866516113, 0.009476661682128906, 0.0098952054977417, 0.010313749313354492, 0.010732293128967285, 0.011150836944580078, 0.011569380760192871, 0.011987924575805664, 0.012406468391418457, 0.01282501220703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 67.0, 414.0, 439.0, 85.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00449946615844965, -0.004403896629810333, -0.004308327566832304, -0.0042127580381929874, -0.004117188975214958, -0.004021619446575642, -0.003926050383597612, -0.0038304810877889395, -0.0037349117919802666, -0.0036393424961715937, -0.0035437732003629208, -0.003448203904554248, -0.003352634608745575, -0.003257065312936902, -0.003161496017128229, -0.0030659267213195562, -0.0029703574255108833, -0.0028747881297022104, -0.0027792188338935375, -0.0026836495380848646, -0.0025880802422761917, -0.002492510946467519, -0.002396941650658846, -0.002301372354850173, -0.0022058028262108564, -0.0021102335304021835, -0.0020146642345935106, -0.0019190949387848377, -0.0018235256429761648, -0.001727956347167492, -0.001632387051358819, -0.001536817755550146, -0.001441248576156795, -0.0013456792803481221, -0.0012501099845394492, -0.0011545406887307763, -0.0010589713929221034, -0.0009634020971134305, -0.0008678327430970967, -0.0007722634472884238, -0.0006766941514797509, -0.000581124855671078, -0.00048555555986240506, -0.0003899862349499017, -0.0002944169391412288, -0.0001988476433325559, -0.00010327831842005253, -7.709022611379623e-06, 8.786027319729328e-05, 0.0001834295690059662, 0.0002789988648146391, 0.00037456818972714245, 0.00047013748553581536, 0.0005657067522406578, 0.0006612761062569916, 0.0007568454020656645, 0.0008524146978743374, 0.0009479839936830103, 0.0010435533476993442, 0.001139122643508017, 0.00123469193931669, 0.0013302612351253629, 0.0014258305309340358, 0.0015213998267427087, 0.0016169691225513816]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 9.0, 9.0, 9.0, 9.0, 20.0, 18.0, 22.0, 27.0, 22.0, 21.0, 30.0, 27.0, 27.0, 27.0, 38.0, 43.0, 37.0, 39.0, 25.0, 22.0, 57.0, 42.0, 35.0, 46.0, 45.0, 38.0, 40.0, 25.0, 27.0, 26.0, 19.0, 18.0, 18.0, 15.0, 13.0, 7.0, 15.0, 11.0, 3.0, 6.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00043201446533203125, -0.00041953567415475845, -0.00040705688297748566, -0.00039457809180021286, -0.00038209930062294006, -0.00036962050944566727, -0.00035714171826839447, -0.0003446629270911217, -0.0003321841359138489, -0.0003197053447365761, -0.0003072265535593033, -0.0002947477623820305, -0.0002822689712047577, -0.0002697901800274849, -0.0002573113888502121, -0.0002448325976729393, -0.0002323538064956665, -0.0002198750153183937, -0.0002073962241411209, -0.00019491743296384811, -0.00018243864178657532, -0.00016995985060930252, -0.00015748105943202972, -0.00014500226825475693, -0.00013252347707748413, -0.00012004468590021133, -0.00010756589472293854, -9.508710354566574e-05, -8.260831236839294e-05, -7.012952119112015e-05, -5.765073001384735e-05, -4.5171938836574554e-05, -3.269314765930176e-05, -2.021435648202896e-05, -7.735565304756165e-06, 4.743225872516632e-06, 1.722201704978943e-05, 2.9700808227062225e-05, 4.217959940433502e-05, 5.465839058160782e-05, 6.713718175888062e-05, 7.961597293615341e-05, 9.209476411342621e-05, 0.000104573555290699, 0.0001170523464679718, 0.0001295311376452446, 0.0001420099288225174, 0.0001544887199997902, 0.000166967511177063, 0.00017944630235433578, 0.00019192509353160858, 0.00020440388470888138, 0.00021688267588615417, 0.00022936146706342697, 0.00024184025824069977, 0.00025431904941797256, 0.00026679784059524536, 0.00027927663177251816, 0.00029175542294979095, 0.00030423421412706375, 0.00031671300530433655, 0.00032919179648160934, 0.00034167058765888214, 0.00035414937883615494, 0.00036662817001342773]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 4.0, 12.0, 6.0, 9.0, 8.0, 10.0, 26.0, 19.0, 23.0, 18.0, 22.0, 36.0, 35.0, 25.0, 28.0, 49.0, 42.0, 47.0, 41.0, 48.0, 34.0, 42.0, 39.0, 44.0, 37.0, 33.0, 32.0, 25.0, 28.0, 30.0, 31.0, 23.0, 15.0, 8.0, 19.0, 13.0, 12.0, 7.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.070343017578125, -2.97467041015625, -2.878997802734375, -2.7833251953125, -2.687652587890625, -2.59197998046875, -2.496307373046875, -2.400634765625, -2.304962158203125, -2.20928955078125, -2.113616943359375, -2.0179443359375, -1.922271728515625, -1.82659912109375, -1.730926513671875, -1.63525390625, -1.539581298828125, -1.44390869140625, -1.348236083984375, -1.2525634765625, -1.156890869140625, -1.06121826171875, -0.965545654296875, -0.869873046875, -0.774200439453125, -0.67852783203125, -0.582855224609375, -0.4871826171875, -0.391510009765625, -0.29583740234375, -0.200164794921875, -0.1044921875, -0.008819580078125, 0.08685302734375, 0.182525634765625, 0.2781982421875, 0.373870849609375, 0.46954345703125, 0.565216064453125, 0.660888671875, 0.756561279296875, 0.85223388671875, 0.947906494140625, 1.0435791015625, 1.139251708984375, 1.23492431640625, 1.330596923828125, 1.42626953125, 1.521942138671875, 1.61761474609375, 1.713287353515625, 1.8089599609375, 1.904632568359375, 2.00030517578125, 2.095977783203125, 2.191650390625, 2.287322998046875, 2.38299560546875, 2.478668212890625, 2.5743408203125, 2.670013427734375, 2.76568603515625, 2.861358642578125, 2.95703125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 9.0, 8.0, 15.0, 14.0, 29.0, 43.0, 66.0, 63.0, 92.0, 130.0, 174.0, 212.0, 250.0, 340.0, 483.0, 681.0, 842.0, 1201.0, 1647.0, 2296.0, 3694.0, 8837.0, 45532.0, 387773.0, 508717.0, 61809.0, 10439.0, 4098.0, 2433.0, 1710.0, 1246.0, 933.0, 670.0, 500.0, 400.0, 291.0, 245.0, 165.0, 130.0, 90.0, 80.0, 44.0, 35.0, 26.0, 19.0, 16.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.77850341796875, -6.5531005859375, -6.32769775390625, -6.102294921875, -5.87689208984375, -5.6514892578125, -5.42608642578125, -5.20068359375, -4.97528076171875, -4.7498779296875, -4.52447509765625, -4.299072265625, -4.07366943359375, -3.8482666015625, -3.62286376953125, -3.3974609375, -3.17205810546875, -2.9466552734375, -2.72125244140625, -2.495849609375, -2.27044677734375, -2.0450439453125, -1.81964111328125, -1.59423828125, -1.36883544921875, -1.1434326171875, -0.91802978515625, -0.692626953125, -0.46722412109375, -0.2418212890625, -0.01641845703125, 0.208984375, 0.43438720703125, 0.6597900390625, 0.88519287109375, 1.110595703125, 1.33599853515625, 1.5614013671875, 1.78680419921875, 2.01220703125, 2.23760986328125, 2.4630126953125, 2.68841552734375, 2.913818359375, 3.13922119140625, 3.3646240234375, 3.59002685546875, 3.8154296875, 4.04083251953125, 4.2662353515625, 4.49163818359375, 4.717041015625, 4.94244384765625, 5.1678466796875, 5.39324951171875, 5.61865234375, 5.84405517578125, 6.0694580078125, 6.29486083984375, 6.520263671875, 6.74566650390625, 6.9710693359375, 7.19647216796875, 7.421875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 5.0, 4.0, 6.0, 6.0, 11.0, 15.0, 11.0, 14.0, 20.0, 24.0, 38.0, 41.0, 50.0, 51.0, 68.0, 99.0, 238.0, 1587.0, 284.0, 107.0, 52.0, 54.0, 49.0, 40.0, 34.0, 22.0, 19.0, 17.0, 21.0, 14.0, 12.0, 7.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.087158203125, -8.79931640625, -8.511474609375, -8.2236328125, -7.935791015625, -7.64794921875, -7.360107421875, -7.072265625, -6.784423828125, -6.49658203125, -6.208740234375, -5.9208984375, -5.633056640625, -5.34521484375, -5.057373046875, -4.76953125, -4.481689453125, -4.19384765625, -3.906005859375, -3.6181640625, -3.330322265625, -3.04248046875, -2.754638671875, -2.466796875, -2.178955078125, -1.89111328125, -1.603271484375, -1.3154296875, -1.027587890625, -0.73974609375, -0.451904296875, -0.1640625, 0.123779296875, 0.41162109375, 0.699462890625, 0.9873046875, 1.275146484375, 1.56298828125, 1.850830078125, 2.138671875, 2.426513671875, 2.71435546875, 3.002197265625, 3.2900390625, 3.577880859375, 3.86572265625, 4.153564453125, 4.44140625, 4.729248046875, 5.01708984375, 5.304931640625, 5.5927734375, 5.880615234375, 6.16845703125, 6.456298828125, 6.744140625, 7.031982421875, 7.31982421875, 7.607666015625, 7.8955078125, 8.183349609375, 8.47119140625, 8.759033203125, 9.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 9.0, 7.0, 10.0, 21.0, 15.0, 25.0, 29.0, 31.0, 56.0, 83.0, 138.0, 216.0, 394.0, 754.0, 2031.0, 820805.0, 2317077.0, 2150.0, 781.0, 354.0, 258.0, 139.0, 97.0, 55.0, 48.0, 34.0, 20.0, 22.0, 13.0, 6.0, 3.0, 7.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.5, -35.2841796875, -34.068359375, -32.8525390625, -31.63671875, -30.4208984375, -29.205078125, -27.9892578125, -26.7734375, -25.5576171875, -24.341796875, -23.1259765625, -21.91015625, -20.6943359375, -19.478515625, -18.2626953125, -17.046875, -15.8310546875, -14.615234375, -13.3994140625, -12.18359375, -10.9677734375, -9.751953125, -8.5361328125, -7.3203125, -6.1044921875, -4.888671875, -3.6728515625, -2.45703125, -1.2412109375, -0.025390625, 1.1904296875, 2.40625, 3.6220703125, 4.837890625, 6.0537109375, 7.26953125, 8.4853515625, 9.701171875, 10.9169921875, 12.1328125, 13.3486328125, 14.564453125, 15.7802734375, 16.99609375, 18.2119140625, 19.427734375, 20.6435546875, 21.859375, 23.0751953125, 24.291015625, 25.5068359375, 26.72265625, 27.9384765625, 29.154296875, 30.3701171875, 31.5859375, 32.8017578125, 34.017578125, 35.2333984375, 36.44921875, 37.6650390625, 38.880859375, 40.0966796875, 41.3125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 72.0, 305.0, 431.0, 166.0, 27.0, 6.0, 0.0, 0.0, 1.0], "bins": [-120.43241119384766, -118.32765197753906, -116.22289276123047, -114.11813354492188, -112.01338195800781, -109.90862274169922, -107.80386352539062, -105.69910430908203, -103.59434509277344, -101.48958587646484, -99.38482666015625, -97.28006744384766, -95.17530822753906, -93.070556640625, -90.9657974243164, -88.86103820800781, -86.75627899169922, -84.65151977539062, -82.54676055908203, -80.44200134277344, -78.33724975585938, -76.23249053955078, -74.12773132324219, -72.0229721069336, -69.918212890625, -67.8134536743164, -65.70869445800781, -63.603939056396484, -61.49917984008789, -59.3944206237793, -57.28966522216797, -55.184906005859375, -53.08014678955078, -50.97538757324219, -48.870628356933594, -46.765872955322266, -44.66111373901367, -42.55635452270508, -40.45159912109375, -38.346839904785156, -36.24208068847656, -34.13732147216797, -32.032562255859375, -29.927806854248047, -27.823047637939453, -25.71828842163086, -23.6135311126709, -21.508773803710938, -19.404014587402344, -17.29925537109375, -15.194498062133789, -13.089739799499512, -10.984981536865234, -8.880223274230957, -6.77546501159668, -4.670706748962402, -2.565948486328125, -0.46119022369384766, 1.6435680389404297, 3.748326301574707, 5.853084564208984, 7.957842826843262, 10.062601089477539, 12.167359352111816, 14.272117614746094]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 12.0, 6.0, 9.0, 15.0, 14.0, 22.0, 15.0, 29.0, 33.0, 37.0, 34.0, 33.0, 31.0, 35.0, 46.0, 38.0, 41.0, 40.0, 51.0, 55.0, 44.0, 41.0, 37.0, 39.0, 37.0, 35.0, 29.0, 25.0, 19.0, 14.0, 13.0, 11.0, 10.0, 7.0, 10.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.10478591918945, -31.19209861755371, -30.27941131591797, -29.366724014282227, -28.454036712646484, -27.541349411010742, -26.628662109375, -25.715974807739258, -24.803287506103516, -23.890600204467773, -22.97791290283203, -22.06522560119629, -21.152538299560547, -20.239850997924805, -19.327163696289062, -18.41447639465332, -17.501789093017578, -16.589101791381836, -15.676414489746094, -14.763727188110352, -13.85103988647461, -12.938352584838867, -12.025665283203125, -11.112977981567383, -10.20029067993164, -9.287603378295898, -8.374916076660156, -7.462228775024414, -6.549541473388672, -5.63685417175293, -4.7241668701171875, -3.8114795684814453, -2.8987903594970703, -1.9861030578613281, -1.073415756225586, -0.16072845458984375, 0.7519588470458984, 1.6646461486816406, 2.577333450317383, 3.490020751953125, 4.402708053588867, 5.315395355224609, 6.228082656860352, 7.140769958496094, 8.053457260131836, 8.966144561767578, 9.87883186340332, 10.791519165039062, 11.704206466674805, 12.616893768310547, 13.529581069946289, 14.442268371582031, 15.354955673217773, 16.267642974853516, 17.180330276489258, 18.093017578125, 19.005704879760742, 19.918392181396484, 20.831079483032227, 21.74376678466797, 22.65645408630371, 23.569141387939453, 24.481828689575195, 25.394515991210938, 26.30720329284668]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 3.0, 6.0, 13.0, 10.0, 11.0, 11.0, 12.0, 20.0, 23.0, 26.0, 36.0, 29.0, 37.0, 38.0, 30.0, 28.0, 43.0, 41.0, 43.0, 44.0, 40.0, 39.0, 56.0, 38.0, 45.0, 29.0, 33.0, 33.0, 14.0, 22.0, 26.0, 14.0, 23.0, 16.0, 18.0, 10.0, 7.0, 5.0, 7.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.25390625, -3.153961181640625, -3.05401611328125, -2.954071044921875, -2.8541259765625, -2.754180908203125, -2.65423583984375, -2.554290771484375, -2.454345703125, -2.354400634765625, -2.25445556640625, -2.154510498046875, -2.0545654296875, -1.954620361328125, -1.85467529296875, -1.754730224609375, -1.65478515625, -1.554840087890625, -1.45489501953125, -1.354949951171875, -1.2550048828125, -1.155059814453125, -1.05511474609375, -0.955169677734375, -0.855224609375, -0.755279541015625, -0.65533447265625, -0.555389404296875, -0.4554443359375, -0.355499267578125, -0.25555419921875, -0.155609130859375, -0.0556640625, 0.044281005859375, 0.14422607421875, 0.244171142578125, 0.3441162109375, 0.444061279296875, 0.54400634765625, 0.643951416015625, 0.743896484375, 0.843841552734375, 0.94378662109375, 1.043731689453125, 1.1436767578125, 1.243621826171875, 1.34356689453125, 1.443511962890625, 1.54345703125, 1.643402099609375, 1.74334716796875, 1.843292236328125, 1.9432373046875, 2.043182373046875, 2.14312744140625, 2.243072509765625, 2.343017578125, 2.442962646484375, 2.54290771484375, 2.642852783203125, 2.7427978515625, 2.842742919921875, 2.94268798828125, 3.042633056640625, 3.142578125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 12.0, 7.0, 13.0, 15.0, 19.0, 22.0, 31.0, 38.0, 43.0, 61.0, 112.0, 199.0, 438.0, 1078.0, 2922.0, 10808.0, 61792.0, 696221.0, 2644549.0, 698375.0, 61755.0, 10729.0, 2979.0, 1087.0, 389.0, 208.0, 92.0, 69.0, 50.0, 39.0, 28.0, 19.0, 18.0, 16.0, 9.0, 9.0, 6.0, 9.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.00054931640625, -5.7823486328125, -5.56414794921875, -5.345947265625, -5.12774658203125, -4.9095458984375, -4.69134521484375, -4.47314453125, -4.25494384765625, -4.0367431640625, -3.81854248046875, -3.600341796875, -3.38214111328125, -3.1639404296875, -2.94573974609375, -2.7275390625, -2.50933837890625, -2.2911376953125, -2.07293701171875, -1.854736328125, -1.63653564453125, -1.4183349609375, -1.20013427734375, -0.98193359375, -0.76373291015625, -0.5455322265625, -0.32733154296875, -0.109130859375, 0.10906982421875, 0.3272705078125, 0.54547119140625, 0.763671875, 0.98187255859375, 1.2000732421875, 1.41827392578125, 1.636474609375, 1.85467529296875, 2.0728759765625, 2.29107666015625, 2.50927734375, 2.72747802734375, 2.9456787109375, 3.16387939453125, 3.382080078125, 3.60028076171875, 3.8184814453125, 4.03668212890625, 4.2548828125, 4.47308349609375, 4.6912841796875, 4.90948486328125, 5.127685546875, 5.34588623046875, 5.5640869140625, 5.78228759765625, 6.00048828125, 6.21868896484375, 6.4368896484375, 6.65509033203125, 6.873291015625, 7.09149169921875, 7.3096923828125, 7.52789306640625, 7.74609375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 12.0, 40.0, 152.0, 729.0, 2027.0, 885.0, 185.0, 41.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.09375, -29.22412109375, -28.3544921875, -27.48486328125, -26.615234375, -25.74560546875, -24.8759765625, -24.00634765625, -23.13671875, -22.26708984375, -21.3974609375, -20.52783203125, -19.658203125, -18.78857421875, -17.9189453125, -17.04931640625, -16.1796875, -15.31005859375, -14.4404296875, -13.57080078125, -12.701171875, -11.83154296875, -10.9619140625, -10.09228515625, -9.22265625, -8.35302734375, -7.4833984375, -6.61376953125, -5.744140625, -4.87451171875, -4.0048828125, -3.13525390625, -2.265625, -1.39599609375, -0.5263671875, 0.34326171875, 1.212890625, 2.08251953125, 2.9521484375, 3.82177734375, 4.69140625, 5.56103515625, 6.4306640625, 7.30029296875, 8.169921875, 9.03955078125, 9.9091796875, 10.77880859375, 11.6484375, 12.51806640625, 13.3876953125, 14.25732421875, 15.126953125, 15.99658203125, 16.8662109375, 17.73583984375, 18.60546875, 19.47509765625, 20.3447265625, 21.21435546875, 22.083984375, 22.95361328125, 23.8232421875, 24.69287109375, 25.5625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 16.0, 75.0, 363.0, 3181.0, 4182570.0, 7304.0, 585.0, 127.0, 33.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90625, -53.05126953125, -51.1962890625, -49.34130859375, -47.486328125, -45.63134765625, -43.7763671875, -41.92138671875, -40.06640625, -38.21142578125, -36.3564453125, -34.50146484375, -32.646484375, -30.79150390625, -28.9365234375, -27.08154296875, -25.2265625, -23.37158203125, -21.5166015625, -19.66162109375, -17.806640625, -15.95166015625, -14.0966796875, -12.24169921875, -10.38671875, -8.53173828125, -6.6767578125, -4.82177734375, -2.966796875, -1.11181640625, 0.7431640625, 2.59814453125, 4.453125, 6.30810546875, 8.1630859375, 10.01806640625, 11.873046875, 13.72802734375, 15.5830078125, 17.43798828125, 19.29296875, 21.14794921875, 23.0029296875, 24.85791015625, 26.712890625, 28.56787109375, 30.4228515625, 32.27783203125, 34.1328125, 35.98779296875, 37.8427734375, 39.69775390625, 41.552734375, 43.40771484375, 45.2626953125, 47.11767578125, 48.97265625, 50.82763671875, 52.6826171875, 54.53759765625, 56.392578125, 58.24755859375, 60.1025390625, 61.95751953125, 63.8125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 136.0, 744.0, 124.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.8914794921875, -150.60498046875, -145.3184814453125, -140.031982421875, -134.7454833984375, -129.45899963378906, -124.17250061035156, -118.88600158691406, -113.59950256347656, -108.31300354003906, -103.02650451660156, -97.7400131225586, -92.4535140991211, -87.1670150756836, -81.88052368164062, -76.59402465820312, -71.30752563476562, -66.02102661132812, -60.73453140258789, -55.448036193847656, -50.161537170410156, -44.875038146972656, -39.58854293823242, -34.30204772949219, -29.015548706054688, -23.72905158996582, -18.442554473876953, -13.156057357788086, -7.869560241699219, -2.5830631256103516, 2.7034339904785156, 7.98992919921875, 13.27642822265625, 18.562925338745117, 23.849422454833984, 29.13591957092285, 34.42241668701172, 39.70891571044922, 44.99541091918945, 50.28190612792969, 55.56840515136719, 60.85490417480469, 66.14140319824219, 71.42789459228516, 76.71439361572266, 82.00089263916016, 87.28738403320312, 92.57388305664062, 97.86038208007812, 103.14688110351562, 108.43338012695312, 113.7198715209961, 119.0063705444336, 124.2928695678711, 129.57936096191406, 134.86585998535156, 140.15235900878906, 145.43885803222656, 150.72535705566406, 156.01185607910156, 161.29833984375, 166.5848388671875, 171.871337890625, 177.1578369140625, 182.4443359375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 4.0, 9.0, 4.0, 14.0, 12.0, 12.0, 15.0, 10.0, 24.0, 26.0, 29.0, 28.0, 33.0, 31.0, 36.0, 37.0, 41.0, 32.0, 35.0, 26.0, 37.0, 44.0, 33.0, 37.0, 31.0, 35.0, 29.0, 36.0, 33.0, 33.0, 29.0, 21.0, 22.0, 19.0, 15.0, 13.0, 14.0, 13.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.217395782470703, -25.44339942932129, -24.669403076171875, -23.89540672302246, -23.121410369873047, -22.347414016723633, -21.57341766357422, -20.799423217773438, -20.02542495727539, -19.251428604125977, -18.477432250976562, -17.70343589782715, -16.929439544677734, -16.15544319152832, -15.381447792053223, -14.607451438903809, -13.833456039428711, -13.059459686279297, -12.285463333129883, -11.511466979980469, -10.737470626831055, -9.96347427368164, -9.189478874206543, -8.415482521057129, -7.641486167907715, -6.867489814758301, -6.093493461608887, -5.319497585296631, -4.545501232147217, -3.7715048789978027, -2.997509002685547, -2.223512649536133, -1.4495162963867188, -0.6755200624465942, 0.09847617149353027, 0.8724722862243652, 1.6464686393737793, 2.4204649925231934, 3.194460868835449, 3.9684572219848633, 4.742453575134277, 5.516449928283691, 6.2904462814331055, 7.064442157745361, 7.838438510894775, 8.612434387207031, 9.386430740356445, 10.16042709350586, 10.934423446655273, 11.708419799804688, 12.482416152954102, 13.256412506103516, 14.03040885925293, 14.804405212402344, 15.578400611877441, 16.352397918701172, 17.126392364501953, 17.900388717651367, 18.67438507080078, 19.448381423950195, 20.22237777709961, 20.996374130249023, 21.770370483398438, 22.54436492919922, 23.318363189697266]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 12.0, 12.0, 17.0, 13.0, 12.0, 20.0, 23.0, 28.0, 29.0, 31.0, 29.0, 37.0, 24.0, 33.0, 35.0, 36.0, 38.0, 33.0, 41.0, 46.0, 34.0, 37.0, 39.0, 31.0, 23.0, 21.0, 24.0, 37.0, 34.0, 26.0, 7.0, 18.0, 13.0, 10.0, 12.0, 14.0, 7.0, 12.0, 8.0, 2.0, 2.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.34765625, -2.276611328125, -2.20556640625, -2.134521484375, -2.0634765625, -1.992431640625, -1.92138671875, -1.850341796875, -1.779296875, -1.708251953125, -1.63720703125, -1.566162109375, -1.4951171875, -1.424072265625, -1.35302734375, -1.281982421875, -1.2109375, -1.139892578125, -1.06884765625, -0.997802734375, -0.9267578125, -0.855712890625, -0.78466796875, -0.713623046875, -0.642578125, -0.571533203125, -0.50048828125, -0.429443359375, -0.3583984375, -0.287353515625, -0.21630859375, -0.145263671875, -0.07421875, -0.003173828125, 0.06787109375, 0.138916015625, 0.2099609375, 0.281005859375, 0.35205078125, 0.423095703125, 0.494140625, 0.565185546875, 0.63623046875, 0.707275390625, 0.7783203125, 0.849365234375, 0.92041015625, 0.991455078125, 1.0625, 1.133544921875, 1.20458984375, 1.275634765625, 1.3466796875, 1.417724609375, 1.48876953125, 1.559814453125, 1.630859375, 1.701904296875, 1.77294921875, 1.843994140625, 1.9150390625, 1.986083984375, 2.05712890625, 2.128173828125, 2.19921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 15.0, 15.0, 23.0, 22.0, 48.0, 72.0, 108.0, 156.0, 213.0, 278.0, 443.0, 671.0, 1058.0, 1590.0, 2470.0, 3678.0, 6026.0, 9630.0, 15368.0, 25115.0, 42682.0, 73262.0, 134325.0, 233265.0, 214310.0, 119066.0, 65467.0, 38050.0, 22920.0, 14013.0, 8654.0, 5551.0, 3384.0, 2251.0, 1455.0, 933.0, 638.0, 405.0, 276.0, 184.0, 143.0, 103.0, 60.0, 45.0, 32.0, 19.0, 14.0, 15.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.275390625, -0.2667579650878906, -0.25812530517578125, -0.24949264526367188, -0.2408599853515625, -0.23222732543945312, -0.22359466552734375, -0.21496200561523438, -0.206329345703125, -0.19769668579101562, -0.18906402587890625, -0.18043136596679688, -0.1717987060546875, -0.16316604614257812, -0.15453338623046875, -0.14590072631835938, -0.13726806640625, -0.12863540649414062, -0.12000274658203125, -0.11137008666992188, -0.1027374267578125, -0.09410476684570312, -0.08547210693359375, -0.07683944702148438, -0.068206787109375, -0.059574127197265625, -0.05094146728515625, -0.042308807373046875, -0.0336761474609375, -0.025043487548828125, -0.01641082763671875, -0.007778167724609375, 0.0008544921875, 0.009487152099609375, 0.01811981201171875, 0.026752471923828125, 0.0353851318359375, 0.044017791748046875, 0.05265045166015625, 0.061283111572265625, 0.069915771484375, 0.07854843139648438, 0.08718109130859375, 0.09581375122070312, 0.1044464111328125, 0.11307907104492188, 0.12171173095703125, 0.13034439086914062, 0.13897705078125, 0.14760971069335938, 0.15624237060546875, 0.16487503051757812, 0.1735076904296875, 0.18214035034179688, 0.19077301025390625, 0.19940567016601562, 0.208038330078125, 0.21667098999023438, 0.22530364990234375, 0.23393630981445312, 0.2425689697265625, 0.2512016296386719, 0.25983428955078125, 0.2684669494628906, 0.277099609375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 7.0, 7.0, 12.0, 10.0, 15.0, 15.0, 17.0, 20.0, 27.0, 40.0, 31.0, 35.0, 36.0, 49.0, 34.0, 39.0, 47.0, 42.0, 1071.0, 36.0, 55.0, 38.0, 31.0, 29.0, 28.0, 26.0, 32.0, 35.0, 23.0, 22.0, 22.0, 16.0, 11.0, 13.0, 11.0, 12.0, 3.0, 4.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.5439453125, -1.4933319091796875, -1.442718505859375, -1.3921051025390625, -1.34149169921875, -1.2908782958984375, -1.240264892578125, -1.1896514892578125, -1.1390380859375, -1.0884246826171875, -1.037811279296875, -0.9871978759765625, -0.93658447265625, -0.8859710693359375, -0.835357666015625, -0.7847442626953125, -0.734130859375, -0.6835174560546875, -0.632904052734375, -0.5822906494140625, -0.53167724609375, -0.4810638427734375, -0.430450439453125, -0.3798370361328125, -0.3292236328125, -0.2786102294921875, -0.227996826171875, -0.1773834228515625, -0.12677001953125, -0.0761566162109375, -0.025543212890625, 0.0250701904296875, 0.07568359375, 0.1262969970703125, 0.176910400390625, 0.2275238037109375, 0.27813720703125, 0.3287506103515625, 0.379364013671875, 0.4299774169921875, 0.4805908203125, 0.5312042236328125, 0.581817626953125, 0.6324310302734375, 0.68304443359375, 0.7336578369140625, 0.784271240234375, 0.8348846435546875, 0.885498046875, 0.9361114501953125, 0.986724853515625, 1.0373382568359375, 1.08795166015625, 1.1385650634765625, 1.189178466796875, 1.2397918701171875, 1.2904052734375, 1.3410186767578125, 1.391632080078125, 1.4422454833984375, 1.49285888671875, 1.5434722900390625, 1.594085693359375, 1.6446990966796875, 1.6953125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 13.0, 19.0, 22.0, 37.0, 52.0, 65.0, 83.0, 111.0, 178.0, 231.0, 336.0, 445.0, 617.0, 889.0, 1342.0, 1799.0, 2677.0, 3773.0, 5631.0, 8404.0, 12809.0, 19608.0, 30621.0, 49383.0, 84766.0, 150579.0, 1274441.0, 181292.0, 102946.0, 59463.0, 35974.0, 22865.0, 14825.0, 9784.0, 6523.0, 4431.0, 3082.0, 2096.0, 1432.0, 1010.0, 729.0, 511.0, 345.0, 261.0, 170.0, 136.0, 90.0, 76.0, 59.0, 30.0, 23.0, 17.0, 8.0, 10.0, 9.0, 3.0, 1.0, 1.0], "bins": [-0.2216796875, -0.21489524841308594, -0.20811080932617188, -0.2013263702392578, -0.19454193115234375, -0.1877574920654297, -0.18097305297851562, -0.17418861389160156, -0.1674041748046875, -0.16061973571777344, -0.15383529663085938, -0.1470508575439453, -0.14026641845703125, -0.1334819793701172, -0.12669754028320312, -0.11991310119628906, -0.113128662109375, -0.10634422302246094, -0.09955978393554688, -0.09277534484863281, -0.08599090576171875, -0.07920646667480469, -0.07242202758789062, -0.06563758850097656, -0.0588531494140625, -0.05206871032714844, -0.045284271240234375, -0.03849983215332031, -0.03171539306640625, -0.024930953979492188, -0.018146514892578125, -0.011362075805664062, -0.00457763671875, 0.0022068023681640625, 0.008991241455078125, 0.015775680541992188, 0.02256011962890625, 0.029344558715820312, 0.036128997802734375, 0.04291343688964844, 0.0496978759765625, 0.05648231506347656, 0.06326675415039062, 0.07005119323730469, 0.07683563232421875, 0.08362007141113281, 0.09040451049804688, 0.09718894958496094, 0.103973388671875, 0.11075782775878906, 0.11754226684570312, 0.12432670593261719, 0.13111114501953125, 0.1378955841064453, 0.14468002319335938, 0.15146446228027344, 0.1582489013671875, 0.16503334045410156, 0.17181777954101562, 0.1786022186279297, 0.18538665771484375, 0.1921710968017578, 0.19895553588867188, 0.20573997497558594, 0.2125244140625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 7.0, 7.0, 5.0, 16.0, 13.0, 22.0, 21.0, 37.0, 33.0, 54.0, 46.0, 68.0, 54.0, 84.0, 77.0, 63.0, 67.0, 58.0, 49.0, 37.0, 33.0, 27.0, 15.0, 14.0, 9.0, 8.0, 16.0, 5.0, 4.0, 5.0, 9.0, 5.0, 8.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.001110076904296875, -0.0010782405734062195, -0.001046404242515564, -0.0010145679116249084, -0.000982731580734253, -0.0009508952498435974, -0.0009190589189529419, -0.0008872225880622864, -0.0008553862571716309, -0.0008235499262809753, -0.0007917135953903198, -0.0007598772644996643, -0.0007280409336090088, -0.0006962046027183533, -0.0006643682718276978, -0.0006325319409370422, -0.0006006956100463867, -0.0005688592791557312, -0.0005370229482650757, -0.0005051866173744202, -0.00047335028648376465, -0.00044151395559310913, -0.0004096776247024536, -0.0003778412938117981, -0.0003460049629211426, -0.00031416863203048706, -0.00028233230113983154, -0.000250495970249176, -0.0002186596393585205, -0.000186823308467865, -0.00015498697757720947, -0.00012315064668655396, -9.131431579589844e-05, -5.947798490524292e-05, -2.7641654014587402e-05, 4.194676876068115e-06, 3.603100776672363e-05, 6.786733865737915e-05, 9.970366954803467e-05, 0.00013154000043869019, 0.0001633763313293457, 0.00019521266222000122, 0.00022704899311065674, 0.00025888532400131226, 0.0002907216548919678, 0.0003225579857826233, 0.0003543943166732788, 0.0003862306475639343, 0.00041806697845458984, 0.00044990330934524536, 0.0004817396402359009, 0.0005135759711265564, 0.0005454123020172119, 0.0005772486329078674, 0.000609084963798523, 0.0006409212946891785, 0.000672757625579834, 0.0007045939564704895, 0.000736430287361145, 0.0007682666182518005, 0.0008001029491424561, 0.0008319392800331116, 0.0008637756109237671, 0.0008956119418144226, 0.0009274482727050781]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 5.0, 6.0, 9.0, 14.0, 19.0, 12.0, 21.0, 18.0, 34.0, 34.0, 52.0, 66.0, 95.0, 157.0, 224.0, 379.0, 622.0, 1378.0, 189381.0, 852457.0, 1673.0, 694.0, 395.0, 231.0, 155.0, 110.0, 69.0, 51.0, 44.0, 29.0, 24.0, 15.0, 14.0, 13.0, 12.0, 7.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0165863037109375, -0.016016244888305664, -0.015446186065673828, -0.014876127243041992, -0.014306068420410156, -0.01373600959777832, -0.013165950775146484, -0.012595891952514648, -0.012025833129882812, -0.011455774307250977, -0.01088571548461914, -0.010315656661987305, -0.009745597839355469, -0.009175539016723633, -0.008605480194091797, -0.008035421371459961, -0.007465362548828125, -0.006895303726196289, -0.006325244903564453, -0.005755186080932617, -0.005185127258300781, -0.004615068435668945, -0.004045009613037109, -0.0034749507904052734, -0.0029048919677734375, -0.0023348331451416016, -0.0017647743225097656, -0.0011947154998779297, -0.0006246566772460938, -5.459785461425781e-05, 0.0005154609680175781, 0.001085519790649414, 0.00165557861328125, 0.002225637435913086, 0.002795696258544922, 0.003365755081176758, 0.003935813903808594, 0.00450587272644043, 0.005075931549072266, 0.0056459903717041016, 0.0062160491943359375, 0.0067861080169677734, 0.007356166839599609, 0.007926225662231445, 0.008496284484863281, 0.009066343307495117, 0.009636402130126953, 0.010206460952758789, 0.010776519775390625, 0.011346578598022461, 0.011916637420654297, 0.012486696243286133, 0.013056755065917969, 0.013626813888549805, 0.01419687271118164, 0.014766931533813477, 0.015336990356445312, 0.01590704917907715, 0.016477108001708984, 0.01704716682434082, 0.017617225646972656, 0.018187284469604492, 0.018757343292236328, 0.019327402114868164, 0.0198974609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 11.0, 566.0, 432.0, 3.0, 1.0], "bins": [-0.00776103138923645, -0.007633655332028866, -0.007506279740482569, -0.007378903683274984, -0.007251528091728687, -0.007124152034521103, -0.006996776442974806, -0.0068694003857672215, -0.006742024794220924, -0.00661464873701334, -0.006487273145467043, -0.0063598970882594585, -0.0062325214967131615, -0.006105145439505577, -0.00597776984795928, -0.005850393790751696, -0.005723017733544111, -0.005595641676336527, -0.00546826608479023, -0.005340890027582645, -0.005213514436036348, -0.005086138378828764, -0.004958762787282467, -0.0048313867300748825, -0.004704010672867298, -0.004576634615659714, -0.004449259024113417, -0.004321882966905832, -0.004194507375359535, -0.004067131318151951, -0.003939755726605654, -0.0038123796693980694, -0.0036850038450211287, -0.003557628020644188, -0.003430252196267247, -0.0033028763718903065, -0.003175500314682722, -0.003048124723136425, -0.0029207486659288406, -0.0027933728415519, -0.002665997017174959, -0.0025386211927980185, -0.0024112453684210777, -0.002283869544044137, -0.0021564937196671963, -0.002029117662459612, -0.0019017418380826712, -0.0017743660137057304, -0.0016469901893287897, -0.001519614364951849, -0.0013922385405749083, -0.0012648625997826457, -0.001137486775405705, -0.0010101109510287642, -0.0008827350684441626, -0.000755359185859561, -0.0006279833614826202, -0.0005006075371056795, -0.00037323165452107787, -0.0002458558010403067, -0.0001184799475595355, 8.895876817405224e-06, 0.00013627175940200686, 0.0002636476419866085, 0.00039102346636354923]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 15.0, 11.0, 11.0, 17.0, 21.0, 20.0, 20.0, 29.0, 36.0, 41.0, 38.0, 44.0, 61.0, 48.0, 44.0, 53.0, 54.0, 51.0, 38.0, 49.0, 34.0, 43.0, 34.0, 29.0, 36.0, 23.0, 12.0, 21.0, 15.0, 13.0, 9.0, 11.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005265474319458008, -0.0005075614899396896, -0.0004885755479335785, -0.00046958960592746735, -0.0004506036639213562, -0.00043161772191524506, -0.0004126317799091339, -0.00039364583790302277, -0.0003746598958969116, -0.0003556739538908005, -0.00033668801188468933, -0.0003177020698785782, -0.00029871612787246704, -0.0002797301858663559, -0.00026074424386024475, -0.0002417583018541336, -0.00022277235984802246, -0.00020378641784191132, -0.00018480047583580017, -0.00016581453382968903, -0.00014682859182357788, -0.00012784264981746674, -0.00010885670781135559, -8.987076580524445e-05, -7.08848237991333e-05, -5.1898881793022156e-05, -3.291293978691101e-05, -1.3926997780799866e-05, 5.058944225311279e-06, 2.4044886231422424e-05, 4.303082823753357e-05, 6.201677024364471e-05, 8.100271224975586e-05, 9.9988654255867e-05, 0.00011897459626197815, 0.0001379605382680893, 0.00015694648027420044, 0.00017593242228031158, 0.00019491836428642273, 0.00021390430629253387, 0.00023289024829864502, 0.00025187619030475616, 0.0002708621323108673, 0.00028984807431697845, 0.0003088340163230896, 0.00032781995832920074, 0.0003468059003353119, 0.00036579184234142303, 0.0003847777843475342, 0.0004037637263536453, 0.00042274966835975647, 0.0004417356103658676, 0.00046072155237197876, 0.0004797074943780899, 0.000498693436384201, 0.0005176793783903122, 0.0005366653203964233, 0.0005556512624025345, 0.0005746372044086456, 0.0005936231464147568, 0.0006126090884208679, 0.0006315950304269791, 0.0006505809724330902, 0.0006695669144392014, 0.0006885528564453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 12.0, 12.0, 17.0, 13.0, 12.0, 20.0, 23.0, 28.0, 29.0, 31.0, 29.0, 37.0, 24.0, 33.0, 35.0, 36.0, 38.0, 33.0, 41.0, 46.0, 34.0, 37.0, 39.0, 31.0, 23.0, 21.0, 24.0, 37.0, 34.0, 26.0, 7.0, 18.0, 13.0, 10.0, 12.0, 14.0, 7.0, 12.0, 8.0, 2.0, 2.0, 7.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0], "bins": [-2.34765625, -2.276611328125, -2.20556640625, -2.134521484375, -2.0634765625, -1.992431640625, -1.92138671875, -1.850341796875, -1.779296875, -1.708251953125, -1.63720703125, -1.566162109375, -1.4951171875, -1.424072265625, -1.35302734375, -1.281982421875, -1.2109375, -1.139892578125, -1.06884765625, -0.997802734375, -0.9267578125, -0.855712890625, -0.78466796875, -0.713623046875, -0.642578125, -0.571533203125, -0.50048828125, -0.429443359375, -0.3583984375, -0.287353515625, -0.21630859375, -0.145263671875, -0.07421875, -0.003173828125, 0.06787109375, 0.138916015625, 0.2099609375, 0.281005859375, 0.35205078125, 0.423095703125, 0.494140625, 0.565185546875, 0.63623046875, 0.707275390625, 0.7783203125, 0.849365234375, 0.92041015625, 0.991455078125, 1.0625, 1.133544921875, 1.20458984375, 1.275634765625, 1.3466796875, 1.417724609375, 1.48876953125, 1.559814453125, 1.630859375, 1.701904296875, 1.77294921875, 1.843994140625, 1.9150390625, 1.986083984375, 2.05712890625, 2.128173828125, 2.19921875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 12.0, 8.0, 14.0, 25.0, 16.0, 30.0, 39.0, 35.0, 65.0, 71.0, 81.0, 109.0, 174.0, 225.0, 271.0, 351.0, 533.0, 788.0, 1217.0, 2162.0, 4254.0, 9867.0, 32235.0, 176459.0, 598119.0, 170229.0, 31165.0, 9658.0, 4152.0, 2126.0, 1174.0, 812.0, 527.0, 382.0, 312.0, 186.0, 154.0, 114.0, 84.0, 71.0, 59.0, 40.0, 38.0, 24.0, 20.0, 22.0, 13.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-4.2734375, -4.14190673828125, -4.0103759765625, -3.87884521484375, -3.747314453125, -3.61578369140625, -3.4842529296875, -3.35272216796875, -3.22119140625, -3.08966064453125, -2.9581298828125, -2.82659912109375, -2.695068359375, -2.56353759765625, -2.4320068359375, -2.30047607421875, -2.1689453125, -2.03741455078125, -1.9058837890625, -1.77435302734375, -1.642822265625, -1.51129150390625, -1.3797607421875, -1.24822998046875, -1.11669921875, -0.98516845703125, -0.8536376953125, -0.72210693359375, -0.590576171875, -0.45904541015625, -0.3275146484375, -0.19598388671875, -0.064453125, 0.06707763671875, 0.1986083984375, 0.33013916015625, 0.461669921875, 0.59320068359375, 0.7247314453125, 0.85626220703125, 0.98779296875, 1.11932373046875, 1.2508544921875, 1.38238525390625, 1.513916015625, 1.64544677734375, 1.7769775390625, 1.90850830078125, 2.0400390625, 2.17156982421875, 2.3031005859375, 2.43463134765625, 2.566162109375, 2.69769287109375, 2.8292236328125, 2.96075439453125, 3.09228515625, 3.22381591796875, 3.3553466796875, 3.48687744140625, 3.618408203125, 3.74993896484375, 3.8814697265625, 4.01300048828125, 4.14453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 3.0, 11.0, 10.0, 10.0, 11.0, 14.0, 20.0, 20.0, 31.0, 33.0, 34.0, 39.0, 54.0, 62.0, 88.0, 192.0, 1546.0, 320.0, 140.0, 77.0, 60.0, 45.0, 43.0, 31.0, 28.0, 25.0, 15.0, 10.0, 16.0, 11.0, 6.0, 8.0, 6.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-9.3828125, -9.113037109375, -8.84326171875, -8.573486328125, -8.3037109375, -8.033935546875, -7.76416015625, -7.494384765625, -7.224609375, -6.954833984375, -6.68505859375, -6.415283203125, -6.1455078125, -5.875732421875, -5.60595703125, -5.336181640625, -5.06640625, -4.796630859375, -4.52685546875, -4.257080078125, -3.9873046875, -3.717529296875, -3.44775390625, -3.177978515625, -2.908203125, -2.638427734375, -2.36865234375, -2.098876953125, -1.8291015625, -1.559326171875, -1.28955078125, -1.019775390625, -0.75, -0.480224609375, -0.21044921875, 0.059326171875, 0.3291015625, 0.598876953125, 0.86865234375, 1.138427734375, 1.408203125, 1.677978515625, 1.94775390625, 2.217529296875, 2.4873046875, 2.757080078125, 3.02685546875, 3.296630859375, 3.56640625, 3.836181640625, 4.10595703125, 4.375732421875, 4.6455078125, 4.915283203125, 5.18505859375, 5.454833984375, 5.724609375, 5.994384765625, 6.26416015625, 6.533935546875, 6.8037109375, 7.073486328125, 7.34326171875, 7.613037109375, 7.8828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 3.0, 7.0, 5.0, 9.0, 16.0, 23.0, 42.0, 33.0, 57.0, 73.0, 104.0, 138.0, 194.0, 412.0, 857.0, 3977.0, 3031594.0, 104586.0, 1904.0, 640.0, 340.0, 168.0, 141.0, 94.0, 66.0, 59.0, 32.0, 35.0, 23.0, 20.0, 13.0, 9.0, 2.0, 7.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.796875, -17.199951171875, -16.60302734375, -16.006103515625, -15.4091796875, -14.812255859375, -14.21533203125, -13.618408203125, -13.021484375, -12.424560546875, -11.82763671875, -11.230712890625, -10.6337890625, -10.036865234375, -9.43994140625, -8.843017578125, -8.24609375, -7.649169921875, -7.05224609375, -6.455322265625, -5.8583984375, -5.261474609375, -4.66455078125, -4.067626953125, -3.470703125, -2.873779296875, -2.27685546875, -1.679931640625, -1.0830078125, -0.486083984375, 0.11083984375, 0.707763671875, 1.3046875, 1.901611328125, 2.49853515625, 3.095458984375, 3.6923828125, 4.289306640625, 4.88623046875, 5.483154296875, 6.080078125, 6.677001953125, 7.27392578125, 7.870849609375, 8.4677734375, 9.064697265625, 9.66162109375, 10.258544921875, 10.85546875, 11.452392578125, 12.04931640625, 12.646240234375, 13.2431640625, 13.840087890625, 14.43701171875, 15.033935546875, 15.630859375, 16.227783203125, 16.82470703125, 17.421630859375, 18.0185546875, 18.615478515625, 19.21240234375, 19.809326171875, 20.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 52.0, 945.0, 15.0, 0.0, 0.0, 0.0, 1.0], "bins": [-262.3836364746094, -257.8918762207031, -253.4001007080078, -248.9083251953125, -244.41656494140625, -239.92478942871094, -235.4330291748047, -230.94125366210938, -226.44949340820312, -221.9577178955078, -217.46595764160156, -212.97418212890625, -208.482421875, -203.9906463623047, -199.49888610839844, -195.00711059570312, -190.5153350830078, -186.0235595703125, -181.53179931640625, -177.04002380371094, -172.5482635498047, -168.05648803710938, -163.56472778320312, -159.0729522705078, -154.5811767578125, -150.0894012451172, -145.59764099121094, -141.10586547851562, -136.61410522460938, -132.12232971191406, -127.63056182861328, -123.1387939453125, -118.64701843261719, -114.1552505493164, -109.66348266601562, -105.17171478271484, -100.67994689941406, -96.18817138671875, -91.69640350341797, -87.20463562011719, -82.7128677368164, -78.22109985351562, -73.72933197021484, -69.23756408691406, -64.74578857421875, -60.254024505615234, -55.76225280761719, -51.270484924316406, -46.778717041015625, -42.286949157714844, -37.79518127441406, -33.303409576416016, -28.811641693115234, -24.319873809814453, -19.82810401916504, -15.336334228515625, -10.844568252563477, -6.352799415588379, -1.8610305786132812, 2.6307382583618164, 7.122507095336914, 11.614274978637695, 16.10604476928711, 20.597814559936523, 25.089582443237305]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 9.0, 10.0, 16.0, 9.0, 13.0, 11.0, 16.0, 25.0, 15.0, 21.0, 21.0, 21.0, 40.0, 24.0, 38.0, 42.0, 27.0, 35.0, 26.0, 20.0, 32.0, 43.0, 35.0, 38.0, 35.0, 28.0, 31.0, 18.0, 35.0, 28.0, 22.0, 15.0, 21.0, 17.0, 13.0, 13.0, 13.0, 11.0, 16.0, 8.0, 9.0, 12.0, 13.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0], "bins": [-15.109373092651367, -14.654638290405273, -14.199904441833496, -13.745169639587402, -13.290435791015625, -12.835700988769531, -12.380966186523438, -11.92623233795166, -11.471498489379883, -11.016763687133789, -10.562029838562012, -10.107295036315918, -9.65256118774414, -9.197826385498047, -8.743091583251953, -8.288357734680176, -7.833622932434082, -7.3788886070251465, -6.924154281616211, -6.469419479370117, -6.01468563079834, -5.559950828552246, -5.1052165031433105, -4.650482177734375, -4.1957478523254395, -3.741013526916504, -3.2862792015075684, -2.8315446376800537, -2.376810312271118, -1.9220759868621826, -1.467341423034668, -1.0126070976257324, -0.5578718185424805, -0.10313743352890015, 0.3515969514846802, 0.8063313961029053, 1.2610657215118408, 1.7158000469207764, 2.170534610748291, 2.6252689361572266, 3.080003261566162, 3.5347375869750977, 3.989471912384033, 4.444206237792969, 4.8989410400390625, 5.35367488861084, 5.808409690856934, 6.263144016265869, 6.717878341674805, 7.17261266708374, 7.627346992492676, 8.08208179473877, 8.536815643310547, 8.99155044555664, 9.446285247802734, 9.901019096374512, 10.355752944946289, 10.810487747192383, 11.26522159576416, 11.719956398010254, 12.174690246582031, 12.629425048828125, 13.084159851074219, 13.538893699645996, 13.99362850189209]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 2.0, 7.0, 2.0, 12.0, 4.0, 8.0, 8.0, 9.0, 11.0, 14.0, 22.0, 20.0, 27.0, 27.0, 22.0, 36.0, 31.0, 25.0, 20.0, 29.0, 26.0, 34.0, 58.0, 48.0, 43.0, 37.0, 31.0, 40.0, 30.0, 47.0, 22.0, 23.0, 24.0, 32.0, 18.0, 22.0, 17.0, 25.0, 14.0, 10.0, 19.0, 11.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.892578125, -2.80718994140625, -2.7218017578125, -2.63641357421875, -2.551025390625, -2.46563720703125, -2.3802490234375, -2.29486083984375, -2.20947265625, -2.12408447265625, -2.0386962890625, -1.95330810546875, -1.867919921875, -1.78253173828125, -1.6971435546875, -1.61175537109375, -1.5263671875, -1.44097900390625, -1.3555908203125, -1.27020263671875, -1.184814453125, -1.09942626953125, -1.0140380859375, -0.92864990234375, -0.84326171875, -0.75787353515625, -0.6724853515625, -0.58709716796875, -0.501708984375, -0.41632080078125, -0.3309326171875, -0.24554443359375, -0.16015625, -0.07476806640625, 0.0106201171875, 0.09600830078125, 0.181396484375, 0.26678466796875, 0.3521728515625, 0.43756103515625, 0.52294921875, 0.60833740234375, 0.6937255859375, 0.77911376953125, 0.864501953125, 0.94989013671875, 1.0352783203125, 1.12066650390625, 1.2060546875, 1.29144287109375, 1.3768310546875, 1.46221923828125, 1.547607421875, 1.63299560546875, 1.7183837890625, 1.80377197265625, 1.88916015625, 1.97454833984375, 2.0599365234375, 2.14532470703125, 2.230712890625, 2.31610107421875, 2.4014892578125, 2.48687744140625, 2.572265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 7.0, 11.0, 10.0, 6.0, 17.0, 24.0, 18.0, 35.0, 43.0, 57.0, 81.0, 111.0, 142.0, 211.0, 300.0, 406.0, 609.0, 927.0, 1789.0, 6940.0, 261439.0, 3675216.0, 234177.0, 6849.0, 1880.0, 891.0, 586.0, 381.0, 295.0, 227.0, 149.0, 104.0, 73.0, 52.0, 47.0, 30.0, 19.0, 28.0, 18.0, 16.0, 10.0, 8.0, 8.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-15.125, -14.67333984375, -14.2216796875, -13.77001953125, -13.318359375, -12.86669921875, -12.4150390625, -11.96337890625, -11.51171875, -11.06005859375, -10.6083984375, -10.15673828125, -9.705078125, -9.25341796875, -8.8017578125, -8.35009765625, -7.8984375, -7.44677734375, -6.9951171875, -6.54345703125, -6.091796875, -5.64013671875, -5.1884765625, -4.73681640625, -4.28515625, -3.83349609375, -3.3818359375, -2.93017578125, -2.478515625, -2.02685546875, -1.5751953125, -1.12353515625, -0.671875, -0.22021484375, 0.2314453125, 0.68310546875, 1.134765625, 1.58642578125, 2.0380859375, 2.48974609375, 2.94140625, 3.39306640625, 3.8447265625, 4.29638671875, 4.748046875, 5.19970703125, 5.6513671875, 6.10302734375, 6.5546875, 7.00634765625, 7.4580078125, 7.90966796875, 8.361328125, 8.81298828125, 9.2646484375, 9.71630859375, 10.16796875, 10.61962890625, 11.0712890625, 11.52294921875, 11.974609375, 12.42626953125, 12.8779296875, 13.32958984375, 13.78125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 3.0, 7.0, 14.0, 26.0, 33.0, 62.0, 109.0, 231.0, 384.0, 599.0, 789.0, 658.0, 487.0, 304.0, 156.0, 104.0, 44.0, 23.0, 19.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05078125, -6.78778076171875, -6.5247802734375, -6.26177978515625, -5.998779296875, -5.73577880859375, -5.4727783203125, -5.20977783203125, -4.94677734375, -4.68377685546875, -4.4207763671875, -4.15777587890625, -3.894775390625, -3.63177490234375, -3.3687744140625, -3.10577392578125, -2.8427734375, -2.57977294921875, -2.3167724609375, -2.05377197265625, -1.790771484375, -1.52777099609375, -1.2647705078125, -1.00177001953125, -0.73876953125, -0.47576904296875, -0.2127685546875, 0.05023193359375, 0.313232421875, 0.57623291015625, 0.8392333984375, 1.10223388671875, 1.365234375, 1.62823486328125, 1.8912353515625, 2.15423583984375, 2.417236328125, 2.68023681640625, 2.9432373046875, 3.20623779296875, 3.46923828125, 3.73223876953125, 3.9952392578125, 4.25823974609375, 4.521240234375, 4.78424072265625, 5.0472412109375, 5.31024169921875, 5.5732421875, 5.83624267578125, 6.0992431640625, 6.36224365234375, 6.625244140625, 6.88824462890625, 7.1512451171875, 7.41424560546875, 7.67724609375, 7.94024658203125, 8.2032470703125, 8.46624755859375, 8.729248046875, 8.99224853515625, 9.2552490234375, 9.51824951171875, 9.78125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 6.0, 18.0, 14.0, 32.0, 52.0, 89.0, 181.0, 363.0, 865.0, 2415.0, 8035.0, 53679.0, 768310.0, 2951649.0, 369696.0, 30122.0, 5603.0, 1768.0, 718.0, 302.0, 147.0, 79.0, 44.0, 30.0, 22.0, 13.0, 5.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.22552490234375, -6.0135498046875, -5.80157470703125, -5.589599609375, -5.37762451171875, -5.1656494140625, -4.95367431640625, -4.74169921875, -4.52972412109375, -4.3177490234375, -4.10577392578125, -3.893798828125, -3.68182373046875, -3.4698486328125, -3.25787353515625, -3.0458984375, -2.83392333984375, -2.6219482421875, -2.40997314453125, -2.197998046875, -1.98602294921875, -1.7740478515625, -1.56207275390625, -1.35009765625, -1.13812255859375, -0.9261474609375, -0.71417236328125, -0.502197265625, -0.29022216796875, -0.0782470703125, 0.13372802734375, 0.345703125, 0.55767822265625, 0.7696533203125, 0.98162841796875, 1.193603515625, 1.40557861328125, 1.6175537109375, 1.82952880859375, 2.04150390625, 2.25347900390625, 2.4654541015625, 2.67742919921875, 2.889404296875, 3.10137939453125, 3.3133544921875, 3.52532958984375, 3.7373046875, 3.94927978515625, 4.1612548828125, 4.37322998046875, 4.585205078125, 4.79718017578125, 5.0091552734375, 5.22113037109375, 5.43310546875, 5.64508056640625, 5.8570556640625, 6.06903076171875, 6.281005859375, 6.49298095703125, 6.7049560546875, 6.91693115234375, 7.12890625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 7.0, 22.0, 22.0, 37.0, 64.0, 74.0, 107.0, 116.0, 136.0, 113.0, 100.0, 68.0, 50.0, 38.0, 17.0, 8.0, 8.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.768287658691406, -31.316558837890625, -29.864830017089844, -28.41309928894043, -26.96137046813965, -25.509641647338867, -24.057910919189453, -22.606182098388672, -21.15445327758789, -19.70272445678711, -18.250995635986328, -16.799264907836914, -15.347536087036133, -13.895807266235352, -12.444077491760254, -10.992347717285156, -9.540618896484375, -8.088890075683594, -6.637160301208496, -5.185431003570557, -3.733701705932617, -2.2819724082946777, -0.8302431106567383, 0.6214866638183594, 2.0732154846191406, 3.52494478225708, 4.9766740798950195, 6.428403377532959, 7.880132675170898, 9.33186149597168, 10.783591270446777, 12.235321044921875, 13.687049865722656, 15.138778686523438, 16.59050750732422, 18.042238235473633, 19.493967056274414, 20.945695877075195, 22.39742660522461, 23.84915542602539, 25.300884246826172, 26.752613067626953, 28.204341888427734, 29.65607261657715, 31.10780143737793, 32.559532165527344, 34.011260986328125, 35.462989807128906, 36.91471862792969, 38.36644744873047, 39.81817626953125, 41.26990509033203, 42.72163391113281, 44.17336654663086, 45.62509536743164, 47.07682418823242, 48.5285530090332, 49.980281829833984, 51.432010650634766, 52.88373947143555, 54.335472106933594, 55.787200927734375, 57.238929748535156, 58.69065856933594, 60.14238739013672]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 9.0, 11.0, 9.0, 6.0, 13.0, 12.0, 13.0, 13.0, 21.0, 18.0, 23.0, 25.0, 29.0, 27.0, 33.0, 47.0, 29.0, 38.0, 38.0, 53.0, 31.0, 32.0, 41.0, 31.0, 47.0, 39.0, 32.0, 23.0, 32.0, 26.0, 33.0, 23.0, 18.0, 19.0, 14.0, 15.0, 11.0, 14.0, 12.0, 12.0, 6.0, 7.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0], "bins": [-20.572280883789062, -19.982149124145508, -19.392017364501953, -18.801883697509766, -18.21175193786621, -17.621620178222656, -17.0314884185791, -16.441356658935547, -15.851223945617676, -15.261092185974121, -14.67095947265625, -14.080827713012695, -13.49069595336914, -12.90056324005127, -12.310431480407715, -11.720298767089844, -11.130167007446289, -10.540035247802734, -9.949902534484863, -9.359770774841309, -8.769638061523438, -8.179506301879883, -7.589374542236328, -6.999242305755615, -6.409110069274902, -5.8189778327941895, -5.228845596313477, -4.638713836669922, -4.048581600189209, -3.458449363708496, -2.8683173656463623, -2.2781853675842285, -1.6880550384521484, -1.097922921180725, -0.5077908039093018, 0.08234131336212158, 0.6724734306335449, 1.2626056671142578, 1.8527376651763916, 2.4428696632385254, 3.0330018997192383, 3.623134136199951, 4.213266372680664, 4.803398132324219, 5.393530368804932, 5.9836626052856445, 6.573794364929199, 7.163926601409912, 7.754058837890625, 8.34419059753418, 8.93432331085205, 9.524455070495605, 10.114587783813477, 10.704719543457031, 11.294851303100586, 11.88498306274414, 12.475115776062012, 13.065247535705566, 13.655380249023438, 14.245512008666992, 14.835643768310547, 15.425776481628418, 16.01590919494629, 16.606040954589844, 17.1961727142334]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 2.0, 4.0, 10.0, 13.0, 9.0, 14.0, 10.0, 19.0, 17.0, 18.0, 16.0, 32.0, 22.0, 33.0, 38.0, 48.0, 33.0, 40.0, 44.0, 41.0, 42.0, 42.0, 42.0, 43.0, 41.0, 37.0, 35.0, 43.0, 29.0, 22.0, 31.0, 15.0, 17.0, 15.0, 14.0, 16.0, 11.0, 15.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.46875, -35.35302734375, -34.2373046875, -33.12158203125, -32.005859375, -30.89013671875, -29.7744140625, -28.65869140625, -27.54296875, -26.42724609375, -25.3115234375, -24.19580078125, -23.080078125, -21.96435546875, -20.8486328125, -19.73291015625, -18.6171875, -17.50146484375, -16.3857421875, -15.27001953125, -14.154296875, -13.03857421875, -11.9228515625, -10.80712890625, -9.69140625, -8.57568359375, -7.4599609375, -6.34423828125, -5.228515625, -4.11279296875, -2.9970703125, -1.88134765625, -0.765625, 0.35009765625, 1.4658203125, 2.58154296875, 3.697265625, 4.81298828125, 5.9287109375, 7.04443359375, 8.16015625, 9.27587890625, 10.3916015625, 11.50732421875, 12.623046875, 13.73876953125, 14.8544921875, 15.97021484375, 17.0859375, 18.20166015625, 19.3173828125, 20.43310546875, 21.548828125, 22.66455078125, 23.7802734375, 24.89599609375, 26.01171875, 27.12744140625, 28.2431640625, 29.35888671875, 30.474609375, 31.59033203125, 32.7060546875, 33.82177734375, 34.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 16.0, 12.0, 30.0, 45.0, 57.0, 91.0, 158.0, 217.0, 367.0, 556.0, 937.0, 1362.0, 2149.0, 3153.0, 4893.0, 7293.0, 11446.0, 18448.0, 30260.0, 50801.0, 87507.0, 148344.0, 220598.0, 184052.0, 110430.0, 64497.0, 37686.0, 23145.0, 14203.0, 9099.0, 5822.0, 3663.0, 2590.0, 1654.0, 1029.0, 649.0, 445.0, 286.0, 202.0, 133.0, 81.0, 46.0, 26.0, 28.0, 12.0, 14.0, 10.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.22265625, -3.121063232421875, -3.01947021484375, -2.917877197265625, -2.8162841796875, -2.714691162109375, -2.61309814453125, -2.511505126953125, -2.409912109375, -2.308319091796875, -2.20672607421875, -2.105133056640625, -2.0035400390625, -1.901947021484375, -1.80035400390625, -1.698760986328125, -1.59716796875, -1.495574951171875, -1.39398193359375, -1.292388916015625, -1.1907958984375, -1.089202880859375, -0.98760986328125, -0.886016845703125, -0.784423828125, -0.682830810546875, -0.58123779296875, -0.479644775390625, -0.3780517578125, -0.276458740234375, -0.17486572265625, -0.073272705078125, 0.0283203125, 0.129913330078125, 0.23150634765625, 0.333099365234375, 0.4346923828125, 0.536285400390625, 0.63787841796875, 0.739471435546875, 0.841064453125, 0.942657470703125, 1.04425048828125, 1.145843505859375, 1.2474365234375, 1.349029541015625, 1.45062255859375, 1.552215576171875, 1.65380859375, 1.755401611328125, 1.85699462890625, 1.958587646484375, 2.0601806640625, 2.161773681640625, 2.26336669921875, 2.364959716796875, 2.466552734375, 2.568145751953125, 2.66973876953125, 2.771331787109375, 2.8729248046875, 2.974517822265625, 3.07611083984375, 3.177703857421875, 3.279296875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 6.0, 9.0, 10.0, 9.0, 4.0, 11.0, 16.0, 17.0, 24.0, 27.0, 22.0, 26.0, 26.0, 27.0, 34.0, 28.0, 40.0, 51.0, 30.0, 42.0, 1080.0, 49.0, 43.0, 28.0, 30.0, 33.0, 31.0, 41.0, 21.0, 26.0, 21.0, 19.0, 25.0, 24.0, 12.0, 16.0, 11.0, 12.0, 9.0, 7.0, 8.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.21875, -20.543701171875, -19.86865234375, -19.193603515625, -18.5185546875, -17.843505859375, -17.16845703125, -16.493408203125, -15.818359375, -15.143310546875, -14.46826171875, -13.793212890625, -13.1181640625, -12.443115234375, -11.76806640625, -11.093017578125, -10.41796875, -9.742919921875, -9.06787109375, -8.392822265625, -7.7177734375, -7.042724609375, -6.36767578125, -5.692626953125, -5.017578125, -4.342529296875, -3.66748046875, -2.992431640625, -2.3173828125, -1.642333984375, -0.96728515625, -0.292236328125, 0.3828125, 1.057861328125, 1.73291015625, 2.407958984375, 3.0830078125, 3.758056640625, 4.43310546875, 5.108154296875, 5.783203125, 6.458251953125, 7.13330078125, 7.808349609375, 8.4833984375, 9.158447265625, 9.83349609375, 10.508544921875, 11.18359375, 11.858642578125, 12.53369140625, 13.208740234375, 13.8837890625, 14.558837890625, 15.23388671875, 15.908935546875, 16.583984375, 17.259033203125, 17.93408203125, 18.609130859375, 19.2841796875, 19.959228515625, 20.63427734375, 21.309326171875, 21.984375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 4.0, 13.0, 13.0, 21.0, 27.0, 54.0, 67.0, 80.0, 139.0, 173.0, 264.0, 431.0, 594.0, 949.0, 1425.0, 2070.0, 3095.0, 4980.0, 7709.0, 12210.0, 19813.0, 32195.0, 54355.0, 93589.0, 165394.0, 1286641.0, 170034.0, 96693.0, 55668.0, 33284.0, 20065.0, 12397.0, 7887.0, 5043.0, 3350.0, 2082.0, 1391.0, 938.0, 635.0, 428.0, 316.0, 184.0, 129.0, 95.0, 63.0, 48.0, 34.0, 16.0, 18.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.609375, -3.501708984375, -3.39404296875, -3.286376953125, -3.1787109375, -3.071044921875, -2.96337890625, -2.855712890625, -2.748046875, -2.640380859375, -2.53271484375, -2.425048828125, -2.3173828125, -2.209716796875, -2.10205078125, -1.994384765625, -1.88671875, -1.779052734375, -1.67138671875, -1.563720703125, -1.4560546875, -1.348388671875, -1.24072265625, -1.133056640625, -1.025390625, -0.917724609375, -0.81005859375, -0.702392578125, -0.5947265625, -0.487060546875, -0.37939453125, -0.271728515625, -0.1640625, -0.056396484375, 0.05126953125, 0.158935546875, 0.2666015625, 0.374267578125, 0.48193359375, 0.589599609375, 0.697265625, 0.804931640625, 0.91259765625, 1.020263671875, 1.1279296875, 1.235595703125, 1.34326171875, 1.450927734375, 1.55859375, 1.666259765625, 1.77392578125, 1.881591796875, 1.9892578125, 2.096923828125, 2.20458984375, 2.312255859375, 2.419921875, 2.527587890625, 2.63525390625, 2.742919921875, 2.8505859375, 2.958251953125, 3.06591796875, 3.173583984375, 3.28125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 2.0, 7.0, 2.0, 6.0, 8.0, 8.0, 17.0, 19.0, 27.0, 35.0, 54.0, 63.0, 75.0, 85.0, 96.0, 104.0, 75.0, 68.0, 59.0, 45.0, 31.0, 26.0, 24.0, 15.0, 16.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0297088623046875, -0.02890181541442871, -0.028094768524169922, -0.027287721633911133, -0.026480674743652344, -0.025673627853393555, -0.024866580963134766, -0.024059534072875977, -0.023252487182617188, -0.0224454402923584, -0.02163839340209961, -0.02083134651184082, -0.02002429962158203, -0.019217252731323242, -0.018410205841064453, -0.017603158950805664, -0.016796112060546875, -0.015989065170288086, -0.015182018280029297, -0.014374971389770508, -0.013567924499511719, -0.01276087760925293, -0.01195383071899414, -0.011146783828735352, -0.010339736938476562, -0.009532690048217773, -0.008725643157958984, -0.007918596267700195, -0.007111549377441406, -0.006304502487182617, -0.005497455596923828, -0.004690408706665039, -0.00388336181640625, -0.003076314926147461, -0.002269268035888672, -0.0014622211456298828, -0.0006551742553710938, 0.0001518726348876953, 0.0009589195251464844, 0.0017659664154052734, 0.0025730133056640625, 0.0033800601959228516, 0.004187107086181641, 0.00499415397644043, 0.005801200866699219, 0.006608247756958008, 0.007415294647216797, 0.008222341537475586, 0.009029388427734375, 0.009836435317993164, 0.010643482208251953, 0.011450529098510742, 0.012257575988769531, 0.01306462287902832, 0.01387166976928711, 0.014678716659545898, 0.015485763549804688, 0.016292810440063477, 0.017099857330322266, 0.017906904220581055, 0.018713951110839844, 0.019520998001098633, 0.020328044891357422, 0.02113509178161621, 0.021942138671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 16.0, 11.0, 13.0, 13.0, 17.0, 25.0, 36.0, 41.0, 87.0, 118.0, 161.0, 345.0, 535.0, 1211.0, 2645.0, 7297.0, 26403.0, 135597.0, 571884.0, 242475.0, 42432.0, 10501.0, 3558.0, 1442.0, 666.0, 355.0, 218.0, 128.0, 84.0, 61.0, 44.0, 28.0, 21.0, 13.0, 18.0, 12.0, 13.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1151123046875, -0.11109542846679688, -0.10707855224609375, -0.10306167602539062, -0.0990447998046875, -0.09502792358398438, -0.09101104736328125, -0.08699417114257812, -0.082977294921875, -0.07896041870117188, -0.07494354248046875, -0.07092666625976562, -0.0669097900390625, -0.06289291381835938, -0.05887603759765625, -0.054859161376953125, -0.05084228515625, -0.046825408935546875, -0.04280853271484375, -0.038791656494140625, -0.0347747802734375, -0.030757904052734375, -0.02674102783203125, -0.022724151611328125, -0.018707275390625, -0.014690399169921875, -0.01067352294921875, -0.006656646728515625, -0.0026397705078125, 0.001377105712890625, 0.00539398193359375, 0.009410858154296875, 0.013427734375, 0.017444610595703125, 0.02146148681640625, 0.025478363037109375, 0.0294952392578125, 0.033512115478515625, 0.03752899169921875, 0.041545867919921875, 0.045562744140625, 0.049579620361328125, 0.05359649658203125, 0.057613372802734375, 0.0616302490234375, 0.06564712524414062, 0.06966400146484375, 0.07368087768554688, 0.07769775390625, 0.08171463012695312, 0.08573150634765625, 0.08974838256835938, 0.0937652587890625, 0.09778213500976562, 0.10179901123046875, 0.10581588745117188, 0.109832763671875, 0.11384963989257812, 0.11786651611328125, 0.12188339233398438, 0.1259002685546875, 0.12991714477539062, 0.13393402099609375, 0.13795089721679688, 0.1419677734375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 18.0, 37.0, 49.0, 85.0, 118.0, 128.0, 145.0, 126.0, 103.0, 68.0, 36.0, 24.0, 15.0, 12.0, 8.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017672255635261536, -0.016899771988391876, -0.016127288341522217, -0.015354804694652557, -0.014582321047782898, -0.013809837400913239, -0.013037352822721004, -0.012264869175851345, -0.011492385528981686, -0.010719901882112026, -0.009947418235242367, -0.009174933657050133, -0.008402450010180473, -0.007629966828972101, -0.0068574827164411545, -0.006084999069571495, -0.005312515422701836, -0.004540031775832176, -0.003767547896131873, -0.00299506401643157, -0.0022225803695619106, -0.0014500967226922512, -0.0006776126101613045, 9.487103670835495e-05, 0.0008673546835780144, 0.0016398384468629956, 0.002412322210147977, 0.00318480608984828, 0.003957289736717939, 0.004729773383587599, 0.0055022574961185455, 0.006274741142988205, 0.007047224789857864, 0.007819708436727524, 0.008592192083597183, 0.009364675730466843, 0.010137159377336502, 0.010909643024206161, 0.011682127602398396, 0.012454611249268055, 0.013227094896137714, 0.013999578543007374, 0.014772062189877033, 0.015544546768069267, 0.016317030414938927, 0.017089514061808586, 0.017861997708678246, 0.018634481355547905, 0.019406965002417564, 0.020179448649287224, 0.020951932296156883, 0.021724415943026543, 0.022496899589896202, 0.02326938323676586, 0.02404186874628067, 0.02481435239315033, 0.02558683604001999, 0.02635931968688965, 0.027131803333759308, 0.027904286980628967, 0.028676770627498627, 0.029449254274368286, 0.030221737921237946, 0.030994221568107605, 0.031766705214977264]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 4.0, 5.0, 8.0, 7.0, 19.0, 13.0, 14.0, 17.0, 29.0, 16.0, 30.0, 39.0, 37.0, 30.0, 32.0, 41.0, 48.0, 39.0, 44.0, 48.0, 38.0, 40.0, 36.0, 34.0, 26.0, 30.0, 33.0, 40.0, 20.0, 24.0, 24.0, 20.0, 13.0, 18.0, 13.0, 10.0, 12.0, 11.0, 5.0, 3.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.012194693088531494, -0.011804303154349327, -0.01141391322016716, -0.011023523285984993, -0.010633133351802826, -0.010242743417620659, -0.009852353483438492, -0.009461963549256325, -0.009071573615074158, -0.00868118368089199, -0.008290793746709824, -0.007900403812527657, -0.0075100138783454895, -0.0071196239441633224, -0.006729234009981155, -0.006338844075798988, -0.005948454141616821, -0.005558064207434654, -0.005167674273252487, -0.00477728433907032, -0.004386894404888153, -0.003996504470705986, -0.003606114536523819, -0.003215724602341652, -0.002825334668159485, -0.002434944733977318, -0.0020445547997951508, -0.0016541648656129837, -0.0012637749314308167, -0.0008733849972486496, -0.00048299506306648254, -9.260512888431549e-05, 0.00029778480529785156, 0.0006881747394800186, 0.0010785646736621857, 0.0014689546078443527, 0.0018593445420265198, 0.002249734476208687, 0.002640124410390854, 0.003030514344573021, 0.003420904278755188, 0.003811294212937355, 0.004201684147119522, 0.004592074081301689, 0.004982464015483856, 0.005372853949666023, 0.00576324388384819, 0.006153633818030357, 0.006544023752212524, 0.0069344136863946915, 0.0073248036205768585, 0.007715193554759026, 0.008105583488941193, 0.00849597342312336, 0.008886363357305527, 0.009276753291487694, 0.00966714322566986, 0.010057533159852028, 0.010447923094034195, 0.010838313028216362, 0.011228702962398529, 0.011619092896580696, 0.012009482830762863, 0.01239987276494503, 0.012790262699127197]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 0.0, 2.0, 2.0, 4.0, 10.0, 12.0, 10.0, 14.0, 10.0, 19.0, 16.0, 17.0, 18.0, 30.0, 24.0, 32.0, 40.0, 47.0, 34.0, 39.0, 44.0, 41.0, 42.0, 40.0, 44.0, 43.0, 40.0, 35.0, 38.0, 41.0, 30.0, 22.0, 30.0, 17.0, 16.0, 16.0, 14.0, 16.0, 11.0, 15.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.46875, -35.353515625, -34.23828125, -33.123046875, -32.0078125, -30.892578125, -29.77734375, -28.662109375, -27.546875, -26.431640625, -25.31640625, -24.201171875, -23.0859375, -21.970703125, -20.85546875, -19.740234375, -18.625, -17.509765625, -16.39453125, -15.279296875, -14.1640625, -13.048828125, -11.93359375, -10.818359375, -9.703125, -8.587890625, -7.47265625, -6.357421875, -5.2421875, -4.126953125, -3.01171875, -1.896484375, -0.78125, 0.333984375, 1.44921875, 2.564453125, 3.6796875, 4.794921875, 5.91015625, 7.025390625, 8.140625, 9.255859375, 10.37109375, 11.486328125, 12.6015625, 13.716796875, 14.83203125, 15.947265625, 17.0625, 18.177734375, 19.29296875, 20.408203125, 21.5234375, 22.638671875, 23.75390625, 24.869140625, 25.984375, 27.099609375, 28.21484375, 29.330078125, 30.4453125, 31.560546875, 32.67578125, 33.791015625, 34.90625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 8.0, 12.0, 13.0, 24.0, 22.0, 28.0, 45.0, 59.0, 69.0, 130.0, 205.0, 280.0, 415.0, 702.0, 1302.0, 2632.0, 6144.0, 19401.0, 87160.0, 428469.0, 394164.0, 77727.0, 17916.0, 5933.0, 2465.0, 1251.0, 682.0, 428.0, 267.0, 182.0, 107.0, 100.0, 66.0, 35.0, 30.0, 26.0, 9.0, 14.0, 10.0, 9.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.04522705078125, -6.8248291015625, -6.60443115234375, -6.384033203125, -6.16363525390625, -5.9432373046875, -5.72283935546875, -5.50244140625, -5.28204345703125, -5.0616455078125, -4.84124755859375, -4.620849609375, -4.40045166015625, -4.1800537109375, -3.95965576171875, -3.7392578125, -3.51885986328125, -3.2984619140625, -3.07806396484375, -2.857666015625, -2.63726806640625, -2.4168701171875, -2.19647216796875, -1.97607421875, -1.75567626953125, -1.5352783203125, -1.31488037109375, -1.094482421875, -0.87408447265625, -0.6536865234375, -0.43328857421875, -0.212890625, 0.00750732421875, 0.2279052734375, 0.44830322265625, 0.668701171875, 0.88909912109375, 1.1094970703125, 1.32989501953125, 1.55029296875, 1.77069091796875, 1.9910888671875, 2.21148681640625, 2.431884765625, 2.65228271484375, 2.8726806640625, 3.09307861328125, 3.3134765625, 3.53387451171875, 3.7542724609375, 3.97467041015625, 4.195068359375, 4.41546630859375, 4.6358642578125, 4.85626220703125, 5.07666015625, 5.29705810546875, 5.5174560546875, 5.73785400390625, 5.958251953125, 6.17864990234375, 6.3990478515625, 6.61944580078125, 6.83984375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 18.0, 17.0, 20.0, 36.0, 44.0, 65.0, 98.0, 105.0, 2046.0, 186.0, 89.0, 92.0, 51.0, 35.0, 44.0, 25.0, 22.0, 16.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.625, -108.330078125, -105.03515625, -101.740234375, -98.4453125, -95.150390625, -91.85546875, -88.560546875, -85.265625, -81.970703125, -78.67578125, -75.380859375, -72.0859375, -68.791015625, -65.49609375, -62.201171875, -58.90625, -55.611328125, -52.31640625, -49.021484375, -45.7265625, -42.431640625, -39.13671875, -35.841796875, -32.546875, -29.251953125, -25.95703125, -22.662109375, -19.3671875, -16.072265625, -12.77734375, -9.482421875, -6.1875, -2.892578125, 0.40234375, 3.697265625, 6.9921875, 10.287109375, 13.58203125, 16.876953125, 20.171875, 23.466796875, 26.76171875, 30.056640625, 33.3515625, 36.646484375, 39.94140625, 43.236328125, 46.53125, 49.826171875, 53.12109375, 56.416015625, 59.7109375, 63.005859375, 66.30078125, 69.595703125, 72.890625, 76.185546875, 79.48046875, 82.775390625, 86.0703125, 89.365234375, 92.66015625, 95.955078125, 99.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 1.0, 5.0, 6.0, 5.0, 7.0, 18.0, 17.0, 25.0, 36.0, 54.0, 69.0, 117.0, 199.0, 305.0, 522.0, 1015.0, 2781.0, 18763.0, 2613267.0, 488678.0, 14929.0, 2587.0, 971.0, 509.0, 272.0, 181.0, 106.0, 80.0, 58.0, 32.0, 24.0, 24.0, 14.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5859375, -14.11474609375, -13.6435546875, -13.17236328125, -12.701171875, -12.22998046875, -11.7587890625, -11.28759765625, -10.81640625, -10.34521484375, -9.8740234375, -9.40283203125, -8.931640625, -8.46044921875, -7.9892578125, -7.51806640625, -7.046875, -6.57568359375, -6.1044921875, -5.63330078125, -5.162109375, -4.69091796875, -4.2197265625, -3.74853515625, -3.27734375, -2.80615234375, -2.3349609375, -1.86376953125, -1.392578125, -0.92138671875, -0.4501953125, 0.02099609375, 0.4921875, 0.96337890625, 1.4345703125, 1.90576171875, 2.376953125, 2.84814453125, 3.3193359375, 3.79052734375, 4.26171875, 4.73291015625, 5.2041015625, 5.67529296875, 6.146484375, 6.61767578125, 7.0888671875, 7.56005859375, 8.03125, 8.50244140625, 8.9736328125, 9.44482421875, 9.916015625, 10.38720703125, 10.8583984375, 11.32958984375, 11.80078125, 12.27197265625, 12.7431640625, 13.21435546875, 13.685546875, 14.15673828125, 14.6279296875, 15.09912109375, 15.5703125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 9.0, 23.0, 91.0, 279.0, 340.0, 168.0, 51.0, 13.0, 16.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.14376831054688, -133.12490844726562, -127.10604858398438, -121.08718872070312, -115.06832885742188, -109.04946899414062, -103.03060150146484, -97.0117416381836, -90.99288177490234, -84.9740219116211, -78.95516204833984, -72.93629455566406, -66.91743469238281, -60.89857864379883, -54.87971496582031, -48.86085510253906, -42.84199523925781, -36.82313537597656, -30.80427360534668, -24.785411834716797, -18.766551971435547, -12.747692108154297, -6.728828430175781, -0.7099685668945312, 5.308891296386719, 11.327752113342285, 17.34661293029785, 23.365474700927734, 29.384334564208984, 35.403194427490234, 41.42205810546875, 47.44091796875, 53.45977783203125, 59.4786376953125, 65.49749755859375, 71.516357421875, 77.53521728515625, 83.5540771484375, 89.57294464111328, 95.59180450439453, 101.61066436767578, 107.62952423095703, 113.64838409423828, 119.66725158691406, 125.68611145019531, 131.70497131347656, 137.7238311767578, 143.74269104003906, 149.7615509033203, 155.78041076660156, 161.7992706298828, 167.81813049316406, 173.8369903564453, 179.85585021972656, 185.87472534179688, 191.89358520507812, 197.91244506835938, 203.93130493164062, 209.95016479492188, 215.96902465820312, 221.98788452148438, 228.00674438476562, 234.02560424804688, 240.04446411132812, 246.06332397460938]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 11.0, 16.0, 10.0, 19.0, 33.0, 27.0, 30.0, 21.0, 33.0, 44.0, 49.0, 36.0, 33.0, 38.0, 35.0, 68.0, 51.0, 38.0, 54.0, 37.0, 47.0, 44.0, 30.0, 17.0, 26.0, 28.0, 20.0, 14.0, 10.0, 13.0, 7.0, 9.0, 8.0, 1.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-70.78162384033203, -68.49209594726562, -66.20257568359375, -63.913047790527344, -61.62351989746094, -59.3339958190918, -57.044471740722656, -54.75494384765625, -52.46541976928711, -50.17589569091797, -47.88636779785156, -45.59684371948242, -43.30731964111328, -41.017791748046875, -38.728267669677734, -36.438743591308594, -34.14921569824219, -31.859689712524414, -29.57016372680664, -27.2806396484375, -24.991113662719727, -22.701587677001953, -20.412063598632812, -18.12253761291504, -15.833011627197266, -13.543485641479492, -11.253960609436035, -8.964435577392578, -6.674909591674805, -4.385383605957031, -2.095858573913574, 0.1936664581298828, 2.4832000732421875, 4.772725582122803, 7.062251091003418, 9.351776123046875, 11.641302108764648, 13.930828094482422, 16.220352172851562, 18.509878158569336, 20.79940414428711, 23.088930130004883, 25.378456115722656, 27.667980194091797, 29.95750617980957, 32.247032165527344, 34.536556243896484, 36.826080322265625, 39.11560821533203, 41.40513229370117, 43.69466018676758, 45.98418426513672, 48.273712158203125, 50.563236236572266, 52.852760314941406, 55.14228820800781, 57.43181228637695, 59.721336364746094, 62.0108642578125, 64.3003921508789, 66.58991241455078, 68.87944030761719, 71.1689682006836, 73.45848846435547, 75.74801635742188]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 9.0, 9.0, 12.0, 12.0, 20.0, 29.0, 44.0, 60.0, 74.0, 100.0, 159.0, 217.0, 351.0, 520.0, 784.0, 1361.0, 2091.0, 3277.0, 5001.0, 7131.0, 1008935.0, 6348.0, 4238.0, 2786.0, 1785.0, 1105.0, 684.0, 445.0, 301.0, 171.0, 153.0, 90.0, 53.0, 65.0, 36.0, 21.0, 22.0, 15.0, 13.0, 10.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.990504264831543, -12.56213092803955, -12.133756637573242, -11.70538330078125, -11.277009963989258, -10.84863567352295, -10.420262336730957, -9.991888046264648, -9.563514709472656, -9.135141372680664, -8.706767082214355, -8.278393745422363, -7.850019931793213, -7.4216461181640625, -6.99327278137207, -6.56489896774292, -6.1365251541137695, -5.708151340484619, -5.279777526855469, -4.851404190063477, -4.423030376434326, -3.994656562805176, -3.5662829875946045, -3.137909412384033, -2.709535598754883, -2.2811617851257324, -1.8527882099151611, -1.4244145154953003, -0.9960408210754395, -0.5676670074462891, -0.13929343223571777, 0.2890801429748535, 0.7174530029296875, 1.1458266973495483, 1.5742003917694092, 2.0025739669799805, 2.430947780609131, 2.8593215942382812, 3.2876951694488525, 3.716068744659424, 4.144442558288574, 4.572816371917725, 5.001190185546875, 5.429563522338867, 5.857937335968018, 6.286311149597168, 6.71468448638916, 7.1430583000183105, 7.571432113647461, 7.999805927276611, 8.428179740905762, 8.856553077697754, 9.284927368164062, 9.713300704956055, 10.141674041748047, 10.570047378540039, 10.998421669006348, 11.42679500579834, 11.855169296264648, 12.28354263305664, 12.711915969848633, 13.140290260314941, 13.568663597106934, 13.997037887573242, 14.425411224365234]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 12.0, 8.0, 15.0, 24.0, 54.0, 63.0, 105.0, 229.0, 51460032.0, 2305.0, 123.0, 61.0, 49.0, 29.0, 19.0, 17.0, 10.0, 13.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1726.7813720703125, -1664.7305908203125, -1602.679931640625, -1540.629150390625, -1478.578369140625, -1416.527587890625, -1354.4769287109375, -1292.4261474609375, -1230.37548828125, -1168.32470703125, -1106.2740478515625, -1044.2232666015625, -982.1724853515625, -920.1217651367188, -858.071044921875, -796.020263671875, -733.969482421875, -671.9187622070312, -609.8679809570312, -547.8172607421875, -485.7665100097656, -423.71575927734375, -361.6650390625, -299.6142883300781, -237.56353759765625, -175.51278686523438, -113.46205139160156, -51.41131591796875, 10.639434814453125, 72.690185546875, 134.74090576171875, 196.79165649414062, 258.842529296875, 320.8932800292969, 382.94403076171875, 444.9947509765625, 507.0455017089844, 569.0962524414062, 631.14697265625, 693.19775390625, 755.2484741210938, 817.2991943359375, 879.3499755859375, 941.4006958007812, 1003.451416015625, 1065.502197265625, 1127.552978515625, 1189.6036376953125, 1251.6544189453125, 1313.7052001953125, 1375.755859375, 1437.806640625, 1499.857421875, 1561.908203125, 1623.9588623046875, 1686.0096435546875, 1748.060302734375, 1810.111083984375, 1872.1617431640625, 1934.2125244140625, 1996.2633056640625, 2058.31396484375, 2120.36474609375, 2182.41552734375, 2244.46630859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 8.0, 7.0, 13.0, 54.0, 58.0, 88.0, 133.0, 234.0, 353.0, 468.0, 732.0, 1058.0, 1563.0, 2307.0, 3186.0, 4498.0, 6742.0, 10039.0, 14401.0, 20988.0, 30929.0, 46046.0, 69706.0, 106224.0, 161133.0, 248740.0, 394054.0, 3052013.0, 1093062.0, 355477.0, 227539.0, 147541.0, 96341.0, 63142.0, 42700.0, 28219.0, 19250.0, 13356.0, 9092.0, 6197.0, 4341.0, 3002.0, 2110.0, 1378.0, 947.0, 691.0, 472.0, 311.0, 181.0, 142.0, 62.0, 64.0, 23.0, 12.0, 9.0, 5.0, 5.0, 5.0], "bins": [-1.091796875, -1.0595855712890625, -1.027374267578125, -0.9951629638671875, -0.96295166015625, -0.9307403564453125, -0.898529052734375, -0.8663177490234375, -0.8341064453125, -0.8018951416015625, -0.769683837890625, -0.7374725341796875, -0.70526123046875, -0.6730499267578125, -0.640838623046875, -0.6086273193359375, -0.576416015625, -0.5442047119140625, -0.511993408203125, -0.4797821044921875, -0.44757080078125, -0.4153594970703125, -0.383148193359375, -0.3509368896484375, -0.3187255859375, -0.2865142822265625, -0.254302978515625, -0.2220916748046875, -0.18988037109375, -0.1576690673828125, -0.125457763671875, -0.0932464599609375, -0.06103515625, -0.0288238525390625, 0.003387451171875, 0.0355987548828125, 0.06781005859375, 0.1000213623046875, 0.132232666015625, 0.1644439697265625, 0.1966552734375, 0.2288665771484375, 0.261077880859375, 0.2932891845703125, 0.32550048828125, 0.3577117919921875, 0.389923095703125, 0.4221343994140625, 0.454345703125, 0.4865570068359375, 0.518768310546875, 0.5509796142578125, 0.58319091796875, 0.6154022216796875, 0.647613525390625, 0.6798248291015625, 0.7120361328125, 0.7442474365234375, 0.776458740234375, 0.8086700439453125, 0.84088134765625, 0.8730926513671875, 0.905303955078125, 0.9375152587890625, 0.9697265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 14.0, 2.0, 8.0, 14.0, 8.0, 14.0, 14.0, 18.0, 22.0, 23.0, 26.0, 30.0, 32.0, 36.0, 41.0, 37.0, 42.0, 46.0, 51.0, 731.0, 343.0, 54.0, 34.0, 45.0, 30.0, 42.0, 40.0, 34.0, 29.0, 22.0, 16.0, 30.0, 16.0, 15.0, 17.0, 10.0, 10.0, 8.0, 8.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.8984375, -7.65032958984375, -7.4022216796875, -7.15411376953125, -6.906005859375, -6.65789794921875, -6.4097900390625, -6.16168212890625, -5.91357421875, -5.66546630859375, -5.4173583984375, -5.16925048828125, -4.921142578125, -4.67303466796875, -4.4249267578125, -4.17681884765625, -3.9287109375, -3.68060302734375, -3.4324951171875, -3.18438720703125, -2.936279296875, -2.68817138671875, -2.4400634765625, -2.19195556640625, -1.94384765625, -1.69573974609375, -1.4476318359375, -1.19952392578125, -0.951416015625, -0.70330810546875, -0.4552001953125, -0.20709228515625, 0.041015625, 0.28912353515625, 0.5372314453125, 0.78533935546875, 1.033447265625, 1.28155517578125, 1.5296630859375, 1.77777099609375, 2.02587890625, 2.27398681640625, 2.5220947265625, 2.77020263671875, 3.018310546875, 3.26641845703125, 3.5145263671875, 3.76263427734375, 4.0107421875, 4.25885009765625, 4.5069580078125, 4.75506591796875, 5.003173828125, 5.25128173828125, 5.4993896484375, 5.74749755859375, 5.99560546875, 6.24371337890625, 6.4918212890625, 6.73992919921875, 6.988037109375, 7.23614501953125, 7.4842529296875, 7.73236083984375, 7.98046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [7.0, 3.0, 6.0, 7.0, 8.0, 7.0, 10.0, 23.0, 18.0, 36.0, 38.0, 69.0, 102.0, 134.0, 207.0, 290.0, 372.0, 636.0, 887.0, 1349.0, 1977.0, 2887.0, 4530.0, 6635.0, 10320.0, 16065.0, 25570.0, 41831.0, 69907.0, 115802.0, 197367.0, 345831.0, 840729.0, 3528588.0, 458972.0, 248938.0, 146538.0, 85394.0, 51896.0, 32097.0, 19691.0, 12227.0, 7957.0, 5188.0, 3378.0, 2169.0, 1488.0, 1017.0, 755.0, 506.0, 316.0, 230.0, 127.0, 97.0, 68.0, 49.0, 37.0, 28.0, 10.0, 12.0, 8.0, 7.0, 5.0, 3.0], "bins": [-1.51953125, -1.473785400390625, -1.42803955078125, -1.382293701171875, -1.3365478515625, -1.290802001953125, -1.24505615234375, -1.199310302734375, -1.153564453125, -1.107818603515625, -1.06207275390625, -1.016326904296875, -0.9705810546875, -0.924835205078125, -0.87908935546875, -0.833343505859375, -0.78759765625, -0.741851806640625, -0.69610595703125, -0.650360107421875, -0.6046142578125, -0.558868408203125, -0.51312255859375, -0.467376708984375, -0.421630859375, -0.375885009765625, -0.33013916015625, -0.284393310546875, -0.2386474609375, -0.192901611328125, -0.14715576171875, -0.101409912109375, -0.0556640625, -0.009918212890625, 0.03582763671875, 0.081573486328125, 0.1273193359375, 0.173065185546875, 0.21881103515625, 0.264556884765625, 0.310302734375, 0.356048583984375, 0.40179443359375, 0.447540283203125, 0.4932861328125, 0.539031982421875, 0.58477783203125, 0.630523681640625, 0.67626953125, 0.722015380859375, 0.76776123046875, 0.813507080078125, 0.8592529296875, 0.904998779296875, 0.95074462890625, 0.996490478515625, 1.042236328125, 1.087982177734375, 1.13372802734375, 1.179473876953125, 1.2252197265625, 1.270965576171875, 1.31671142578125, 1.362457275390625, 1.408203125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 18.0, 15.0, 13.0, 17.0, 17.0, 19.0, 29.0, 21.0, 26.0, 30.0, 36.0, 29.0, 42.0, 53.0, 47.0, 99.0, 831.0, 219.0, 57.0, 45.0, 35.0, 43.0, 30.0, 29.0, 36.0, 23.0, 26.0, 30.0, 19.0, 13.0, 8.0, 12.0, 7.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.19085693359375, -6.0067138671875, -5.82257080078125, -5.638427734375, -5.45428466796875, -5.2701416015625, -5.08599853515625, -4.90185546875, -4.71771240234375, -4.5335693359375, -4.34942626953125, -4.165283203125, -3.98114013671875, -3.7969970703125, -3.61285400390625, -3.4287109375, -3.24456787109375, -3.0604248046875, -2.87628173828125, -2.692138671875, -2.50799560546875, -2.3238525390625, -2.13970947265625, -1.95556640625, -1.77142333984375, -1.5872802734375, -1.40313720703125, -1.218994140625, -1.03485107421875, -0.8507080078125, -0.66656494140625, -0.482421875, -0.29827880859375, -0.1141357421875, 0.07000732421875, 0.254150390625, 0.43829345703125, 0.6224365234375, 0.80657958984375, 0.99072265625, 1.17486572265625, 1.3590087890625, 1.54315185546875, 1.727294921875, 1.91143798828125, 2.0955810546875, 2.27972412109375, 2.4638671875, 2.64801025390625, 2.8321533203125, 3.01629638671875, 3.200439453125, 3.38458251953125, 3.5687255859375, 3.75286865234375, 3.93701171875, 4.12115478515625, 4.3052978515625, 4.48944091796875, 4.673583984375, 4.85772705078125, 5.0418701171875, 5.22601318359375, 5.41015625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 21.0, 18.0, 13.0, 24.0, 35.0, 63.0, 95.0, 160.0, 196.0, 262.0, 431.0, 704.0, 1039.0, 1594.0, 2842.0, 5476.0, 12968.0, 40532.0, 222391.0, 5886123.0, 77631.0, 21433.0, 7877.0, 3926.0, 1940.0, 1204.0, 810.0, 516.0, 307.0, 230.0, 171.0, 135.0, 88.0, 55.0, 30.0, 21.0, 10.0, 19.0, 5.0, 9.0, 6.0, 2.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.16796875, -6.9384765625, -6.708984375, -6.4794921875, -6.25, -6.0205078125, -5.791015625, -5.5615234375, -5.33203125, -5.1025390625, -4.873046875, -4.6435546875, -4.4140625, -4.1845703125, -3.955078125, -3.7255859375, -3.49609375, -3.2666015625, -3.037109375, -2.8076171875, -2.578125, -2.3486328125, -2.119140625, -1.8896484375, -1.66015625, -1.4306640625, -1.201171875, -0.9716796875, -0.7421875, -0.5126953125, -0.283203125, -0.0537109375, 0.17578125, 0.4052734375, 0.634765625, 0.8642578125, 1.09375, 1.3232421875, 1.552734375, 1.7822265625, 2.01171875, 2.2412109375, 2.470703125, 2.7001953125, 2.9296875, 3.1591796875, 3.388671875, 3.6181640625, 3.84765625, 4.0771484375, 4.306640625, 4.5361328125, 4.765625, 4.9951171875, 5.224609375, 5.4541015625, 5.68359375, 5.9130859375, 6.142578125, 6.3720703125, 6.6015625, 6.8310546875, 7.060546875, 7.2900390625, 7.51953125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 2.0, 9.0, 14.0, 12.0, 27.0, 19.0, 17.0, 27.0, 28.0, 18.0, 25.0, 29.0, 37.0, 31.0, 54.0, 64.0, 162.0, 712.0, 219.0, 72.0, 50.0, 38.0, 44.0, 35.0, 32.0, 30.0, 32.0, 30.0, 22.0, 17.0, 17.0, 20.0, 17.0, 3.0, 5.0, 8.0, 14.0, 1.0, 9.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.2421875, -4.10760498046875, -3.9730224609375, -3.83843994140625, -3.703857421875, -3.56927490234375, -3.4346923828125, -3.30010986328125, -3.16552734375, -3.03094482421875, -2.8963623046875, -2.76177978515625, -2.627197265625, -2.49261474609375, -2.3580322265625, -2.22344970703125, -2.0888671875, -1.95428466796875, -1.8197021484375, -1.68511962890625, -1.550537109375, -1.41595458984375, -1.2813720703125, -1.14678955078125, -1.01220703125, -0.87762451171875, -0.7430419921875, -0.60845947265625, -0.473876953125, -0.33929443359375, -0.2047119140625, -0.07012939453125, 0.064453125, 0.19903564453125, 0.3336181640625, 0.46820068359375, 0.602783203125, 0.73736572265625, 0.8719482421875, 1.00653076171875, 1.14111328125, 1.27569580078125, 1.4102783203125, 1.54486083984375, 1.679443359375, 1.81402587890625, 1.9486083984375, 2.08319091796875, 2.2177734375, 2.35235595703125, 2.4869384765625, 2.62152099609375, 2.756103515625, 2.89068603515625, 3.0252685546875, 3.15985107421875, 3.29443359375, 3.42901611328125, 3.5635986328125, 3.69818115234375, 3.832763671875, 3.96734619140625, 4.1019287109375, 4.23651123046875, 4.37109375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 4.0, 12.0, 27.0, 44.0, 76.0, 159.0, 219.0, 207.0, 124.0, 62.0, 33.0, 15.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.960474491119385, -7.5760579109191895, -7.191641330718994, -6.807224750518799, -6.4228081703186035, -6.038391590118408, -5.653975009918213, -5.269558429718018, -4.885141849517822, -4.500725269317627, -4.116308689117432, -3.7318921089172363, -3.347475528717041, -2.9630589485168457, -2.5786423683166504, -2.194225788116455, -1.8098092079162598, -1.4253926277160645, -1.0409760475158691, -0.6565594673156738, -0.2721428871154785, 0.1122736930847168, 0.4966902732849121, 0.8811068534851074, 1.2655234336853027, 1.649940013885498, 2.0343565940856934, 2.4187731742858887, 2.803189754486084, 3.1876063346862793, 3.5720229148864746, 3.95643949508667, 4.340856552124023, 4.725273132324219, 5.109689712524414, 5.494106292724609, 5.878522872924805, 6.262939453125, 6.647356033325195, 7.031772613525391, 7.416189193725586, 7.800605773925781, 8.185022354125977, 8.569438934326172, 8.953855514526367, 9.338272094726562, 9.722688674926758, 10.107105255126953, 10.491521835327148, 10.875938415527344, 11.260354995727539, 11.644771575927734, 12.02918815612793, 12.413604736328125, 12.79802131652832, 13.182437896728516, 13.566854476928711, 13.951271057128906, 14.335687637329102, 14.720104217529297, 15.104520797729492, 15.488937377929688, 15.873353958129883, 16.257770538330078, 16.642187118530273]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 6.0, 6.0, 18.0, 21.0, 25.0, 34.0, 37.0, 49.0, 57.0, 53.0, 63.0, 62.0, 54.0, 65.0, 71.0, 52.0, 58.0, 43.0, 44.0, 36.0, 30.0, 35.0, 21.0, 10.0, 11.0, 7.0, 8.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.039026260375977, -11.74767017364502, -11.456315040588379, -11.164958953857422, -10.873603820800781, -10.582247734069824, -10.290892601013184, -9.999536514282227, -9.708181381225586, -9.416825294494629, -9.125470161437988, -8.834114074707031, -8.54275894165039, -8.251402854919434, -7.960047245025635, -7.668691635131836, -7.377335548400879, -7.08597993850708, -6.794624328613281, -6.503268718719482, -6.211913108825684, -5.920557022094727, -5.629201412200928, -5.337845802307129, -5.04649019241333, -4.755134582519531, -4.463778972625732, -4.172423362731934, -3.8810675144195557, -3.589711904525757, -3.298356056213379, -3.00700044631958, -2.7156457901000977, -2.424290180206299, -2.1329345703125, -1.841578722000122, -1.5502231121063232, -1.2588675022125244, -0.967511773109436, -0.6761560440063477, -0.38480043411254883, -0.09344476461410522, 0.19791090488433838, 0.489266574382782, 0.7806222438812256, 1.0719778537750244, 1.3633335828781128, 1.6546893119812012, 1.946044921875, 2.237400531768799, 2.5287561416625977, 2.8201119899749756, 3.1114675998687744, 3.4028232097625732, 3.694179058074951, 3.98553466796875, 4.276890277862549, 4.568245887756348, 4.8596014976501465, 5.150957107543945, 5.442313194274902, 5.733668327331543, 6.0250244140625, 6.316380023956299, 6.607735633850098]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 7.0, 8.0, 8.0, 9.0, 6.0, 18.0, 16.0, 26.0, 37.0, 23.0, 24.0, 42.0, 57.0, 67.0, 88.0, 125.0, 183.0, 204.0, 279.0, 371.0, 489.0, 657.0, 1003.0, 1518.0, 2441.0, 4003.0, 7497.0, 16496.0, 51137.0, 3815016.0, 244569.0, 26848.0, 9883.0, 4490.0, 2467.0, 1482.0, 910.0, 544.0, 369.0, 267.0, 160.0, 119.0, 93.0, 73.0, 55.0, 31.0, 17.0, 15.0, 13.0, 6.0, 8.0, 7.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.21533203125, -0.209320068359375, -0.20330810546875, -0.197296142578125, -0.1912841796875, -0.185272216796875, -0.17926025390625, -0.173248291015625, -0.167236328125, -0.161224365234375, -0.15521240234375, -0.149200439453125, -0.1431884765625, -0.137176513671875, -0.13116455078125, -0.125152587890625, -0.119140625, -0.113128662109375, -0.10711669921875, -0.101104736328125, -0.0950927734375, -0.089080810546875, -0.08306884765625, -0.077056884765625, -0.071044921875, -0.065032958984375, -0.05902099609375, -0.053009033203125, -0.0469970703125, -0.040985107421875, -0.03497314453125, -0.028961181640625, -0.02294921875, -0.016937255859375, -0.01092529296875, -0.004913330078125, 0.0010986328125, 0.007110595703125, 0.01312255859375, 0.019134521484375, 0.025146484375, 0.031158447265625, 0.03717041015625, 0.043182373046875, 0.0491943359375, 0.055206298828125, 0.06121826171875, 0.067230224609375, 0.0732421875, 0.079254150390625, 0.08526611328125, 0.091278076171875, 0.0972900390625, 0.103302001953125, 0.10931396484375, 0.115325927734375, 0.121337890625, 0.127349853515625, 0.13336181640625, 0.139373779296875, 0.1453857421875, 0.151397705078125, 0.15740966796875, 0.163421630859375, 0.16943359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 9.0, 11.0, 19.0, 25.0, 11.0, 192.0, 578.0, 40.0, 24.0, 11.0, 8.0, 4.0, 4.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047027587890625, -0.04572153091430664, -0.04441547393798828, -0.04310941696166992, -0.04180335998535156, -0.0404973030090332, -0.039191246032714844, -0.037885189056396484, -0.036579132080078125, -0.035273075103759766, -0.033967018127441406, -0.03266096115112305, -0.03135490417480469, -0.030048847198486328, -0.02874279022216797, -0.02743673324584961, -0.02613067626953125, -0.02482461929321289, -0.02351856231689453, -0.022212505340576172, -0.020906448364257812, -0.019600391387939453, -0.018294334411621094, -0.016988277435302734, -0.015682220458984375, -0.014376163482666016, -0.013070106506347656, -0.011764049530029297, -0.010457992553710938, -0.009151935577392578, -0.007845878601074219, -0.006539821624755859, -0.0052337646484375, -0.003927707672119141, -0.0026216506958007812, -0.0013155937194824219, -9.5367431640625e-06, 0.0012965202331542969, 0.0026025772094726562, 0.003908634185791016, 0.005214691162109375, 0.006520748138427734, 0.007826805114746094, 0.009132862091064453, 0.010438919067382812, 0.011744976043701172, 0.013051033020019531, 0.01435708999633789, 0.01566314697265625, 0.01696920394897461, 0.01827526092529297, 0.019581317901611328, 0.020887374877929688, 0.022193431854248047, 0.023499488830566406, 0.024805545806884766, 0.026111602783203125, 0.027417659759521484, 0.028723716735839844, 0.030029773712158203, 0.03133583068847656, 0.03264188766479492, 0.03394794464111328, 0.03525400161743164, 0.03656005859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 7.0, 12.0, 19.0, 19.0, 28.0, 58.0, 58.0, 131.0, 217.0, 382.0, 735.0, 1591.0, 4370.0, 17279.0, 125155.0, 3731760.0, 271327.0, 29421.0, 7006.0, 2375.0, 1021.0, 531.0, 312.0, 180.0, 103.0, 65.0, 43.0, 24.0, 13.0, 6.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.279541015625, -0.2707023620605469, -0.26186370849609375, -0.2530250549316406, -0.2441864013671875, -0.23534774780273438, -0.22650909423828125, -0.21767044067382812, -0.208831787109375, -0.19999313354492188, -0.19115447998046875, -0.18231582641601562, -0.1734771728515625, -0.16463851928710938, -0.15579986572265625, -0.14696121215820312, -0.13812255859375, -0.12928390502929688, -0.12044525146484375, -0.11160659790039062, -0.1027679443359375, -0.09392929077148438, -0.08509063720703125, -0.07625198364257812, -0.067413330078125, -0.058574676513671875, -0.04973602294921875, -0.040897369384765625, -0.0320587158203125, -0.023220062255859375, -0.01438140869140625, -0.005542755126953125, 0.0032958984375, 0.012134552001953125, 0.02097320556640625, 0.029811859130859375, 0.0386505126953125, 0.047489166259765625, 0.05632781982421875, 0.06516647338867188, 0.074005126953125, 0.08284378051757812, 0.09168243408203125, 0.10052108764648438, 0.1093597412109375, 0.11819839477539062, 0.12703704833984375, 0.13587570190429688, 0.14471435546875, 0.15355300903320312, 0.16239166259765625, 0.17123031616210938, 0.1800689697265625, 0.18890762329101562, 0.19774627685546875, 0.20658493041992188, 0.215423583984375, 0.22426223754882812, 0.23310089111328125, 0.24193954467773438, 0.2507781982421875, 0.2596168518066406, 0.26845550537109375, 0.2772941589355469, 0.2861328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 13.0, 25.0, 24.0, 52.0, 85.0, 152.0, 241.0, 760.0, 1722.0, 411.0, 211.0, 112.0, 92.0, 47.0, 35.0, 28.0, 14.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078125, -0.07525920867919922, -0.07239341735839844, -0.06952762603759766, -0.06666183471679688, -0.0637960433959961, -0.06093025207519531, -0.05806446075439453, -0.05519866943359375, -0.05233287811279297, -0.04946708679199219, -0.046601295471191406, -0.043735504150390625, -0.040869712829589844, -0.03800392150878906, -0.03513813018798828, -0.0322723388671875, -0.02940654754638672, -0.026540756225585938, -0.023674964904785156, -0.020809173583984375, -0.017943382263183594, -0.015077590942382812, -0.012211799621582031, -0.00934600830078125, -0.006480216979980469, -0.0036144256591796875, -0.0007486343383789062, 0.002117156982421875, 0.004982948303222656, 0.007848739624023438, 0.010714530944824219, 0.013580322265625, 0.01644611358642578, 0.019311904907226562, 0.022177696228027344, 0.025043487548828125, 0.027909278869628906, 0.030775070190429688, 0.03364086151123047, 0.03650665283203125, 0.03937244415283203, 0.04223823547363281, 0.045104026794433594, 0.047969818115234375, 0.050835609436035156, 0.05370140075683594, 0.05656719207763672, 0.0594329833984375, 0.06229877471923828, 0.06516456604003906, 0.06803035736083984, 0.07089614868164062, 0.0737619400024414, 0.07662773132324219, 0.07949352264404297, 0.08235931396484375, 0.08522510528564453, 0.08809089660644531, 0.0909566879272461, 0.09382247924804688, 0.09668827056884766, 0.09955406188964844, 0.10241985321044922, 0.10528564453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 17.0, 17.0, 35.0, 130.0, 306.0, 268.0, 110.0, 54.0, 27.0, 20.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27859652042388916, -0.2547541856765747, -0.23091186583042145, -0.2070695459842682, -0.18322721123695374, -0.15938489139080048, -0.13554257154464722, -0.11170023679733276, -0.0878579169511795, -0.06401558965444565, -0.04017326608300209, -0.016330942511558533, 0.0075113847851753235, 0.03135371208190918, 0.05519603192806244, 0.07903836667537689, 0.10288068652153015, 0.1267230063676834, 0.15056534111499786, 0.17440766096115112, 0.19824999570846558, 0.22209231555461884, 0.2459346354007721, 0.26977697014808655, 0.2936192750930786, 0.31746160984039307, 0.34130391478538513, 0.3651462495326996, 0.38898858428001404, 0.4128308892250061, 0.43667322397232056, 0.460515558719635, 0.48435789346694946, 0.5082002282142639, 0.5320425629615784, 0.555884838104248, 0.5797271728515625, 0.603569507598877, 0.6274118423461914, 0.6512541770935059, 0.6750965118408203, 0.6989388465881348, 0.7227811813354492, 0.7466235160827637, 0.7704657912254333, 0.7943081259727478, 0.8181504607200623, 0.8419927954673767, 0.8658350706100464, 0.8896774053573608, 0.9135197401046753, 0.9373620748519897, 0.9612043499946594, 0.9850466847419739, 1.0088889598846436, 1.032731294631958, 1.056573748588562, 1.0804160833358765, 1.104258418083191, 1.1281007528305054, 1.1519430875778198, 1.1757854223251343, 1.1996276378631592, 1.2234699726104736, 1.247312307357788]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 11.0, 15.0, 25.0, 33.0, 47.0, 45.0, 83.0, 105.0, 92.0, 93.0, 85.0, 95.0, 68.0, 59.0, 48.0, 33.0, 27.0, 9.0, 11.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5118328332901001, -0.4925919473171234, -0.47335106134414673, -0.45411017537117004, -0.43486928939819336, -0.41562843322753906, -0.3963875472545624, -0.3771466612815857, -0.357905775308609, -0.3386648893356323, -0.31942400336265564, -0.30018311738967896, -0.28094226121902466, -0.2617013454437256, -0.2424604892730713, -0.2232196033000946, -0.20397871732711792, -0.18473783135414124, -0.16549694538116455, -0.14625607430934906, -0.12701518833637238, -0.10777430236339569, -0.0885334238409996, -0.06929254531860352, -0.05005165934562683, -0.030810777097940445, -0.011569894850254059, 0.007670987397432327, 0.026911869645118713, 0.0461527556180954, 0.06539363414049149, 0.08463451266288757, 0.10387545824050903, 0.12311634421348572, 0.1423572301864624, 0.1615981012582779, 0.18083898723125458, 0.20007987320423126, 0.21932074427604675, 0.23856163024902344, 0.2578025162220001, 0.2770434021949768, 0.2962842881679535, 0.3155251741409302, 0.3347660303115845, 0.35400694608688354, 0.37324780225753784, 0.3924886882305145, 0.4117295742034912, 0.4309704601764679, 0.4502113461494446, 0.46945223212242126, 0.48869311809539795, 0.5079339742660522, 0.5271748900413513, 0.5464157462120056, 0.5656566619873047, 0.584897518157959, 0.6041384339332581, 0.6233792901039124, 0.6426202058792114, 0.6618610620498657, 0.6811019778251648, 0.7003428339958191, 0.7195836901664734]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 14.0, 25.0, 28.0, 44.0, 74.0, 60.0, 101.0, 173.0, 262.0, 400.0, 623.0, 1040.0, 1758.0, 3310.0, 6119.0, 14257.0, 56274.0, 857552.0, 75473.0, 15926.0, 6779.0, 3426.0, 1874.0, 1063.0, 639.0, 408.0, 285.0, 164.0, 106.0, 82.0, 62.0, 37.0, 28.0, 17.0, 13.0, 14.0, 7.0, 6.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.217010498046875, -0.20941162109375, -0.201812744140625, -0.1942138671875, -0.186614990234375, -0.17901611328125, -0.171417236328125, -0.163818359375, -0.156219482421875, -0.14862060546875, -0.141021728515625, -0.1334228515625, -0.125823974609375, -0.11822509765625, -0.110626220703125, -0.10302734375, -0.095428466796875, -0.08782958984375, -0.080230712890625, -0.0726318359375, -0.065032958984375, -0.05743408203125, -0.049835205078125, -0.042236328125, -0.034637451171875, -0.02703857421875, -0.019439697265625, -0.0118408203125, -0.004241943359375, 0.00335693359375, 0.010955810546875, 0.0185546875, 0.026153564453125, 0.03375244140625, 0.041351318359375, 0.0489501953125, 0.056549072265625, 0.06414794921875, 0.071746826171875, 0.079345703125, 0.086944580078125, 0.09454345703125, 0.102142333984375, 0.1097412109375, 0.117340087890625, 0.12493896484375, 0.132537841796875, 0.14013671875, 0.147735595703125, 0.15533447265625, 0.162933349609375, 0.1705322265625, 0.178131103515625, 0.18572998046875, 0.193328857421875, 0.200927734375, 0.208526611328125, 0.21612548828125, 0.223724365234375, 0.2313232421875, 0.238922119140625, 0.24652099609375, 0.254119873046875, 0.26171875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 5.0, 4.0, 15.0, 12.0, 21.0, 50.0, 158.0, 332.0, 229.0, 75.0, 30.0, 11.0, 10.0, 5.0, 4.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05517578125, -0.05362272262573242, -0.052069664001464844, -0.050516605377197266, -0.04896354675292969, -0.04741048812866211, -0.04585742950439453, -0.04430437088012695, -0.042751312255859375, -0.0411982536315918, -0.03964519500732422, -0.03809213638305664, -0.03653907775878906, -0.034986019134521484, -0.033432960510253906, -0.03187990188598633, -0.03032684326171875, -0.028773784637451172, -0.027220726013183594, -0.025667667388916016, -0.024114608764648438, -0.02256155014038086, -0.02100849151611328, -0.019455432891845703, -0.017902374267578125, -0.016349315643310547, -0.014796257019042969, -0.01324319839477539, -0.011690139770507812, -0.010137081146240234, -0.008584022521972656, -0.007030963897705078, -0.0054779052734375, -0.003924846649169922, -0.0023717880249023438, -0.0008187294006347656, 0.0007343292236328125, 0.0022873878479003906, 0.0038404464721679688, 0.005393505096435547, 0.006946563720703125, 0.008499622344970703, 0.010052680969238281, 0.01160573959350586, 0.013158798217773438, 0.014711856842041016, 0.016264915466308594, 0.017817974090576172, 0.01937103271484375, 0.020924091339111328, 0.022477149963378906, 0.024030208587646484, 0.025583267211914062, 0.02713632583618164, 0.02868938446044922, 0.030242443084716797, 0.031795501708984375, 0.03334856033325195, 0.03490161895751953, 0.03645467758178711, 0.03800773620605469, 0.039560794830322266, 0.041113853454589844, 0.04266691207885742, 0.044219970703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 2.0, 7.0, 11.0, 9.0, 12.0, 26.0, 41.0, 59.0, 106.0, 218.0, 540.0, 1660.0, 7799.0, 67616.0, 844158.0, 112145.0, 10761.0, 2151.0, 680.0, 251.0, 117.0, 63.0, 36.0, 26.0, 16.0, 8.0, 4.0, 10.0, 13.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47705078125, -0.4628486633300781, -0.44864654541015625, -0.4344444274902344, -0.4202423095703125, -0.4060401916503906, -0.39183807373046875, -0.3776359558105469, -0.363433837890625, -0.3492317199707031, -0.33502960205078125, -0.3208274841308594, -0.3066253662109375, -0.2924232482910156, -0.27822113037109375, -0.2640190124511719, -0.24981689453125, -0.23561477661132812, -0.22141265869140625, -0.20721054077148438, -0.1930084228515625, -0.17880630493164062, -0.16460418701171875, -0.15040206909179688, -0.136199951171875, -0.12199783325195312, -0.10779571533203125, -0.09359359741210938, -0.0793914794921875, -0.06518936157226562, -0.05098724365234375, -0.036785125732421875, -0.0225830078125, -0.008380889892578125, 0.00582122802734375, 0.020023345947265625, 0.0342254638671875, 0.048427581787109375, 0.06262969970703125, 0.07683181762695312, 0.091033935546875, 0.10523605346679688, 0.11943817138671875, 0.13364028930664062, 0.1478424072265625, 0.16204452514648438, 0.17624664306640625, 0.19044876098632812, 0.20465087890625, 0.21885299682617188, 0.23305511474609375, 0.24725723266601562, 0.2614593505859375, 0.2756614685058594, 0.28986358642578125, 0.3040657043457031, 0.318267822265625, 0.3324699401855469, 0.34667205810546875, 0.3608741760253906, 0.3750762939453125, 0.3892784118652344, 0.40348052978515625, 0.4176826477050781, 0.431884765625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 9.0, 10.0, 11.0, 9.0, 20.0, 20.0, 18.0, 27.0, 18.0, 36.0, 27.0, 23.0, 41.0, 35.0, 37.0, 34.0, 45.0, 42.0, 31.0, 33.0, 46.0, 43.0, 44.0, 46.0, 32.0, 33.0, 28.0, 22.0, 34.0, 16.0, 23.0, 23.0, 10.0, 20.0, 13.0, 4.0, 11.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.15178489685058594, -0.14646530151367188, -0.1411457061767578, -0.13582611083984375, -0.1305065155029297, -0.12518692016601562, -0.11986732482910156, -0.1145477294921875, -0.10922813415527344, -0.10390853881835938, -0.09858894348144531, -0.09326934814453125, -0.08794975280761719, -0.08263015747070312, -0.07731056213378906, -0.071990966796875, -0.06667137145996094, -0.061351776123046875, -0.05603218078613281, -0.05071258544921875, -0.04539299011230469, -0.040073394775390625, -0.03475379943847656, -0.0294342041015625, -0.024114608764648438, -0.018795013427734375, -0.013475418090820312, -0.00815582275390625, -0.0028362274169921875, 0.002483367919921875, 0.0078029632568359375, 0.01312255859375, 0.018442153930664062, 0.023761749267578125, 0.029081344604492188, 0.03440093994140625, 0.03972053527832031, 0.045040130615234375, 0.05035972595214844, 0.0556793212890625, 0.06099891662597656, 0.06631851196289062, 0.07163810729980469, 0.07695770263671875, 0.08227729797363281, 0.08759689331054688, 0.09291648864746094, 0.098236083984375, 0.10355567932128906, 0.10887527465820312, 0.11419486999511719, 0.11951446533203125, 0.12483406066894531, 0.13015365600585938, 0.13547325134277344, 0.1407928466796875, 0.14611244201660156, 0.15143203735351562, 0.1567516326904297, 0.16207122802734375, 0.1673908233642578, 0.17271041870117188, 0.17803001403808594, 0.183349609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 6.0, 4.0, 7.0, 6.0, 5.0, 13.0, 16.0, 24.0, 32.0, 46.0, 59.0, 72.0, 128.0, 200.0, 366.0, 613.0, 1093.0, 2227.0, 6290.0, 38004.0, 927846.0, 58286.0, 7846.0, 2529.0, 1154.0, 600.0, 369.0, 225.0, 138.0, 109.0, 70.0, 50.0, 28.0, 25.0, 14.0, 8.0, 9.0, 7.0, 7.0, 5.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.37060546875, -0.3601875305175781, -0.34976959228515625, -0.3393516540527344, -0.3289337158203125, -0.3185157775878906, -0.30809783935546875, -0.2976799011230469, -0.287261962890625, -0.2768440246582031, -0.26642608642578125, -0.2560081481933594, -0.2455902099609375, -0.23517227172851562, -0.22475433349609375, -0.21433639526367188, -0.20391845703125, -0.19350051879882812, -0.18308258056640625, -0.17266464233398438, -0.1622467041015625, -0.15182876586914062, -0.14141082763671875, -0.13099288940429688, -0.120574951171875, -0.11015701293945312, -0.09973907470703125, -0.08932113647460938, -0.0789031982421875, -0.06848526000976562, -0.05806732177734375, -0.047649383544921875, -0.0372314453125, -0.026813507080078125, -0.01639556884765625, -0.005977630615234375, 0.0044403076171875, 0.014858245849609375, 0.02527618408203125, 0.035694122314453125, 0.046112060546875, 0.056529998779296875, 0.06694793701171875, 0.07736587524414062, 0.0877838134765625, 0.09820175170898438, 0.10861968994140625, 0.11903762817382812, 0.12945556640625, 0.13987350463867188, 0.15029144287109375, 0.16070938110351562, 0.1711273193359375, 0.18154525756835938, 0.19196319580078125, 0.20238113403320312, 0.212799072265625, 0.22321701049804688, 0.23363494873046875, 0.24405288696289062, 0.2544708251953125, 0.2648887634277344, 0.27530670166015625, 0.2857246398925781, 0.296142578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 5.0, 8.0, 10.0, 7.0, 22.0, 23.0, 46.0, 72.0, 166.0, 354.0, 95.0, 55.0, 33.0, 32.0, 17.0, 11.0, 6.0, 6.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027408599853515625, -0.0026322901248931885, -0.0025237202644348145, -0.0024151504039764404, -0.0023065805435180664, -0.0021980106830596924, -0.0020894408226013184, -0.0019808709621429443, -0.0018723011016845703, -0.0017637312412261963, -0.0016551613807678223, -0.0015465915203094482, -0.0014380216598510742, -0.0013294517993927002, -0.0012208819389343262, -0.0011123120784759521, -0.0010037422180175781, -0.0008951723575592041, -0.0007866024971008301, -0.0006780326366424561, -0.000569462776184082, -0.000460892915725708, -0.000352323055267334, -0.00024375319480895996, -0.00013518333435058594, -2.6613473892211914e-05, 8.195638656616211e-05, 0.00019052624702453613, 0.00029909610748291016, 0.0004076659679412842, 0.0005162358283996582, 0.0006248056888580322, 0.0007333755493164062, 0.0008419454097747803, 0.0009505152702331543, 0.0010590851306915283, 0.0011676549911499023, 0.0012762248516082764, 0.0013847947120666504, 0.0014933645725250244, 0.0016019344329833984, 0.0017105042934417725, 0.0018190741539001465, 0.0019276440143585205, 0.0020362138748168945, 0.0021447837352752686, 0.0022533535957336426, 0.0023619234561920166, 0.0024704933166503906, 0.0025790631771087646, 0.0026876330375671387, 0.0027962028980255127, 0.0029047727584838867, 0.0030133426189422607, 0.0031219124794006348, 0.003230482339859009, 0.003339052200317383, 0.003447622060775757, 0.003556191921234131, 0.003664761781692505, 0.003773331642150879, 0.003881901502609253, 0.003990471363067627, 0.004099041223526001, 0.004207611083984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 4.0, 14.0, 19.0, 14.0, 24.0, 37.0, 46.0, 65.0, 91.0, 126.0, 209.0, 283.0, 458.0, 713.0, 1216.0, 2078.0, 3726.0, 7742.0, 17547.0, 52170.0, 308153.0, 536997.0, 75093.0, 22438.0, 8983.0, 4202.0, 2293.0, 1324.0, 784.0, 511.0, 342.0, 214.0, 183.0, 118.0, 100.0, 60.0, 32.0, 30.0, 26.0, 15.0, 24.0, 13.0, 4.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.136474609375, -0.132354736328125, -0.12823486328125, -0.124114990234375, -0.1199951171875, -0.115875244140625, -0.11175537109375, -0.107635498046875, -0.103515625, -0.099395751953125, -0.09527587890625, -0.091156005859375, -0.0870361328125, -0.082916259765625, -0.07879638671875, -0.074676513671875, -0.070556640625, -0.066436767578125, -0.06231689453125, -0.058197021484375, -0.0540771484375, -0.049957275390625, -0.04583740234375, -0.041717529296875, -0.03759765625, -0.033477783203125, -0.02935791015625, -0.025238037109375, -0.0211181640625, -0.016998291015625, -0.01287841796875, -0.008758544921875, -0.004638671875, -0.000518798828125, 0.00360107421875, 0.007720947265625, 0.0118408203125, 0.015960693359375, 0.02008056640625, 0.024200439453125, 0.0283203125, 0.032440185546875, 0.03656005859375, 0.040679931640625, 0.0447998046875, 0.048919677734375, 0.05303955078125, 0.057159423828125, 0.061279296875, 0.065399169921875, 0.06951904296875, 0.073638916015625, 0.0777587890625, 0.081878662109375, 0.08599853515625, 0.090118408203125, 0.09423828125, 0.098358154296875, 0.10247802734375, 0.106597900390625, 0.1107177734375, 0.114837646484375, 0.11895751953125, 0.123077392578125, 0.127197265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 8.0, 6.0, 6.0, 7.0, 8.0, 10.0, 11.0, 13.0, 17.0, 33.0, 17.0, 33.0, 44.0, 57.0, 94.0, 93.0, 77.0, 88.0, 61.0, 62.0, 46.0, 37.0, 32.0, 32.0, 21.0, 20.0, 18.0, 11.0, 7.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1636962890625, -0.1591930389404297, -0.15468978881835938, -0.15018653869628906, -0.14568328857421875, -0.14118003845214844, -0.13667678833007812, -0.1321735382080078, -0.1276702880859375, -0.12316703796386719, -0.11866378784179688, -0.11416053771972656, -0.10965728759765625, -0.10515403747558594, -0.10065078735351562, -0.09614753723144531, -0.091644287109375, -0.08714103698730469, -0.08263778686523438, -0.07813453674316406, -0.07363128662109375, -0.06912803649902344, -0.06462478637695312, -0.06012153625488281, -0.0556182861328125, -0.05111503601074219, -0.046611785888671875, -0.04210853576660156, -0.03760528564453125, -0.03310203552246094, -0.028598785400390625, -0.024095535278320312, -0.01959228515625, -0.015089035034179688, -0.010585784912109375, -0.0060825347900390625, -0.00157928466796875, 0.0029239654541015625, 0.007427215576171875, 0.011930465698242188, 0.0164337158203125, 0.020936965942382812, 0.025440216064453125, 0.029943466186523438, 0.03444671630859375, 0.03894996643066406, 0.043453216552734375, 0.04795646667480469, 0.052459716796875, 0.05696296691894531, 0.061466217041015625, 0.06596946716308594, 0.07047271728515625, 0.07497596740722656, 0.07947921752929688, 0.08398246765136719, 0.0884857177734375, 0.09298896789550781, 0.09749221801757812, 0.10199546813964844, 0.10649871826171875, 0.11100196838378906, 0.11550521850585938, 0.12000846862792969, 0.12451171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 35.0, 288.0, 468.0, 122.0, 38.0, 16.0, 14.0, 7.0, 6.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.625552654266357, -5.473827362060547, -5.322101593017578, -5.170376300811768, -5.018650531768799, -4.866925239562988, -4.7151994705200195, -4.563474178314209, -4.411748886108398, -4.260023593902588, -4.108297824859619, -3.9565722942352295, -3.80484676361084, -3.6531214714050293, -3.5013959407806396, -3.34967041015625, -3.1979446411132812, -3.0462191104888916, -2.894493579864502, -2.7427680492401123, -2.5910425186157227, -2.439317226409912, -2.2875916957855225, -2.135866165161133, -1.9841406345367432, -1.8324151039123535, -1.6806895732879639, -1.5289641618728638, -1.3772386312484741, -1.2255131006240845, -1.0737876892089844, -0.9220621585845947, -0.7703366279602051, -0.6186110973358154, -0.46688562631607056, -0.3151601254940033, -0.16343462467193604, -0.011709094047546387, 0.1400163769721985, 0.29174184799194336, 0.443467378616333, 0.5951929092407227, 0.7469183802604675, 0.8986438512802124, 1.050369381904602, 1.2020949125289917, 1.3538203239440918, 1.5055458545684814, 1.657271385192871, 1.8089969158172607, 1.9607224464416504, 2.11244797706604, 2.2641735076904297, 2.4158987998962402, 2.56762433052063, 2.7193498611450195, 2.871075391769409, 3.022800922393799, 3.1745264530181885, 3.326251983642578, 3.4779772758483887, 3.6297030448913574, 3.781428337097168, 3.9331538677215576, 4.084879398345947]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 2.0, 6.0, 3.0, 7.0, 13.0, 26.0, 40.0, 63.0, 84.0, 123.0, 141.0, 140.0, 97.0, 90.0, 57.0, 28.0, 22.0, 13.0, 6.0, 2.0, 7.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.130622625350952, -3.0262396335601807, -2.9218568801879883, -2.817473888397217, -2.7130911350250244, -2.608708143234253, -2.5043253898620605, -2.399942398071289, -2.2955594062805176, -2.191176414489746, -2.0867936611175537, -1.9824106693267822, -1.8780279159545898, -1.7736449241638184, -1.6692620515823364, -1.5648791790008545, -1.460496425628662, -1.3561135530471802, -1.2517306804656982, -1.1473476886749268, -1.0429649353027344, -0.9385820031166077, -0.834199070930481, -0.729816198348999, -0.6254333257675171, -0.5210504531860352, -0.41666755080223083, -0.3122846484184265, -0.20790177583694458, -0.10351890325546265, 0.0008640289306640625, 0.105246901512146, 0.20962977409362793, 0.31401264667510986, 0.4183955490589142, 0.5227784514427185, 0.6271613240242004, 0.7315441966056824, 0.8359271287918091, 0.940310001373291, 1.044692873954773, 1.1490757465362549, 1.2534586191177368, 1.3578414916992188, 1.4622244834899902, 1.5666072368621826, 1.670990228652954, 1.775373101234436, 1.879755973815918, 1.9841388463974, 2.088521718978882, 2.1929047107696533, 2.2972874641418457, 2.401670455932617, 2.5060534477233887, 2.610436201095581, 2.7148189544677734, 2.819201946258545, 2.9235846996307373, 3.027967691421509, 3.132350444793701, 3.2367334365844727, 3.341116428375244, 3.4454991817474365, 3.549882173538208]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 11.0, 10.0, 19.0, 28.0, 69.0, 133.0, 399.0, 1411.0, 8174.0, 3873327.0, 304272.0, 4911.0, 941.0, 321.0, 135.0, 55.0, 30.0, 11.0, 4.0, 12.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.134765625, -2.088287353515625, -2.04180908203125, -1.995330810546875, -1.9488525390625, -1.902374267578125, -1.85589599609375, -1.809417724609375, -1.762939453125, -1.716461181640625, -1.66998291015625, -1.623504638671875, -1.5770263671875, -1.530548095703125, -1.48406982421875, -1.437591552734375, -1.39111328125, -1.344635009765625, -1.29815673828125, -1.251678466796875, -1.2052001953125, -1.158721923828125, -1.11224365234375, -1.065765380859375, -1.019287109375, -0.972808837890625, -0.92633056640625, -0.879852294921875, -0.8333740234375, -0.786895751953125, -0.74041748046875, -0.693939208984375, -0.6474609375, -0.600982666015625, -0.55450439453125, -0.508026123046875, -0.4615478515625, -0.415069580078125, -0.36859130859375, -0.322113037109375, -0.275634765625, -0.229156494140625, -0.18267822265625, -0.136199951171875, -0.0897216796875, -0.043243408203125, 0.00323486328125, 0.049713134765625, 0.09619140625, 0.142669677734375, 0.18914794921875, 0.235626220703125, 0.2821044921875, 0.328582763671875, 0.37506103515625, 0.421539306640625, 0.468017578125, 0.514495849609375, 0.56097412109375, 0.607452392578125, 0.6539306640625, 0.700408935546875, 0.74688720703125, 0.793365478515625, 0.83984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 5.0, 7.0, 13.0, 16.0, 16.0, 22.0, 38.0, 72.0, 113.0, 160.0, 170.0, 127.0, 73.0, 55.0, 32.0, 20.0, 10.0, 7.0, 8.0, 7.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034576416015625, -0.033463478088378906, -0.03235054016113281, -0.03123760223388672, -0.030124664306640625, -0.02901172637939453, -0.027898788452148438, -0.026785850524902344, -0.02567291259765625, -0.024559974670410156, -0.023447036743164062, -0.02233409881591797, -0.021221160888671875, -0.02010822296142578, -0.018995285034179688, -0.017882347106933594, -0.0167694091796875, -0.015656471252441406, -0.014543533325195312, -0.013430595397949219, -0.012317657470703125, -0.011204719543457031, -0.010091781616210938, -0.008978843688964844, -0.00786590576171875, -0.006752967834472656, -0.0056400299072265625, -0.004527091979980469, -0.003414154052734375, -0.0023012161254882812, -0.0011882781982421875, -7.534027099609375e-05, 0.00103759765625, 0.0021505355834960938, 0.0032634735107421875, 0.004376411437988281, 0.005489349365234375, 0.006602287292480469, 0.0077152252197265625, 0.008828163146972656, 0.00994110107421875, 0.011054039001464844, 0.012166976928710938, 0.013279914855957031, 0.014392852783203125, 0.015505790710449219, 0.016618728637695312, 0.017731666564941406, 0.0188446044921875, 0.019957542419433594, 0.021070480346679688, 0.02218341827392578, 0.023296356201171875, 0.02440929412841797, 0.025522232055664062, 0.026635169982910156, 0.02774810791015625, 0.028861045837402344, 0.029973983764648438, 0.03108692169189453, 0.032199859619140625, 0.03331279754638672, 0.03442573547363281, 0.035538673400878906, 0.036651611328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 9.0, 13.0, 17.0, 41.0, 80.0, 142.0, 350.0, 697.0, 1549.0, 4021.0, 11684.0, 53695.0, 3676558.0, 400740.0, 30979.0, 8265.0, 2945.0, 1264.0, 627.0, 313.0, 133.0, 79.0, 39.0, 24.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2490234375, -0.2350616455078125, -0.221099853515625, -0.2071380615234375, -0.19317626953125, -0.1792144775390625, -0.165252685546875, -0.1512908935546875, -0.1373291015625, -0.1233673095703125, -0.109405517578125, -0.0954437255859375, -0.08148193359375, -0.0675201416015625, -0.053558349609375, -0.0395965576171875, -0.025634765625, -0.0116729736328125, 0.002288818359375, 0.0162506103515625, 0.03021240234375, 0.0441741943359375, 0.058135986328125, 0.0720977783203125, 0.0860595703125, 0.1000213623046875, 0.113983154296875, 0.1279449462890625, 0.14190673828125, 0.1558685302734375, 0.169830322265625, 0.1837921142578125, 0.19775390625, 0.2117156982421875, 0.225677490234375, 0.2396392822265625, 0.25360107421875, 0.2675628662109375, 0.281524658203125, 0.2954864501953125, 0.3094482421875, 0.3234100341796875, 0.337371826171875, 0.3513336181640625, 0.36529541015625, 0.3792572021484375, 0.393218994140625, 0.4071807861328125, 0.421142578125, 0.4351043701171875, 0.449066162109375, 0.4630279541015625, 0.47698974609375, 0.4909515380859375, 0.504913330078125, 0.5188751220703125, 0.5328369140625, 0.5467987060546875, 0.560760498046875, 0.5747222900390625, 0.58868408203125, 0.6026458740234375, 0.616607666015625, 0.6305694580078125, 0.64453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 1.0, 9.0, 9.0, 13.0, 18.0, 34.0, 49.0, 72.0, 126.0, 337.0, 1952.0, 1033.0, 157.0, 79.0, 36.0, 33.0, 18.0, 17.0, 15.0, 14.0, 10.0, 10.0, 3.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053497314453125, -0.05150556564331055, -0.049513816833496094, -0.04752206802368164, -0.04553031921386719, -0.043538570404052734, -0.04154682159423828, -0.03955507278442383, -0.037563323974609375, -0.03557157516479492, -0.03357982635498047, -0.031588077545166016, -0.029596328735351562, -0.02760457992553711, -0.025612831115722656, -0.023621082305908203, -0.02162933349609375, -0.019637584686279297, -0.017645835876464844, -0.01565408706665039, -0.013662338256835938, -0.011670589447021484, -0.009678840637207031, -0.007687091827392578, -0.005695343017578125, -0.003703594207763672, -0.0017118453979492188, 0.0002799034118652344, 0.0022716522216796875, 0.004263401031494141, 0.006255149841308594, 0.008246898651123047, 0.0102386474609375, 0.012230396270751953, 0.014222145080566406, 0.01621389389038086, 0.018205642700195312, 0.020197391510009766, 0.02218914031982422, 0.024180889129638672, 0.026172637939453125, 0.028164386749267578, 0.03015613555908203, 0.032147884368896484, 0.03413963317871094, 0.03613138198852539, 0.038123130798339844, 0.0401148796081543, 0.04210662841796875, 0.0440983772277832, 0.046090126037597656, 0.04808187484741211, 0.05007362365722656, 0.052065372467041016, 0.05405712127685547, 0.05604887008666992, 0.058040618896484375, 0.06003236770629883, 0.06202411651611328, 0.06401586532592773, 0.06600761413574219, 0.06799936294555664, 0.0699911117553711, 0.07198286056518555, 0.073974609375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 25.0, 54.0, 649.0, 237.0, 25.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.913608968257904, -0.8558057546615601, -0.7980024814605713, -0.7401992678642273, -0.6823960542678833, -0.6245927810668945, -0.5667895674705505, -0.5089863538742065, -0.45118311047554016, -0.3933798670768738, -0.3355766534805298, -0.2777734100818634, -0.21997018158435822, -0.16216695308685303, -0.10436370968818665, -0.04656049609184265, 0.01124274730682373, 0.06904597580432892, 0.1268492043018341, 0.1846524477005005, 0.24245567619800568, 0.30025890469551086, 0.35806214809417725, 0.41586536169052124, 0.4736686050891876, 0.531471848487854, 0.589275062084198, 0.647078275680542, 0.7048815488815308, 0.7626847624778748, 0.8204879760742188, 0.8782912492752075, 0.9360944032669067, 0.9938976168632507, 1.0517008304595947, 1.1095041036605835, 1.1673073768615723, 1.2251105308532715, 1.2829138040542603, 1.340717077255249, 1.3985202312469482, 1.456323504447937, 1.5141266584396362, 1.571929931640625, 1.6297332048416138, 1.687536358833313, 1.7453396320343018, 1.803142786026001, 1.8609461784362793, 1.918749451637268, 1.9765526056289673, 2.034355878829956, 2.0921590328216553, 2.1499624252319336, 2.207765579223633, 2.265568733215332, 2.3233718872070312, 2.3811750411987305, 2.438978433609009, 2.496781587600708, 2.5545847415924072, 2.6123881340026855, 2.6701912879943848, 2.727994441986084, 2.7857978343963623]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 8.0, 10.0, 18.0, 10.0, 30.0, 38.0, 38.0, 72.0, 71.0, 67.0, 94.0, 98.0, 92.0, 67.0, 77.0, 65.0, 33.0, 28.0, 15.0, 16.0, 14.0, 4.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36985695362091064, -0.3587307333946228, -0.34760454297065735, -0.3364783227443695, -0.32535210251808167, -0.3142258822917938, -0.30309969186782837, -0.2919734716415405, -0.2808472514152527, -0.26972103118896484, -0.2585948407649994, -0.24746862053871155, -0.2363424003124237, -0.22521619498729706, -0.2140899896621704, -0.20296376943588257, -0.19183756411075592, -0.18071135878562927, -0.16958513855934143, -0.15845893323421478, -0.14733271300792694, -0.1362065076828003, -0.12508028745651245, -0.1139540821313858, -0.10282786935567856, -0.09170165657997131, -0.08057544380426407, -0.06944923102855682, -0.05832302197813988, -0.04719680920243263, -0.036070600152015686, -0.02494438737630844, -0.013818174600601196, -0.002691962756216526, 0.008434249088168144, 0.01956046000123024, 0.030686672776937485, 0.04181288555264473, 0.052939094603061676, 0.06406530737876892, 0.07519152015447617, 0.08631773293018341, 0.09744394570589066, 0.1085701584815979, 0.11969636380672455, 0.1308225840330124, 0.14194878935813904, 0.15307500958442688, 0.16420121490955353, 0.17532742023468018, 0.18645364046096802, 0.19757984578609467, 0.2087060660123825, 0.21983227133750916, 0.230958491563797, 0.24208469688892365, 0.2532109022140503, 0.26433712244033813, 0.2754633128643036, 0.28658953309059143, 0.2977157533168793, 0.3088419735431671, 0.31996816396713257, 0.3310943841934204, 0.34222060441970825]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 22.0, 20.0, 32.0, 29.0, 57.0, 87.0, 123.0, 172.0, 275.0, 363.0, 665.0, 980.0, 1647.0, 2619.0, 4718.0, 9049.0, 19721.0, 55210.0, 250457.0, 544867.0, 99547.0, 30051.0, 12597.0, 6331.0, 3467.0, 1931.0, 1251.0, 737.0, 474.0, 326.0, 232.0, 159.0, 94.0, 65.0, 48.0, 32.0, 23.0, 17.0, 15.0, 11.0, 7.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13027191162109375, -0.1256561279296875, -0.12104034423828125, -0.116424560546875, -0.11180877685546875, -0.1071929931640625, -0.10257720947265625, -0.09796142578125, -0.09334564208984375, -0.0887298583984375, -0.08411407470703125, -0.079498291015625, -0.07488250732421875, -0.0702667236328125, -0.06565093994140625, -0.06103515625, -0.05641937255859375, -0.0518035888671875, -0.04718780517578125, -0.042572021484375, -0.03795623779296875, -0.0333404541015625, -0.02872467041015625, -0.02410888671875, -0.01949310302734375, -0.0148773193359375, -0.01026153564453125, -0.005645751953125, -0.00102996826171875, 0.0035858154296875, 0.00820159912109375, 0.0128173828125, 0.01743316650390625, 0.0220489501953125, 0.02666473388671875, 0.031280517578125, 0.03589630126953125, 0.0405120849609375, 0.04512786865234375, 0.04974365234375, 0.05435943603515625, 0.0589752197265625, 0.06359100341796875, 0.068206787109375, 0.07282257080078125, 0.0774383544921875, 0.08205413818359375, 0.086669921875, 0.09128570556640625, 0.0959014892578125, 0.10051727294921875, 0.105133056640625, 0.10974884033203125, 0.1143646240234375, 0.11898040771484375, 0.12359619140625, 0.12821197509765625, 0.1328277587890625, 0.13744354248046875, 0.142059326171875, 0.14667510986328125, 0.1512908935546875, 0.15590667724609375, 0.1605224609375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 5.0, 1.0, 11.0, 7.0, 19.0, 9.0, 16.0, 18.0, 48.0, 50.0, 79.0, 93.0, 118.0, 118.0, 93.0, 82.0, 62.0, 44.0, 30.0, 19.0, 12.0, 20.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0279998779296875, -0.027262449264526367, -0.026525020599365234, -0.0257875919342041, -0.02505016326904297, -0.024312734603881836, -0.023575305938720703, -0.02283787727355957, -0.022100448608398438, -0.021363019943237305, -0.020625591278076172, -0.01988816261291504, -0.019150733947753906, -0.018413305282592773, -0.01767587661743164, -0.016938447952270508, -0.016201019287109375, -0.015463590621948242, -0.01472616195678711, -0.013988733291625977, -0.013251304626464844, -0.012513875961303711, -0.011776447296142578, -0.011039018630981445, -0.010301589965820312, -0.00956416130065918, -0.008826732635498047, -0.008089303970336914, -0.007351875305175781, -0.0066144466400146484, -0.005877017974853516, -0.005139589309692383, -0.00440216064453125, -0.003664731979370117, -0.0029273033142089844, -0.0021898746490478516, -0.0014524459838867188, -0.0007150173187255859, 2.2411346435546875e-05, 0.0007598400115966797, 0.0014972686767578125, 0.0022346973419189453, 0.002972126007080078, 0.003709554672241211, 0.004446983337402344, 0.0051844120025634766, 0.005921840667724609, 0.006659269332885742, 0.007396697998046875, 0.008134126663208008, 0.00887155532836914, 0.009608983993530273, 0.010346412658691406, 0.011083841323852539, 0.011821269989013672, 0.012558698654174805, 0.013296127319335938, 0.01403355598449707, 0.014770984649658203, 0.015508413314819336, 0.01624584197998047, 0.0169832706451416, 0.017720699310302734, 0.018458127975463867, 0.019195556640625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 21.0, 46.0, 313.0, 2559.0, 34654.0, 831124.0, 170656.0, 8174.0, 763.0, 115.0, 22.0, 12.0, 6.0, 3.0, 7.0, 4.0, 5.0, 2.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.44482421875, -0.4303550720214844, -0.41588592529296875, -0.4014167785644531, -0.3869476318359375, -0.3724784851074219, -0.35800933837890625, -0.3435401916503906, -0.329071044921875, -0.3146018981933594, -0.30013275146484375, -0.2856636047363281, -0.2711944580078125, -0.2567253112792969, -0.24225616455078125, -0.22778701782226562, -0.21331787109375, -0.19884872436523438, -0.18437957763671875, -0.16991043090820312, -0.1554412841796875, -0.14097213745117188, -0.12650299072265625, -0.11203384399414062, -0.097564697265625, -0.08309555053710938, -0.06862640380859375, -0.054157257080078125, -0.0396881103515625, -0.025218963623046875, -0.01074981689453125, 0.003719329833984375, 0.0181884765625, 0.032657623291015625, 0.04712677001953125, 0.061595916748046875, 0.0760650634765625, 0.09053421020507812, 0.10500335693359375, 0.11947250366210938, 0.133941650390625, 0.14841079711914062, 0.16287994384765625, 0.17734909057617188, 0.1918182373046875, 0.20628738403320312, 0.22075653076171875, 0.23522567749023438, 0.24969482421875, 0.2641639709472656, 0.27863311767578125, 0.2931022644042969, 0.3075714111328125, 0.3220405578613281, 0.33650970458984375, 0.3509788513183594, 0.365447998046875, 0.3799171447753906, 0.39438629150390625, 0.4088554382324219, 0.4233245849609375, 0.4377937316894531, 0.45226287841796875, 0.4667320251464844, 0.481201171875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 5.0, 10.0, 15.0, 21.0, 23.0, 22.0, 32.0, 26.0, 28.0, 30.0, 40.0, 39.0, 41.0, 42.0, 50.0, 39.0, 38.0, 48.0, 47.0, 41.0, 41.0, 30.0, 31.0, 33.0, 32.0, 30.0, 18.0, 25.0, 19.0, 13.0, 13.0, 7.0, 8.0, 6.0, 4.0, 9.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09954833984375, -0.0966033935546875, -0.093658447265625, -0.0907135009765625, -0.0877685546875, -0.0848236083984375, -0.081878662109375, -0.0789337158203125, -0.07598876953125, -0.0730438232421875, -0.070098876953125, -0.0671539306640625, -0.064208984375, -0.0612640380859375, -0.058319091796875, -0.0553741455078125, -0.05242919921875, -0.0494842529296875, -0.046539306640625, -0.0435943603515625, -0.0406494140625, -0.0377044677734375, -0.034759521484375, -0.0318145751953125, -0.02886962890625, -0.0259246826171875, -0.022979736328125, -0.0200347900390625, -0.01708984375, -0.0141448974609375, -0.011199951171875, -0.0082550048828125, -0.00531005859375, -0.0023651123046875, 0.000579833984375, 0.0035247802734375, 0.0064697265625, 0.0094146728515625, 0.012359619140625, 0.0153045654296875, 0.01824951171875, 0.0211944580078125, 0.024139404296875, 0.0270843505859375, 0.030029296875, 0.0329742431640625, 0.035919189453125, 0.0388641357421875, 0.04180908203125, 0.0447540283203125, 0.047698974609375, 0.0506439208984375, 0.0535888671875, 0.0565338134765625, 0.059478759765625, 0.0624237060546875, 0.06536865234375, 0.0683135986328125, 0.071258544921875, 0.0742034912109375, 0.0771484375, 0.0800933837890625, 0.083038330078125, 0.0859832763671875, 0.08892822265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 18.0, 26.0, 37.0, 285.0, 10549.0, 1036675.0, 778.0, 95.0, 25.0, 11.0, 11.0, 7.0, 5.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.697265625, -3.592254638671875, -3.48724365234375, -3.382232666015625, -3.2772216796875, -3.172210693359375, -3.06719970703125, -2.962188720703125, -2.857177734375, -2.752166748046875, -2.64715576171875, -2.542144775390625, -2.4371337890625, -2.332122802734375, -2.22711181640625, -2.122100830078125, -2.01708984375, -1.912078857421875, -1.80706787109375, -1.702056884765625, -1.5970458984375, -1.492034912109375, -1.38702392578125, -1.282012939453125, -1.177001953125, -1.071990966796875, -0.96697998046875, -0.861968994140625, -0.7569580078125, -0.651947021484375, -0.54693603515625, -0.441925048828125, -0.3369140625, -0.231903076171875, -0.12689208984375, -0.021881103515625, 0.0831298828125, 0.188140869140625, 0.29315185546875, 0.398162841796875, 0.503173828125, 0.608184814453125, 0.71319580078125, 0.818206787109375, 0.9232177734375, 1.028228759765625, 1.13323974609375, 1.238250732421875, 1.34326171875, 1.448272705078125, 1.55328369140625, 1.658294677734375, 1.7633056640625, 1.868316650390625, 1.97332763671875, 2.078338623046875, 2.183349609375, 2.288360595703125, 2.39337158203125, 2.498382568359375, 2.6033935546875, 2.708404541015625, 2.81341552734375, 2.918426513671875, 3.0234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 4.0, 7.0, 15.0, 12.0, 21.0, 22.0, 23.0, 51.0, 101.0, 223.0, 194.0, 135.0, 70.0, 32.0, 20.0, 11.0, 8.0, 9.0, 7.0, 6.0, 6.0, 7.0, 4.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007166862487792969, -0.0006956830620765686, -0.0006746798753738403, -0.0006536766886711121, -0.0006326735019683838, -0.0006116703152656555, -0.0005906671285629272, -0.000569663941860199, -0.0005486607551574707, -0.0005276575684547424, -0.0005066543817520142, -0.0004856511950492859, -0.0004646480083465576, -0.00044364482164382935, -0.0004226416349411011, -0.0004016384482383728, -0.00038063526153564453, -0.00035963207483291626, -0.000338628888130188, -0.0003176257014274597, -0.00029662251472473145, -0.0002756193280220032, -0.0002546161413192749, -0.00023361295461654663, -0.00021260976791381836, -0.0001916065812110901, -0.00017060339450836182, -0.00014960020780563354, -0.00012859702110290527, -0.000107593834400177, -8.659064769744873e-05, -6.558746099472046e-05, -4.458427429199219e-05, -2.3581087589263916e-05, -2.5779008865356445e-06, 1.8425285816192627e-05, 3.94284725189209e-05, 6.043165922164917e-05, 8.143484592437744e-05, 0.00010243803262710571, 0.00012344121932983398, 0.00014444440603256226, 0.00016544759273529053, 0.0001864507794380188, 0.00020745396614074707, 0.00022845715284347534, 0.0002494603395462036, 0.0002704635262489319, 0.00029146671295166016, 0.00031246989965438843, 0.0003334730863571167, 0.00035447627305984497, 0.00037547945976257324, 0.0003964826464653015, 0.0004174858331680298, 0.00043848901987075806, 0.00045949220657348633, 0.0004804953932762146, 0.0005014985799789429, 0.0005225017666816711, 0.0005435049533843994, 0.0005645081400871277, 0.000585511326789856, 0.0006065145134925842, 0.0006275177001953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 10.0, 19.0, 17.0, 18.0, 21.0, 22.0, 30.0, 44.0, 50.0, 79.0, 115.0, 212.0, 342.0, 799.0, 2352.0, 9009.0, 83864.0, 894500.0, 46617.0, 7005.0, 1904.0, 681.0, 325.0, 163.0, 93.0, 66.0, 31.0, 31.0, 27.0, 25.0, 15.0, 13.0, 6.0, 6.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.37548828125, -0.3657112121582031, -0.35593414306640625, -0.3461570739746094, -0.3363800048828125, -0.3266029357910156, -0.31682586669921875, -0.3070487976074219, -0.297271728515625, -0.2874946594238281, -0.27771759033203125, -0.2679405212402344, -0.2581634521484375, -0.24838638305664062, -0.23860931396484375, -0.22883224487304688, -0.21905517578125, -0.20927810668945312, -0.19950103759765625, -0.18972396850585938, -0.1799468994140625, -0.17016983032226562, -0.16039276123046875, -0.15061569213867188, -0.140838623046875, -0.13106155395507812, -0.12128448486328125, -0.11150741577148438, -0.1017303466796875, -0.09195327758789062, -0.08217620849609375, -0.07239913940429688, -0.0626220703125, -0.052845001220703125, -0.04306793212890625, -0.033290863037109375, -0.0235137939453125, -0.013736724853515625, -0.00395965576171875, 0.005817413330078125, 0.015594482421875, 0.025371551513671875, 0.03514862060546875, 0.044925689697265625, 0.0547027587890625, 0.06447982788085938, 0.07425689697265625, 0.08403396606445312, 0.09381103515625, 0.10358810424804688, 0.11336517333984375, 0.12314224243164062, 0.1329193115234375, 0.14269638061523438, 0.15247344970703125, 0.16225051879882812, 0.172027587890625, 0.18180465698242188, 0.19158172607421875, 0.20135879516601562, 0.2111358642578125, 0.22091293334960938, 0.23069000244140625, 0.24046707153320312, 0.250244140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 3.0, 11.0, 10.0, 21.0, 49.0, 121.0, 240.0, 267.0, 132.0, 74.0, 36.0, 10.0, 8.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.378662109375, -0.3704719543457031, -0.36228179931640625, -0.3540916442871094, -0.3459014892578125, -0.3377113342285156, -0.32952117919921875, -0.3213310241699219, -0.313140869140625, -0.3049507141113281, -0.29676055908203125, -0.2885704040527344, -0.2803802490234375, -0.2721900939941406, -0.26399993896484375, -0.2558097839355469, -0.24761962890625, -0.23942947387695312, -0.23123931884765625, -0.22304916381835938, -0.2148590087890625, -0.20666885375976562, -0.19847869873046875, -0.19028854370117188, -0.182098388671875, -0.17390823364257812, -0.16571807861328125, -0.15752792358398438, -0.1493377685546875, -0.14114761352539062, -0.13295745849609375, -0.12476730346679688, -0.1165771484375, -0.10838699340820312, -0.10019683837890625, -0.09200668334960938, -0.0838165283203125, -0.07562637329101562, -0.06743621826171875, -0.059246063232421875, -0.051055908203125, -0.042865753173828125, -0.03467559814453125, -0.026485443115234375, -0.0182952880859375, -0.010105133056640625, -0.00191497802734375, 0.006275177001953125, 0.01446533203125, 0.022655487060546875, 0.03084564208984375, 0.039035797119140625, 0.0472259521484375, 0.055416107177734375, 0.06360626220703125, 0.07179641723632812, 0.079986572265625, 0.08817672729492188, 0.09636688232421875, 0.10455703735351562, 0.1127471923828125, 0.12093734741210938, 0.12912750244140625, 0.13731765747070312, 0.1455078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 9.0, 7.0, 9.0, 30.0, 46.0, 71.0, 157.0, 282.0, 175.0, 79.0, 57.0, 29.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5559524297714233, -1.50979483127594, -1.463637351989746, -1.4174797534942627, -1.3713221549987793, -1.325164556503296, -1.2790069580078125, -1.2328494787216187, -1.1866918802261353, -1.1405342817306519, -1.094376802444458, -1.0482192039489746, -1.0020616054534912, -0.9559040069580078, -0.9097464680671692, -0.8635889291763306, -0.8174313306808472, -0.7712737321853638, -0.7251161932945251, -0.6789586544036865, -0.6328010559082031, -0.5866434574127197, -0.5404859185218811, -0.4943283498287201, -0.4481707811355591, -0.40201321244239807, -0.35585564374923706, -0.30969807505607605, -0.26354050636291504, -0.21738293766975403, -0.17122536897659302, -0.125067800283432, -0.078910231590271, -0.032752662897109985, 0.013404905796051025, 0.059562474489212036, 0.10572004318237305, 0.15187761187553406, 0.19803518056869507, 0.24419274926185608, 0.2903503179550171, 0.3365078866481781, 0.3826654553413391, 0.4288230240345001, 0.47498059272766113, 0.5211381912231445, 0.5672957301139832, 0.6134532690048218, 0.6596108675003052, 0.7057684659957886, 0.7519260048866272, 0.7980835437774658, 0.8442411422729492, 0.8903987407684326, 0.9365562796592712, 0.9827138185501099, 1.0288714170455933, 1.0750290155410767, 1.1211864948272705, 1.167344093322754, 1.2135016918182373, 1.2596592903137207, 1.305816888809204, 1.351974368095398, 1.3981319665908813]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 9.0, 7.0, 12.0, 10.0, 15.0, 21.0, 22.0, 36.0, 37.0, 55.0, 72.0, 79.0, 81.0, 69.0, 70.0, 63.0, 66.0, 48.0, 41.0, 44.0, 28.0, 29.0, 20.0, 16.0, 8.0, 5.0, 7.0, 5.0, 3.0, 2.0, 5.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1837421655654907, -1.1493579149246216, -1.114973783493042, -1.0805895328521729, -1.0462052822113037, -1.0118211507797241, -0.977436900138855, -0.9430527091026306, -0.9086685180664062, -0.8742843270301819, -0.8399001359939575, -0.8055158853530884, -0.771131694316864, -0.7367475032806396, -0.7023632526397705, -0.6679790616035461, -0.6335948705673218, -0.5992106795310974, -0.564826488494873, -0.5304422378540039, -0.49605804681777954, -0.4616738557815552, -0.4272896349430084, -0.39290541410446167, -0.3585212230682373, -0.32413703203201294, -0.2897528111934662, -0.25536859035491943, -0.22098439931869507, -0.1866001933813095, -0.15221598744392395, -0.11783178150653839, -0.08344769477844238, -0.049063488841056824, -0.014679282903671265, 0.019704923033714294, 0.054089128971099854, 0.08847333490848541, 0.12285754084587097, 0.15724174678325653, 0.1916259527206421, 0.22601015865802765, 0.2603943645954132, 0.29477858543395996, 0.3291627764701843, 0.3635469675064087, 0.39793118834495544, 0.4323154091835022, 0.46669960021972656, 0.5010837912559509, 0.5354679822921753, 0.5698522329330444, 0.6042364239692688, 0.6386206150054932, 0.6730048656463623, 0.7073890566825867, 0.741773247718811, 0.7761574387550354, 0.8105416297912598, 0.8449258804321289, 0.8793100714683533, 0.9136942625045776, 0.9480785131454468, 0.9824627041816711, 1.0168468952178955]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 5.0, 22.0, 12.0, 39.0, 30.0, 58.0, 86.0, 161.0, 259.0, 432.0, 785.0, 1573.0, 3886.0, 11689.0, 62749.0, 3950422.0, 136279.0, 16552.0, 4895.0, 1983.0, 948.0, 503.0, 308.0, 192.0, 140.0, 72.0, 50.0, 39.0, 26.0, 23.0, 10.0, 5.0, 11.0, 10.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.673828125, -0.6549224853515625, -0.636016845703125, -0.6171112060546875, -0.59820556640625, -0.5792999267578125, -0.560394287109375, -0.5414886474609375, -0.5225830078125, -0.5036773681640625, -0.484771728515625, -0.4658660888671875, -0.44696044921875, -0.4280548095703125, -0.409149169921875, -0.3902435302734375, -0.371337890625, -0.3524322509765625, -0.333526611328125, -0.3146209716796875, -0.29571533203125, -0.2768096923828125, -0.257904052734375, -0.2389984130859375, -0.2200927734375, -0.2011871337890625, -0.182281494140625, -0.1633758544921875, -0.14447021484375, -0.1255645751953125, -0.106658935546875, -0.0877532958984375, -0.06884765625, -0.0499420166015625, -0.031036376953125, -0.0121307373046875, 0.00677490234375, 0.0256805419921875, 0.044586181640625, 0.0634918212890625, 0.0823974609375, 0.1013031005859375, 0.120208740234375, 0.1391143798828125, 0.15802001953125, 0.1769256591796875, 0.195831298828125, 0.2147369384765625, 0.233642578125, 0.2525482177734375, 0.271453857421875, 0.2903594970703125, 0.30926513671875, 0.3281707763671875, 0.347076416015625, 0.3659820556640625, 0.3848876953125, 0.4037933349609375, 0.422698974609375, 0.4416046142578125, 0.46051025390625, 0.4794158935546875, 0.498321533203125, 0.5172271728515625, 0.5361328125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 3.0, 7.0, 19.0, 17.0, 30.0, 35.0, 46.0, 62.0, 78.0, 77.0, 106.0, 108.0, 99.0, 65.0, 55.0, 48.0, 33.0, 23.0, 15.0, 10.0, 13.0, 4.0, 2.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020660400390625, -0.01999044418334961, -0.01932048797607422, -0.018650531768798828, -0.017980575561523438, -0.017310619354248047, -0.016640663146972656, -0.015970706939697266, -0.015300750732421875, -0.014630794525146484, -0.013960838317871094, -0.013290882110595703, -0.012620925903320312, -0.011950969696044922, -0.011281013488769531, -0.01061105728149414, -0.00994110107421875, -0.00927114486694336, -0.008601188659667969, -0.007931232452392578, -0.0072612762451171875, -0.006591320037841797, -0.005921363830566406, -0.005251407623291016, -0.004581451416015625, -0.003911495208740234, -0.0032415390014648438, -0.002571582794189453, -0.0019016265869140625, -0.0012316703796386719, -0.0005617141723632812, 0.00010824203491210938, 0.0007781982421875, 0.0014481544494628906, 0.0021181106567382812, 0.002788066864013672, 0.0034580230712890625, 0.004127979278564453, 0.004797935485839844, 0.005467891693115234, 0.006137847900390625, 0.006807804107666016, 0.007477760314941406, 0.008147716522216797, 0.008817672729492188, 0.009487628936767578, 0.010157585144042969, 0.01082754135131836, 0.01149749755859375, 0.01216745376586914, 0.012837409973144531, 0.013507366180419922, 0.014177322387695312, 0.014847278594970703, 0.015517234802246094, 0.016187191009521484, 0.016857147216796875, 0.017527103424072266, 0.018197059631347656, 0.018867015838623047, 0.019536972045898438, 0.020206928253173828, 0.02087688446044922, 0.02154684066772461, 0.022216796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 11.0, 8.0, 38.0, 47.0, 92.0, 546.0, 17184.0, 4153678.0, 21877.0, 611.0, 82.0, 39.0, 14.0, 7.0, 17.0, 10.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.111328125, -2.0669021606445312, -2.0224761962890625, -1.9780502319335938, -1.933624267578125, -1.8891983032226562, -1.8447723388671875, -1.8003463745117188, -1.75592041015625, -1.7114944458007812, -1.6670684814453125, -1.6226425170898438, -1.578216552734375, -1.5337905883789062, -1.4893646240234375, -1.4449386596679688, -1.4005126953125, -1.3560867309570312, -1.3116607666015625, -1.2672348022460938, -1.222808837890625, -1.1783828735351562, -1.1339569091796875, -1.0895309448242188, -1.04510498046875, -1.0006790161132812, -0.9562530517578125, -0.9118270874023438, -0.867401123046875, -0.8229751586914062, -0.7785491943359375, -0.7341232299804688, -0.689697265625, -0.6452713012695312, -0.6008453369140625, -0.5564193725585938, -0.511993408203125, -0.46756744384765625, -0.4231414794921875, -0.37871551513671875, -0.33428955078125, -0.28986358642578125, -0.2454376220703125, -0.20101165771484375, -0.156585693359375, -0.11215972900390625, -0.0677337646484375, -0.02330780029296875, 0.0211181640625, 0.06554412841796875, 0.1099700927734375, 0.15439605712890625, 0.198822021484375, 0.24324798583984375, 0.2876739501953125, 0.33209991455078125, 0.37652587890625, 0.42095184326171875, 0.4653778076171875, 0.5098037719726562, 0.554229736328125, 0.5986557006835938, 0.6430816650390625, 0.6875076293945312, 0.73193359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 6.0, 10.0, 8.0, 13.0, 12.0, 19.0, 19.0, 44.0, 66.0, 151.0, 174.0, 430.0, 1430.0, 861.0, 296.0, 147.0, 95.0, 64.0, 43.0, 31.0, 25.0, 18.0, 19.0, 16.0, 8.0, 6.0, 7.0, 12.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.04141378402709961, -0.04007244110107422, -0.03873109817504883, -0.03738975524902344, -0.03604841232299805, -0.034707069396972656, -0.033365726470947266, -0.032024383544921875, -0.030683040618896484, -0.029341697692871094, -0.028000354766845703, -0.026659011840820312, -0.025317668914794922, -0.02397632598876953, -0.02263498306274414, -0.02129364013671875, -0.01995229721069336, -0.01861095428466797, -0.017269611358642578, -0.015928268432617188, -0.014586925506591797, -0.013245582580566406, -0.011904239654541016, -0.010562896728515625, -0.009221553802490234, -0.007880210876464844, -0.006538867950439453, -0.0051975250244140625, -0.003856182098388672, -0.0025148391723632812, -0.0011734962463378906, 0.0001678466796875, 0.0015091896057128906, 0.0028505325317382812, 0.004191875457763672, 0.0055332183837890625, 0.006874561309814453, 0.008215904235839844, 0.009557247161865234, 0.010898590087890625, 0.012239933013916016, 0.013581275939941406, 0.014922618865966797, 0.016263961791992188, 0.017605304718017578, 0.01894664764404297, 0.02028799057006836, 0.02162933349609375, 0.02297067642211914, 0.02431201934814453, 0.025653362274169922, 0.026994705200195312, 0.028336048126220703, 0.029677391052246094, 0.031018733978271484, 0.032360076904296875, 0.033701419830322266, 0.035042762756347656, 0.03638410568237305, 0.03772544860839844, 0.03906679153442383, 0.04040813446044922, 0.04174947738647461, 0.0430908203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 13.0, 409.0, 569.0, 16.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.047494888305664, -4.958988666534424, -4.870481967926025, -4.781975746154785, -4.693469047546387, -4.6049628257751465, -4.516456127166748, -4.427949905395508, -4.339443206787109, -4.250936985015869, -4.162430286407471, -4.0739240646362305, -3.985417366027832, -3.896911144256592, -3.8084046840667725, -3.719898223876953, -3.631392002105713, -3.5428855419158936, -3.454379081726074, -3.365872621536255, -3.2773661613464355, -3.1888599395751953, -3.100353479385376, -3.0118470191955566, -2.9233405590057373, -2.834834098815918, -2.7463276386260986, -2.6578211784362793, -2.569314956665039, -2.4808084964752197, -2.3923020362854004, -2.303795576095581, -2.2152891159057617, -2.1267826557159424, -2.038276195526123, -1.9497698545455933, -1.861263394355774, -1.7727569341659546, -1.6842505931854248, -1.5957441329956055, -1.5072376728057861, -1.4187312126159668, -1.3302247524261475, -1.2417184114456177, -1.1532119512557983, -1.064705491065979, -0.9761990904808044, -0.8876926898956299, -0.7991862893104553, -0.7106798887252808, -0.6221734285354614, -0.5336669683456421, -0.44516056776046753, -0.3566541373729706, -0.26814770698547363, -0.17964130640029907, -0.09113484621047974, -0.002628415822982788, 0.08587801456451416, 0.1743844449520111, 0.26289087533950806, 0.351397305727005, 0.43990373611450195, 0.5284101366996765, 0.6169165968894958]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 9.0, 21.0, 23.0, 39.0, 51.0, 83.0, 102.0, 133.0, 126.0, 130.0, 101.0, 73.0, 48.0, 32.0, 13.0, 5.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8497622609138489, -0.8315975069999695, -0.8134327530860901, -0.7952679395675659, -0.7771031856536865, -0.7589384317398071, -0.7407736778259277, -0.7226089239120483, -0.704444169998169, -0.6862794160842896, -0.6681146621704102, -0.649949848651886, -0.6317850947380066, -0.6136203408241272, -0.5954555869102478, -0.5772908329963684, -0.5591260194778442, -0.5409612655639648, -0.5227965116500854, -0.5046316981315613, -0.4864669442176819, -0.4683021903038025, -0.4501374363899231, -0.4319726824760437, -0.4138078987598419, -0.3956431448459625, -0.37747836112976074, -0.35931360721588135, -0.34114885330200195, -0.32298406958580017, -0.3048193156719208, -0.286654531955719, -0.2684897780418396, -0.2503250241279602, -0.23216024041175842, -0.21399548649787903, -0.19583071768283844, -0.17766594886779785, -0.15950119495391846, -0.14133642613887787, -0.12317165732383728, -0.10500688850879669, -0.0868421271443367, -0.06867736577987671, -0.05051259696483612, -0.03234782814979553, -0.01418306678533554, 0.003981694579124451, 0.02214646339416504, 0.04031122848391533, 0.05847599357366562, 0.07664075493812561, 0.0948055237531662, 0.11297029256820679, 0.13113504648208618, 0.14929981529712677, 0.16746458411216736, 0.18562935292720795, 0.20379412174224854, 0.22195887565612793, 0.24012364447116852, 0.2582884132862091, 0.2764531672000885, 0.2946179509162903, 0.3127827048301697]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 16.0, 8.0, 15.0, 21.0, 25.0, 29.0, 34.0, 44.0, 44.0, 44.0, 57.0, 455.0, 56357.0, 988470.0, 2390.0, 138.0, 52.0, 62.0, 59.0, 39.0, 36.0, 27.0, 25.0, 13.0, 16.0, 21.0, 11.0, 10.0, 6.0, 7.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9928436279296875, -0.956390380859375, -0.9199371337890625, -0.88348388671875, -0.8470306396484375, -0.810577392578125, -0.7741241455078125, -0.7376708984375, -0.7012176513671875, -0.664764404296875, -0.6283111572265625, -0.59185791015625, -0.5554046630859375, -0.518951416015625, -0.4824981689453125, -0.446044921875, -0.4095916748046875, -0.373138427734375, -0.3366851806640625, -0.30023193359375, -0.2637786865234375, -0.227325439453125, -0.1908721923828125, -0.1544189453125, -0.1179656982421875, -0.081512451171875, -0.0450592041015625, -0.00860595703125, 0.0278472900390625, 0.064300537109375, 0.1007537841796875, 0.13720703125, 0.1736602783203125, 0.210113525390625, 0.2465667724609375, 0.28302001953125, 0.3194732666015625, 0.355926513671875, 0.3923797607421875, 0.4288330078125, 0.4652862548828125, 0.501739501953125, 0.5381927490234375, 0.57464599609375, 0.6110992431640625, 0.647552490234375, 0.6840057373046875, 0.720458984375, 0.7569122314453125, 0.793365478515625, 0.8298187255859375, 0.86627197265625, 0.9027252197265625, 0.939178466796875, 0.9756317138671875, 1.0120849609375, 1.0485382080078125, 1.084991455078125, 1.1214447021484375, 1.15789794921875, 1.1943511962890625, 1.230804443359375, 1.2672576904296875, 1.3037109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 21.0, 114.0, 304.0, 391.0, 154.0, 27.0, 3.0, 3.0], "bins": [-0.228271484375, -0.22440552711486816, -0.22053956985473633, -0.2166736125946045, -0.21280765533447266, -0.20894169807434082, -0.20507574081420898, -0.20120978355407715, -0.1973438262939453, -0.19347786903381348, -0.18961191177368164, -0.1857459545135498, -0.18187999725341797, -0.17801403999328613, -0.1741480827331543, -0.17028212547302246, -0.16641616821289062, -0.1625502109527588, -0.15868425369262695, -0.15481829643249512, -0.15095233917236328, -0.14708638191223145, -0.1432204246520996, -0.13935446739196777, -0.13548851013183594, -0.1316225528717041, -0.12775659561157227, -0.12389063835144043, -0.1200246810913086, -0.11615872383117676, -0.11229276657104492, -0.10842680931091309, -0.10456085205078125, -0.10069489479064941, -0.09682893753051758, -0.09296298027038574, -0.0890970230102539, -0.08523106575012207, -0.08136510848999023, -0.0774991512298584, -0.07363319396972656, -0.06976723670959473, -0.06590127944946289, -0.062035322189331055, -0.05816936492919922, -0.05430340766906738, -0.05043745040893555, -0.04657149314880371, -0.042705535888671875, -0.03883957862854004, -0.0349736213684082, -0.031107664108276367, -0.02724170684814453, -0.023375749588012695, -0.01950979232788086, -0.015643835067749023, -0.011777877807617188, -0.007911920547485352, -0.004045963287353516, -0.0001800060272216797, 0.0036859512329101562, 0.007551908493041992, 0.011417865753173828, 0.015283823013305664, 0.0191497802734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 9.0, 8.0, 14.0, 11.0, 13.0, 13.0, 22.0, 32.0, 61.0, 96.0, 171.0, 315.0, 596.0, 1327.0, 2573.0, 5470.0, 12722.0, 31172.0, 90488.0, 327859.0, 397600.0, 113081.0, 37511.0, 14793.0, 6439.0, 3004.0, 1470.0, 725.0, 397.0, 211.0, 149.0, 74.0, 42.0, 29.0, 24.0, 7.0, 10.0, 7.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.15971946716308594, -0.15403366088867188, -0.1483478546142578, -0.14266204833984375, -0.1369762420654297, -0.13129043579101562, -0.12560462951660156, -0.1199188232421875, -0.11423301696777344, -0.10854721069335938, -0.10286140441894531, -0.09717559814453125, -0.09148979187011719, -0.08580398559570312, -0.08011817932128906, -0.074432373046875, -0.06874656677246094, -0.06306076049804688, -0.05737495422363281, -0.05168914794921875, -0.04600334167480469, -0.040317535400390625, -0.03463172912597656, -0.0289459228515625, -0.023260116577148438, -0.017574310302734375, -0.011888504028320312, -0.00620269775390625, -0.0005168914794921875, 0.005168914794921875, 0.010854721069335938, 0.01654052734375, 0.022226333618164062, 0.027912139892578125, 0.03359794616699219, 0.03928375244140625, 0.04496955871582031, 0.050655364990234375, 0.05634117126464844, 0.0620269775390625, 0.06771278381347656, 0.07339859008789062, 0.07908439636230469, 0.08477020263671875, 0.09045600891113281, 0.09614181518554688, 0.10182762145996094, 0.107513427734375, 0.11319923400878906, 0.11888504028320312, 0.12457084655761719, 0.13025665283203125, 0.1359424591064453, 0.14162826538085938, 0.14731407165527344, 0.1529998779296875, 0.15868568420410156, 0.16437149047851562, 0.1700572967529297, 0.17574310302734375, 0.1814289093017578, 0.18711471557617188, 0.19280052185058594, 0.198486328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 9.0, 4.0, 6.0, 5.0, 1.0, 11.0, 6.0, 10.0, 14.0, 19.0, 19.0, 21.0, 28.0, 28.0, 31.0, 37.0, 37.0, 35.0, 55.0, 42.0, 55.0, 51.0, 64.0, 57.0, 49.0, 42.0, 32.0, 34.0, 35.0, 30.0, 26.0, 26.0, 13.0, 13.0, 10.0, 13.0, 11.0, 5.0, 6.0, 5.0, 3.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.148193359375, -0.1429595947265625, -0.137725830078125, -0.1324920654296875, -0.12725830078125, -0.1220245361328125, -0.116790771484375, -0.1115570068359375, -0.1063232421875, -0.1010894775390625, -0.095855712890625, -0.0906219482421875, -0.08538818359375, -0.0801544189453125, -0.074920654296875, -0.0696868896484375, -0.064453125, -0.0592193603515625, -0.053985595703125, -0.0487518310546875, -0.04351806640625, -0.0382843017578125, -0.033050537109375, -0.0278167724609375, -0.0225830078125, -0.0173492431640625, -0.012115478515625, -0.0068817138671875, -0.00164794921875, 0.0035858154296875, 0.008819580078125, 0.0140533447265625, 0.019287109375, 0.0245208740234375, 0.029754638671875, 0.0349884033203125, 0.04022216796875, 0.0454559326171875, 0.050689697265625, 0.0559234619140625, 0.0611572265625, 0.0663909912109375, 0.071624755859375, 0.0768585205078125, 0.08209228515625, 0.0873260498046875, 0.092559814453125, 0.0977935791015625, 0.10302734375, 0.1082611083984375, 0.113494873046875, 0.1187286376953125, 0.12396240234375, 0.1291961669921875, 0.134429931640625, 0.1396636962890625, 0.1448974609375, 0.1501312255859375, 0.155364990234375, 0.1605987548828125, 0.16583251953125, 0.1710662841796875, 0.176300048828125, 0.1815338134765625, 0.186767578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 1.0, 3.0, 6.0, 4.0, 2.0, 7.0, 18.0, 17.0, 18.0, 17.0, 32.0, 58.0, 79.0, 170.0, 420.0, 1455.0, 7675.0, 126635.0, 865655.0, 40374.0, 4309.0, 942.0, 296.0, 132.0, 74.0, 41.0, 18.0, 22.0, 15.0, 8.0, 8.0, 6.0, 11.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3232421875, -0.31183624267578125, -0.3004302978515625, -0.28902435302734375, -0.277618408203125, -0.26621246337890625, -0.2548065185546875, -0.24340057373046875, -0.23199462890625, -0.22058868408203125, -0.2091827392578125, -0.19777679443359375, -0.186370849609375, -0.17496490478515625, -0.1635589599609375, -0.15215301513671875, -0.1407470703125, -0.12934112548828125, -0.1179351806640625, -0.10652923583984375, -0.095123291015625, -0.08371734619140625, -0.0723114013671875, -0.06090545654296875, -0.04949951171875, -0.03809356689453125, -0.0266876220703125, -0.01528167724609375, -0.003875732421875, 0.00753021240234375, 0.0189361572265625, 0.03034210205078125, 0.041748046875, 0.05315399169921875, 0.0645599365234375, 0.07596588134765625, 0.087371826171875, 0.09877777099609375, 0.1101837158203125, 0.12158966064453125, 0.13299560546875, 0.14440155029296875, 0.1558074951171875, 0.16721343994140625, 0.178619384765625, 0.19002532958984375, 0.2014312744140625, 0.21283721923828125, 0.2242431640625, 0.23564910888671875, 0.2470550537109375, 0.25846099853515625, 0.269866943359375, 0.28127288818359375, 0.2926788330078125, 0.30408477783203125, 0.31549072265625, 0.32689666748046875, 0.3383026123046875, 0.34970855712890625, 0.361114501953125, 0.37252044677734375, 0.3839263916015625, 0.39533233642578125, 0.40673828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 12.0, 9.0, 19.0, 16.0, 39.0, 47.0, 50.0, 74.0, 95.0, 140.0, 94.0, 87.0, 63.0, 46.0, 45.0, 32.0, 23.0, 16.0, 21.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006394386291503906, -0.0006220713257789612, -0.0006047040224075317, -0.0005873367190361023, -0.0005699694156646729, -0.0005526021122932434, -0.000535234808921814, -0.0005178675055503845, -0.0005005002021789551, -0.00048313289880752563, -0.0004657655954360962, -0.00044839829206466675, -0.0004310309886932373, -0.00041366368532180786, -0.0003962963819503784, -0.000378929078578949, -0.00036156177520751953, -0.0003441944718360901, -0.00032682716846466064, -0.0003094598650932312, -0.00029209256172180176, -0.0002747252583503723, -0.00025735795497894287, -0.00023999065160751343, -0.00022262334823608398, -0.00020525604486465454, -0.0001878887414932251, -0.00017052143812179565, -0.0001531541347503662, -0.00013578683137893677, -0.00011841952800750732, -0.00010105222463607788, -8.368492126464844e-05, -6.6317617893219e-05, -4.895031452178955e-05, -3.158301115036011e-05, -1.4215707778930664e-05, 3.1515955924987793e-06, 2.0518898963928223e-05, 3.7886202335357666e-05, 5.525350570678711e-05, 7.262080907821655e-05, 8.9988112449646e-05, 0.00010735541582107544, 0.00012472271919250488, 0.00014209002256393433, 0.00015945732593536377, 0.0001768246293067932, 0.00019419193267822266, 0.0002115592360496521, 0.00022892653942108154, 0.000246293842792511, 0.00026366114616394043, 0.0002810284495353699, 0.0002983957529067993, 0.00031576305627822876, 0.0003331303596496582, 0.00035049766302108765, 0.0003678649663925171, 0.00038523226976394653, 0.000402599573135376, 0.0004199668765068054, 0.00043733417987823486, 0.0004547014832496643, 0.00047206878662109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 7.0, 2.0, 12.0, 22.0, 31.0, 84.0, 364.0, 1782.0, 16783.0, 865695.0, 156484.0, 6028.0, 853.0, 232.0, 75.0, 34.0, 19.0, 9.0, 5.0, 6.0, 4.0, 2.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3720703125, -0.355743408203125, -0.33941650390625, -0.323089599609375, -0.3067626953125, -0.290435791015625, -0.27410888671875, -0.257781982421875, -0.241455078125, -0.225128173828125, -0.20880126953125, -0.192474365234375, -0.1761474609375, -0.159820556640625, -0.14349365234375, -0.127166748046875, -0.11083984375, -0.094512939453125, -0.07818603515625, -0.061859130859375, -0.0455322265625, -0.029205322265625, -0.01287841796875, 0.003448486328125, 0.019775390625, 0.036102294921875, 0.05242919921875, 0.068756103515625, 0.0850830078125, 0.101409912109375, 0.11773681640625, 0.134063720703125, 0.150390625, 0.166717529296875, 0.18304443359375, 0.199371337890625, 0.2156982421875, 0.232025146484375, 0.24835205078125, 0.264678955078125, 0.281005859375, 0.297332763671875, 0.31365966796875, 0.329986572265625, 0.3463134765625, 0.362640380859375, 0.37896728515625, 0.395294189453125, 0.41162109375, 0.427947998046875, 0.44427490234375, 0.460601806640625, 0.4769287109375, 0.493255615234375, 0.50958251953125, 0.525909423828125, 0.542236328125, 0.558563232421875, 0.57489013671875, 0.591217041015625, 0.6075439453125, 0.623870849609375, 0.64019775390625, 0.656524658203125, 0.6728515625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 15.0, 10.0, 26.0, 52.0, 114.0, 228.0, 245.0, 134.0, 58.0, 34.0, 15.0, 7.0, 6.0, 6.0, 10.0, 4.0, 3.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16162109375, -0.15393829345703125, -0.1462554931640625, -0.13857269287109375, -0.130889892578125, -0.12320709228515625, -0.1155242919921875, -0.10784149169921875, -0.10015869140625, -0.09247589111328125, -0.0847930908203125, -0.07711029052734375, -0.069427490234375, -0.06174468994140625, -0.0540618896484375, -0.04637908935546875, -0.0386962890625, -0.03101348876953125, -0.0233306884765625, -0.01564788818359375, -0.007965087890625, -0.00028228759765625, 0.0074005126953125, 0.01508331298828125, 0.02276611328125, 0.03044891357421875, 0.0381317138671875, 0.04581451416015625, 0.053497314453125, 0.06118011474609375, 0.0688629150390625, 0.07654571533203125, 0.084228515625, 0.09191131591796875, 0.0995941162109375, 0.10727691650390625, 0.114959716796875, 0.12264251708984375, 0.1303253173828125, 0.13800811767578125, 0.14569091796875, 0.15337371826171875, 0.1610565185546875, 0.16873931884765625, 0.176422119140625, 0.18410491943359375, 0.1917877197265625, 0.19947052001953125, 0.2071533203125, 0.21483612060546875, 0.2225189208984375, 0.23020172119140625, 0.237884521484375, 0.24556732177734375, 0.2532501220703125, 0.26093292236328125, 0.26861572265625, 0.27629852294921875, 0.2839813232421875, 0.29166412353515625, 0.299346923828125, 0.30702972412109375, 0.3147125244140625, 0.32239532470703125, 0.330078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 716.0, 285.0, 11.0, 2.0], "bins": [-35.85194778442383, -35.262821197509766, -34.67369079589844, -34.084564208984375, -33.49543380737305, -32.906307220458984, -32.317176818847656, -31.728050231933594, -31.1389217376709, -30.549793243408203, -29.960664749145508, -29.371536254882812, -28.782407760620117, -28.193279266357422, -27.60415267944336, -27.015024185180664, -26.42589569091797, -25.836767196655273, -25.247638702392578, -24.658510208129883, -24.069381713867188, -23.480255126953125, -22.891124725341797, -22.301998138427734, -21.712867736816406, -21.12373924255371, -20.534610748291016, -19.94548225402832, -19.356353759765625, -18.767227172851562, -18.178096771240234, -17.588970184326172, -16.999839782714844, -16.41071128845215, -15.821582794189453, -15.232454299926758, -14.643326759338379, -14.054198265075684, -13.465069770812988, -12.87594223022461, -12.286813735961914, -11.697685241699219, -11.108556747436523, -10.519428253173828, -9.93030071258545, -9.341172218322754, -8.752043724060059, -8.16291618347168, -7.573787689208984, -6.984659194946289, -6.395531177520752, -5.806402683258057, -5.2172746658325195, -4.628146171569824, -4.039017677307129, -3.449889659881592, -2.8607611656188965, -2.2716329097747803, -1.6825045347213745, -1.0933761596679688, -0.5042479038238525, 0.08488035202026367, 0.674008846282959, 1.263136863708496, 1.8522653579711914]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 18.0, 21.0, 37.0, 51.0, 80.0, 84.0, 93.0, 92.0, 106.0, 95.0, 88.0, 73.0, 55.0, 42.0, 19.0, 20.0, 6.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1014342308044434, -3.031130075454712, -2.9608261585235596, -2.890522003173828, -2.8202178478240967, -2.7499136924743652, -2.679609775543213, -2.6093056201934814, -2.53900146484375, -2.4686973094940186, -2.398393392562866, -2.3280892372131348, -2.2577850818634033, -2.187480926513672, -2.1171770095825195, -2.046872854232788, -1.9765689373016357, -1.9062649011611938, -1.8359607458114624, -1.7656567096710205, -1.695352554321289, -1.6250485181808472, -1.5547444820404053, -1.4844403266906738, -1.414136290550232, -1.34383225440979, -1.2735280990600586, -1.2032240629196167, -1.1329200267791748, -1.0626158714294434, -0.9923118352890015, -0.9220077395439148, -0.851703405380249, -0.7813993096351624, -0.7110952138900757, -0.6407911777496338, -0.5704870820045471, -0.5001829862594604, -0.42987892031669617, -0.3595748543739319, -0.2892707586288452, -0.21896667778491974, -0.14866259694099426, -0.07835851609706879, -0.00805443525314331, 0.06224966049194336, 0.13255372643470764, 0.20285779237747192, 0.2731618881225586, 0.34346598386764526, 0.41377004981040955, 0.48407411575317383, 0.5543782114982605, 0.6246823072433472, 0.6949863433837891, 0.7652904391288757, 0.8355945348739624, 0.9058986306190491, 0.9762027263641357, 1.0465067625045776, 1.1168107986450195, 1.187114953994751, 1.2574189901351929, 1.3277230262756348, 1.3980271816253662]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 12.0, 7.0, 22.0, 43.0, 84.0, 131.0, 242.0, 500.0, 281616.0, 3911146.0, 420.0, 54.0, 10.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -9.029586791992188, -8.856048583984375, -8.682510375976562, -8.50897216796875, -8.335433959960938, -8.161895751953125, -7.9883575439453125, -7.8148193359375, -7.6412811279296875, -7.467742919921875, -7.2942047119140625, -7.12066650390625, -6.9471282958984375, -6.773590087890625, -6.6000518798828125, -6.426513671875, -6.2529754638671875, -6.079437255859375, -5.9058990478515625, -5.73236083984375, -5.5588226318359375, -5.385284423828125, -5.2117462158203125, -5.0382080078125, -4.8646697998046875, -4.691131591796875, -4.5175933837890625, -4.34405517578125, -4.1705169677734375, -3.996978759765625, -3.8234405517578125, -3.64990234375, -3.4763641357421875, -3.302825927734375, -3.1292877197265625, -2.95574951171875, -2.7822113037109375, -2.608673095703125, -2.4351348876953125, -2.2615966796875, -2.0880584716796875, -1.914520263671875, -1.7409820556640625, -1.56744384765625, -1.3939056396484375, -1.220367431640625, -1.0468292236328125, -0.873291015625, -0.6997528076171875, -0.526214599609375, -0.3526763916015625, -0.17913818359375, -0.0055999755859375, 0.167938232421875, 0.3414764404296875, 0.5150146484375, 0.6885528564453125, 0.862091064453125, 1.0356292724609375, 1.20916748046875, 1.3827056884765625, 1.556243896484375, 1.7297821044921875, 1.9033203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 22.0, 109.0, 253.0, 358.0, 181.0, 61.0, 14.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258544921875, -0.2536892890930176, -0.24883365631103516, -0.24397802352905273, -0.2391223907470703, -0.2342667579650879, -0.22941112518310547, -0.22455549240112305, -0.21969985961914062, -0.2148442268371582, -0.20998859405517578, -0.20513296127319336, -0.20027732849121094, -0.19542169570922852, -0.1905660629272461, -0.18571043014526367, -0.18085479736328125, -0.17599916458129883, -0.1711435317993164, -0.16628789901733398, -0.16143226623535156, -0.15657663345336914, -0.15172100067138672, -0.1468653678894043, -0.14200973510742188, -0.13715410232543945, -0.13229846954345703, -0.1274428367614746, -0.12258720397949219, -0.11773157119750977, -0.11287593841552734, -0.10802030563354492, -0.1031646728515625, -0.09830904006958008, -0.09345340728759766, -0.08859777450561523, -0.08374214172363281, -0.07888650894165039, -0.07403087615966797, -0.06917524337768555, -0.06431961059570312, -0.0594639778137207, -0.05460834503173828, -0.04975271224975586, -0.04489707946777344, -0.040041446685791016, -0.035185813903808594, -0.030330181121826172, -0.02547454833984375, -0.020618915557861328, -0.015763282775878906, -0.010907649993896484, -0.0060520172119140625, -0.0011963844299316406, 0.0036592483520507812, 0.008514881134033203, 0.013370513916015625, 0.018226146697998047, 0.02308177947998047, 0.02793741226196289, 0.03279304504394531, 0.037648677825927734, 0.042504310607910156, 0.04735994338989258, 0.052215576171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 11.0, 23.0, 48.0, 93.0, 128.0, 163.0, 245.0, 325.0, 4059024.0, 133454.0, 365.0, 184.0, 84.0, 63.0, 33.0, 26.0, 7.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.6119384765625, -8.411376953125, -8.2108154296875, -8.01025390625, -7.8096923828125, -7.609130859375, -7.4085693359375, -7.2080078125, -7.0074462890625, -6.806884765625, -6.6063232421875, -6.40576171875, -6.2052001953125, -6.004638671875, -5.8040771484375, -5.603515625, -5.4029541015625, -5.202392578125, -5.0018310546875, -4.80126953125, -4.6007080078125, -4.400146484375, -4.1995849609375, -3.9990234375, -3.7984619140625, -3.597900390625, -3.3973388671875, -3.19677734375, -2.9962158203125, -2.795654296875, -2.5950927734375, -2.39453125, -2.1939697265625, -1.993408203125, -1.7928466796875, -1.59228515625, -1.3917236328125, -1.191162109375, -0.9906005859375, -0.7900390625, -0.5894775390625, -0.388916015625, -0.1883544921875, 0.01220703125, 0.2127685546875, 0.413330078125, 0.6138916015625, 0.814453125, 1.0150146484375, 1.215576171875, 1.4161376953125, 1.61669921875, 1.8172607421875, 2.017822265625, 2.2183837890625, 2.4189453125, 2.6195068359375, 2.820068359375, 3.0206298828125, 3.22119140625, 3.4217529296875, 3.622314453125, 3.8228759765625, 4.0234375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 13.0, 834.0, 3081.0, 118.0, 27.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.2394065856933594, -1.2151412963867188, -1.1908760070800781, -1.1666107177734375, -1.1423454284667969, -1.1180801391601562, -1.0938148498535156, -1.069549560546875, -1.0452842712402344, -1.0210189819335938, -0.9967536926269531, -0.9724884033203125, -0.9482231140136719, -0.9239578247070312, -0.8996925354003906, -0.87542724609375, -0.8511619567871094, -0.8268966674804688, -0.8026313781738281, -0.7783660888671875, -0.7541007995605469, -0.7298355102539062, -0.7055702209472656, -0.681304931640625, -0.6570396423339844, -0.6327743530273438, -0.6085090637207031, -0.5842437744140625, -0.5599784851074219, -0.5357131958007812, -0.5114479064941406, -0.4871826171875, -0.4629173278808594, -0.43865203857421875, -0.4143867492675781, -0.3901214599609375, -0.3658561706542969, -0.34159088134765625, -0.3173255920410156, -0.293060302734375, -0.2687950134277344, -0.24452972412109375, -0.22026443481445312, -0.1959991455078125, -0.17173385620117188, -0.14746856689453125, -0.12320327758789062, -0.09893798828125, -0.07467269897460938, -0.05040740966796875, -0.026142120361328125, -0.0018768310546875, 0.022388458251953125, 0.04665374755859375, 0.07091903686523438, 0.095184326171875, 0.11944961547851562, 0.14371490478515625, 0.16798019409179688, 0.1922454833984375, 0.21651077270507812, 0.24077606201171875, 0.2650413513183594, 0.289306640625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 32.0, 189.0, 662.0, 100.0, 21.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.177988052368164, -7.979977130889893, -7.781966686248779, -7.583955764770508, -7.385944843292236, -7.187933921813965, -6.989923477172852, -6.79191255569458, -6.593901634216309, -6.395890712738037, -6.197880268096924, -5.999869346618652, -5.801858425140381, -5.603847503662109, -5.405837059020996, -5.207826137542725, -5.009815216064453, -4.811804294586182, -4.613793849945068, -4.415782928466797, -4.217772006988525, -4.019761085510254, -3.8217506408691406, -3.623739719390869, -3.425729274749756, -3.2277185916900635, -3.029707670211792, -2.8316969871520996, -2.633686065673828, -2.4356753826141357, -2.2376646995544434, -2.039653778076172, -1.8416428565979004, -1.6436320543289185, -1.4456212520599365, -1.2476105690002441, -1.0495996475219727, -0.8515889048576355, -0.6535781621932983, -0.4555673599243164, -0.2575565576553345, -0.05954577028751373, 0.138465017080307, 0.33647578954696655, 0.5344865918159485, 0.7324973940849304, 0.9305081367492676, 1.1285189390182495, 1.3265297412872314, 1.5245405435562134, 1.7225513458251953, 1.9205620288848877, 2.118572950363159, 2.3165836334228516, 2.514594554901123, 2.7126052379608154, 2.910615921020508, 3.1086266040802, 3.3066375255584717, 3.504648208618164, 3.7026591300964355, 3.900669813156128, 4.09868049621582, 4.296691417694092, 4.494702339172363]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 17.0, 31.0, 48.0, 69.0, 127.0, 145.0, 154.0, 140.0, 88.0, 82.0, 58.0, 16.0, 16.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9885764122009277, -3.8607213497161865, -3.7328662872314453, -3.605011224746704, -3.477156162261963, -3.349301338195801, -3.2214462757110596, -3.0935912132263184, -2.965736150741577, -2.837881088256836, -2.7100260257720947, -2.5821709632873535, -2.4543161392211914, -2.326460838317871, -2.198606014251709, -2.0707509517669678, -1.9428958892822266, -1.8150408267974854, -1.6871857643127441, -1.5593308210372925, -1.4314757585525513, -1.30362069606781, -1.1757657527923584, -1.0479106903076172, -0.920055627822876, -0.7922005653381348, -0.6643455624580383, -0.5364905595779419, -0.4086354970932007, -0.2807804346084595, -0.15292543172836304, -0.0250704288482666, 0.10278463363647461, 0.23063966631889343, 0.35849469900131226, 0.4863497316837311, 0.6142047643661499, 0.7420598268508911, 0.8699148297309875, 0.997769832611084, 1.1256248950958252, 1.2534799575805664, 1.3813350200653076, 1.5091899633407593, 1.6370450258255005, 1.7649000883102417, 1.8927550315856934, 2.0206100940704346, 2.148465156555176, 2.276320219039917, 2.404175281524658, 2.5320303440093994, 2.6598854064941406, 2.7877402305603027, 2.915595293045044, 3.043450355529785, 3.1713054180145264, 3.2991604804992676, 3.427015542984009, 3.55487060546875, 3.682725429534912, 3.8105807304382324, 3.9384355545043945, 4.066290855407715, 4.194145679473877]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 14.0, 12.0, 17.0, 29.0, 36.0, 52.0, 92.0, 134.0, 304.0, 847.0, 3132.0, 26193.0, 876757.0, 131568.0, 6928.0, 1499.0, 452.0, 182.0, 91.0, 72.0, 39.0, 32.0, 18.0, 18.0, 13.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.689453125, -1.6421661376953125, -1.594879150390625, -1.5475921630859375, -1.50030517578125, -1.4530181884765625, -1.405731201171875, -1.3584442138671875, -1.3111572265625, -1.2638702392578125, -1.216583251953125, -1.1692962646484375, -1.12200927734375, -1.0747222900390625, -1.027435302734375, -0.9801483154296875, -0.932861328125, -0.8855743408203125, -0.838287353515625, -0.7910003662109375, -0.74371337890625, -0.6964263916015625, -0.649139404296875, -0.6018524169921875, -0.5545654296875, -0.5072784423828125, -0.459991455078125, -0.4127044677734375, -0.36541748046875, -0.3181304931640625, -0.270843505859375, -0.2235565185546875, -0.17626953125, -0.1289825439453125, -0.081695556640625, -0.0344085693359375, 0.01287841796875, 0.0601654052734375, 0.107452392578125, 0.1547393798828125, 0.2020263671875, 0.2493133544921875, 0.296600341796875, 0.3438873291015625, 0.39117431640625, 0.4384613037109375, 0.485748291015625, 0.5330352783203125, 0.580322265625, 0.6276092529296875, 0.674896240234375, 0.7221832275390625, 0.76947021484375, 0.8167572021484375, 0.864044189453125, 0.9113311767578125, 0.9586181640625, 1.0059051513671875, 1.053192138671875, 1.1004791259765625, 1.14776611328125, 1.1950531005859375, 1.242340087890625, 1.2896270751953125, 1.3369140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 15.0, 31.0, 50.0, 90.0, 153.0, 175.0, 167.0, 127.0, 89.0, 51.0, 29.0, 11.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344482421875, -0.3369712829589844, -0.32946014404296875, -0.3219490051269531, -0.3144378662109375, -0.3069267272949219, -0.29941558837890625, -0.2919044494628906, -0.284393310546875, -0.2768821716308594, -0.26937103271484375, -0.2618598937988281, -0.2543487548828125, -0.24683761596679688, -0.23932647705078125, -0.23181533813476562, -0.22430419921875, -0.21679306030273438, -0.20928192138671875, -0.20177078247070312, -0.1942596435546875, -0.18674850463867188, -0.17923736572265625, -0.17172622680664062, -0.164215087890625, -0.15670394897460938, -0.14919281005859375, -0.14168167114257812, -0.1341705322265625, -0.12665939331054688, -0.11914825439453125, -0.11163711547851562, -0.1041259765625, -0.09661483764648438, -0.08910369873046875, -0.08159255981445312, -0.0740814208984375, -0.06657028198242188, -0.05905914306640625, -0.051548004150390625, -0.044036865234375, -0.036525726318359375, -0.02901458740234375, -0.021503448486328125, -0.0139923095703125, -0.006481170654296875, 0.00102996826171875, 0.008541107177734375, 0.01605224609375, 0.023563385009765625, 0.03107452392578125, 0.038585662841796875, 0.0460968017578125, 0.053607940673828125, 0.06111907958984375, 0.06863021850585938, 0.076141357421875, 0.08365249633789062, 0.09116363525390625, 0.09867477416992188, 0.1061859130859375, 0.11369705200195312, 0.12120819091796875, 0.12871932983398438, 0.13623046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 8.0, 3.0, 6.0, 13.0, 13.0, 13.0, 14.0, 27.0, 39.0, 41.0, 103.0, 200.0, 477.0, 1552.0, 7747.0, 72380.0, 807991.0, 142566.0, 12034.0, 2140.0, 600.0, 247.0, 116.0, 57.0, 34.0, 28.0, 16.0, 15.0, 8.0, 11.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.6234817504882812, -0.6024322509765625, -0.5813827514648438, -0.560333251953125, -0.5392837524414062, -0.5182342529296875, -0.49718475341796875, -0.47613525390625, -0.45508575439453125, -0.4340362548828125, -0.41298675537109375, -0.391937255859375, -0.37088775634765625, -0.3498382568359375, -0.32878875732421875, -0.3077392578125, -0.28668975830078125, -0.2656402587890625, -0.24459075927734375, -0.223541259765625, -0.20249176025390625, -0.1814422607421875, -0.16039276123046875, -0.13934326171875, -0.11829376220703125, -0.0972442626953125, -0.07619476318359375, -0.055145263671875, -0.03409576416015625, -0.0130462646484375, 0.00800323486328125, 0.029052734375, 0.05010223388671875, 0.0711517333984375, 0.09220123291015625, 0.113250732421875, 0.13430023193359375, 0.1553497314453125, 0.17639923095703125, 0.19744873046875, 0.21849822998046875, 0.2395477294921875, 0.26059722900390625, 0.281646728515625, 0.30269622802734375, 0.3237457275390625, 0.34479522705078125, 0.3658447265625, 0.38689422607421875, 0.4079437255859375, 0.42899322509765625, 0.450042724609375, 0.47109222412109375, 0.4921417236328125, 0.5131912231445312, 0.53424072265625, 0.5552902221679688, 0.5763397216796875, 0.5973892211914062, 0.618438720703125, 0.6394882202148438, 0.6605377197265625, 0.6815872192382812, 0.70263671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 7.0, 6.0, 8.0, 8.0, 10.0, 17.0, 12.0, 22.0, 31.0, 38.0, 35.0, 42.0, 46.0, 45.0, 63.0, 59.0, 56.0, 48.0, 46.0, 55.0, 50.0, 44.0, 50.0, 35.0, 23.0, 22.0, 24.0, 16.0, 13.0, 8.0, 5.0, 13.0, 4.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.362548828125, -0.3512382507324219, -0.33992767333984375, -0.3286170959472656, -0.3173065185546875, -0.3059959411621094, -0.29468536376953125, -0.2833747863769531, -0.272064208984375, -0.2607536315917969, -0.24944305419921875, -0.23813247680664062, -0.2268218994140625, -0.21551132202148438, -0.20420074462890625, -0.19289016723632812, -0.18157958984375, -0.17026901245117188, -0.15895843505859375, -0.14764785766601562, -0.1363372802734375, -0.12502670288085938, -0.11371612548828125, -0.10240554809570312, -0.091094970703125, -0.07978439331054688, -0.06847381591796875, -0.057163238525390625, -0.0458526611328125, -0.034542083740234375, -0.02323150634765625, -0.011920928955078125, -0.0006103515625, 0.010700225830078125, 0.02201080322265625, 0.033321380615234375, 0.0446319580078125, 0.055942535400390625, 0.06725311279296875, 0.07856369018554688, 0.089874267578125, 0.10118484497070312, 0.11249542236328125, 0.12380599975585938, 0.1351165771484375, 0.14642715454101562, 0.15773773193359375, 0.16904830932617188, 0.18035888671875, 0.19166946411132812, 0.20298004150390625, 0.21429061889648438, 0.2256011962890625, 0.23691177368164062, 0.24822235107421875, 0.2595329284667969, 0.270843505859375, 0.2821540832519531, 0.29346466064453125, 0.3047752380371094, 0.3160858154296875, 0.3273963928222656, 0.33870697021484375, 0.3500175476074219, 0.361328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 1.0, 9.0, 5.0, 6.0, 23.0, 31.0, 36.0, 73.0, 155.0, 276.0, 786.0, 2824.0, 20945.0, 887824.0, 126701.0, 6471.0, 1425.0, 470.0, 226.0, 111.0, 54.0, 33.0, 27.0, 15.0, 10.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.763671875, -0.742889404296875, -0.72210693359375, -0.701324462890625, -0.6805419921875, -0.659759521484375, -0.63897705078125, -0.618194580078125, -0.597412109375, -0.576629638671875, -0.55584716796875, -0.535064697265625, -0.5142822265625, -0.493499755859375, -0.47271728515625, -0.451934814453125, -0.43115234375, -0.410369873046875, -0.38958740234375, -0.368804931640625, -0.3480224609375, -0.327239990234375, -0.30645751953125, -0.285675048828125, -0.264892578125, -0.244110107421875, -0.22332763671875, -0.202545166015625, -0.1817626953125, -0.160980224609375, -0.14019775390625, -0.119415283203125, -0.0986328125, -0.077850341796875, -0.05706787109375, -0.036285400390625, -0.0155029296875, 0.005279541015625, 0.02606201171875, 0.046844482421875, 0.067626953125, 0.088409423828125, 0.10919189453125, 0.129974365234375, 0.1507568359375, 0.171539306640625, 0.19232177734375, 0.213104248046875, 0.23388671875, 0.254669189453125, 0.27545166015625, 0.296234130859375, 0.3170166015625, 0.337799072265625, 0.35858154296875, 0.379364013671875, 0.400146484375, 0.420928955078125, 0.44171142578125, 0.462493896484375, 0.4832763671875, 0.504058837890625, 0.52484130859375, 0.545623779296875, 0.56640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 9.0, 13.0, 19.0, 31.0, 42.0, 63.0, 87.0, 142.0, 192.0, 123.0, 89.0, 57.0, 40.0, 28.0, 18.0, 19.0, 12.0, 6.0, 4.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000949859619140625, -0.0009294338524341583, -0.0009090080857276917, -0.000888582319021225, -0.0008681565523147583, -0.0008477307856082916, -0.000827305018901825, -0.0008068792521953583, -0.0007864534854888916, -0.0007660277187824249, -0.0007456019520759583, -0.0007251761853694916, -0.0007047504186630249, -0.0006843246519565582, -0.0006638988852500916, -0.0006434731185436249, -0.0006230473518371582, -0.0006026215851306915, -0.0005821958184242249, -0.0005617700517177582, -0.0005413442850112915, -0.0005209185183048248, -0.0005004927515983582, -0.0004800669848918915, -0.0004596412181854248, -0.00043921545147895813, -0.00041878968477249146, -0.0003983639180660248, -0.0003779381513595581, -0.00035751238465309143, -0.00033708661794662476, -0.0003166608512401581, -0.0002962350845336914, -0.00027580931782722473, -0.00025538355112075806, -0.00023495778441429138, -0.0002145320177078247, -0.00019410625100135803, -0.00017368048429489136, -0.00015325471758842468, -0.000132828950881958, -0.00011240318417549133, -9.197741746902466e-05, -7.155165076255798e-05, -5.112588405609131e-05, -3.0700117349624634e-05, -1.0274350643157959e-05, 1.0151416063308716e-05, 3.057718276977539e-05, 5.1002949476242065e-05, 7.142871618270874e-05, 9.185448288917542e-05, 0.00011228024959564209, 0.00013270601630210876, 0.00015313178300857544, 0.00017355754971504211, 0.0001939833164215088, 0.00021440908312797546, 0.00023483484983444214, 0.0002552606165409088, 0.0002756863832473755, 0.00029611214995384216, 0.00031653791666030884, 0.0003369636833667755, 0.0003573894500732422]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 17.0, 28.0, 43.0, 86.0, 193.0, 369.0, 962.0, 3627.0, 24012.0, 727462.0, 274901.0, 12961.0, 2483.0, 795.0, 283.0, 134.0, 66.0, 36.0, 29.0, 18.0, 7.0, 8.0, 2.0, 6.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.595703125, -0.5790901184082031, -0.5624771118164062, -0.5458641052246094, -0.5292510986328125, -0.5126380920410156, -0.49602508544921875, -0.4794120788574219, -0.462799072265625, -0.4461860656738281, -0.42957305908203125, -0.4129600524902344, -0.3963470458984375, -0.3797340393066406, -0.36312103271484375, -0.3465080261230469, -0.32989501953125, -0.3132820129394531, -0.29666900634765625, -0.2800559997558594, -0.2634429931640625, -0.24682998657226562, -0.23021697998046875, -0.21360397338867188, -0.196990966796875, -0.18037796020507812, -0.16376495361328125, -0.14715194702148438, -0.1305389404296875, -0.11392593383789062, -0.09731292724609375, -0.08069992065429688, -0.0640869140625, -0.047473907470703125, -0.03086090087890625, -0.014247894287109375, 0.0023651123046875, 0.018978118896484375, 0.03559112548828125, 0.052204132080078125, 0.068817138671875, 0.08543014526367188, 0.10204315185546875, 0.11865615844726562, 0.1352691650390625, 0.15188217163085938, 0.16849517822265625, 0.18510818481445312, 0.20172119140625, 0.21833419799804688, 0.23494720458984375, 0.2515602111816406, 0.2681732177734375, 0.2847862243652344, 0.30139923095703125, 0.3180122375488281, 0.334625244140625, 0.3512382507324219, 0.36785125732421875, 0.3844642639160156, 0.4010772705078125, 0.4176902770996094, 0.43430328369140625, 0.4509162902832031, 0.467529296875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 6.0, 16.0, 16.0, 31.0, 61.0, 114.0, 198.0, 230.0, 141.0, 72.0, 39.0, 23.0, 22.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.339599609375, -0.3299293518066406, -0.32025909423828125, -0.3105888366699219, -0.3009185791015625, -0.2912483215332031, -0.28157806396484375, -0.2719078063964844, -0.262237548828125, -0.2525672912597656, -0.24289703369140625, -0.23322677612304688, -0.2235565185546875, -0.21388626098632812, -0.20421600341796875, -0.19454574584960938, -0.18487548828125, -0.17520523071289062, -0.16553497314453125, -0.15586471557617188, -0.1461944580078125, -0.13652420043945312, -0.12685394287109375, -0.11718368530273438, -0.107513427734375, -0.09784317016601562, -0.08817291259765625, -0.07850265502929688, -0.0688323974609375, -0.059162139892578125, -0.04949188232421875, -0.039821624755859375, -0.0301513671875, -0.020481109619140625, -0.01081085205078125, -0.001140594482421875, 0.0085296630859375, 0.018199920654296875, 0.02787017822265625, 0.037540435791015625, 0.047210693359375, 0.056880950927734375, 0.06655120849609375, 0.07622146606445312, 0.0858917236328125, 0.09556198120117188, 0.10523223876953125, 0.11490249633789062, 0.12457275390625, 0.13424301147460938, 0.14391326904296875, 0.15358352661132812, 0.1632537841796875, 0.17292404174804688, 0.18259429931640625, 0.19226455688476562, 0.201934814453125, 0.21160507202148438, 0.22127532958984375, 0.23094558715820312, 0.2406158447265625, 0.2502861022949219, 0.25995635986328125, 0.2696266174316406, 0.279296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 55.0, 713.0, 216.0, 19.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.172452926635742, -16.811790466308594, -16.451126098632812, -16.09046173095703, -15.729799270629883, -15.369135856628418, -15.008472442626953, -14.647809028625488, -14.287145614624023, -13.926482200622559, -13.565818786621094, -13.205155372619629, -12.844491958618164, -12.4838285446167, -12.123165130615234, -11.76250171661377, -11.401838302612305, -11.04117488861084, -10.680511474609375, -10.31984806060791, -9.959184646606445, -9.59852123260498, -9.237857818603516, -8.87719440460205, -8.516530990600586, -8.155867576599121, -7.795204162597656, -7.434540748596191, -7.073877334594727, -6.713213920593262, -6.352550506591797, -5.991887092590332, -5.631224632263184, -5.270561218261719, -4.909897804260254, -4.549234390258789, -4.188570976257324, -3.8279075622558594, -3.4672441482543945, -3.1065807342529297, -2.745917320251465, -2.38525390625, -2.024590492248535, -1.6639270782470703, -1.3032636642456055, -0.9426002502441406, -0.5819368362426758, -0.22127342224121094, 0.1393899917602539, 0.5000534057617188, 0.8607168197631836, 1.2213802337646484, 1.5820436477661133, 1.9427070617675781, 2.303370475769043, 2.664033889770508, 3.0246973037719727, 3.3853607177734375, 3.7460241317749023, 4.106687545776367, 4.467350959777832, 4.828014373779297, 5.188677787780762, 5.549341201782227, 5.910004615783691]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 9.0, 15.0, 15.0, 10.0, 18.0, 35.0, 32.0, 38.0, 48.0, 50.0, 63.0, 53.0, 61.0, 44.0, 69.0, 66.0, 46.0, 57.0, 49.0, 41.0, 37.0, 23.0, 20.0, 22.0, 17.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3792190551757812, -2.297229528427124, -2.215240001678467, -2.1332504749298096, -2.0512609481811523, -1.9692714214324951, -1.887281894683838, -1.8052923679351807, -1.7233028411865234, -1.6413133144378662, -1.559323787689209, -1.4773342609405518, -1.3953447341918945, -1.3133552074432373, -1.23136568069458, -1.1493761539459229, -1.0673866271972656, -0.9853971004486084, -0.9034075736999512, -0.821418046951294, -0.7394285202026367, -0.6574389934539795, -0.5754494667053223, -0.49345993995666504, -0.4114704132080078, -0.3294808864593506, -0.24749135971069336, -0.16550183296203613, -0.0835123062133789, -0.0015227794647216797, 0.08046674728393555, 0.16245627403259277, 0.24444580078125, 0.3264353275299072, 0.40842485427856445, 0.4904143810272217, 0.5724039077758789, 0.6543934345245361, 0.7363829612731934, 0.8183724880218506, 0.9003620147705078, 0.982351541519165, 1.0643410682678223, 1.1463305950164795, 1.2283201217651367, 1.310309648513794, 1.3922991752624512, 1.4742887020111084, 1.5562782287597656, 1.6382677555084229, 1.72025728225708, 1.8022468090057373, 1.8842363357543945, 1.9662258625030518, 2.048215389251709, 2.130204916000366, 2.2121944427490234, 2.2941839694976807, 2.376173496246338, 2.458163022994995, 2.5401525497436523, 2.6221420764923096, 2.704131603240967, 2.786121129989624, 2.8681106567382812]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 7.0, 13.0, 6.0, 24.0, 13.0, 25.0, 31.0, 32.0, 44.0, 56.0, 84.0, 112.0, 149.0, 243.0, 470.0, 1061.0, 3158.0, 16811.0, 304873.0, 3817401.0, 41708.0, 5820.0, 1401.0, 448.0, 149.0, 72.0, 33.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-2.439453125, -2.3908462524414062, -2.3422393798828125, -2.2936325073242188, -2.245025634765625, -2.1964187622070312, -2.1478118896484375, -2.0992050170898438, -2.05059814453125, -2.0019912719726562, -1.9533843994140625, -1.9047775268554688, -1.856170654296875, -1.8075637817382812, -1.7589569091796875, -1.7103500366210938, -1.6617431640625, -1.6131362915039062, -1.5645294189453125, -1.5159225463867188, -1.467315673828125, -1.4187088012695312, -1.3701019287109375, -1.3214950561523438, -1.27288818359375, -1.2242813110351562, -1.1756744384765625, -1.1270675659179688, -1.078460693359375, -1.0298538208007812, -0.9812469482421875, -0.9326400756835938, -0.884033203125, -0.8354263305664062, -0.7868194580078125, -0.7382125854492188, -0.689605712890625, -0.6409988403320312, -0.5923919677734375, -0.5437850952148438, -0.49517822265625, -0.44657135009765625, -0.3979644775390625, -0.34935760498046875, -0.300750732421875, -0.25214385986328125, -0.2035369873046875, -0.15493011474609375, -0.1063232421875, -0.05771636962890625, -0.0091094970703125, 0.03949737548828125, 0.088104248046875, 0.13671112060546875, 0.1853179931640625, 0.23392486572265625, 0.28253173828125, 0.33113861083984375, 0.3797454833984375, 0.42835235595703125, 0.476959228515625, 0.5255661010742188, 0.5741729736328125, 0.6227798461914062, 0.67138671875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 11.0, 12.0, 30.0, 56.0, 86.0, 109.0, 138.0, 172.0, 135.0, 104.0, 52.0, 42.0, 26.0, 22.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.352783203125, -0.3457651138305664, -0.3387470245361328, -0.3317289352416992, -0.3247108459472656, -0.31769275665283203, -0.31067466735839844, -0.30365657806396484, -0.29663848876953125, -0.28962039947509766, -0.28260231018066406, -0.27558422088623047, -0.2685661315917969, -0.2615480422973633, -0.2545299530029297, -0.2475118637084961, -0.2404937744140625, -0.2334756851196289, -0.2264575958251953, -0.21943950653076172, -0.21242141723632812, -0.20540332794189453, -0.19838523864746094, -0.19136714935302734, -0.18434906005859375, -0.17733097076416016, -0.17031288146972656, -0.16329479217529297, -0.15627670288085938, -0.14925861358642578, -0.1422405242919922, -0.1352224349975586, -0.128204345703125, -0.1211862564086914, -0.11416816711425781, -0.10715007781982422, -0.10013198852539062, -0.09311389923095703, -0.08609580993652344, -0.07907772064208984, -0.07205963134765625, -0.06504154205322266, -0.05802345275878906, -0.05100536346435547, -0.043987274169921875, -0.03696918487548828, -0.029951095581054688, -0.022933006286621094, -0.0159149169921875, -0.008896827697753906, -0.0018787384033203125, 0.005139350891113281, 0.012157440185546875, 0.01917552947998047, 0.026193618774414062, 0.033211708068847656, 0.04022979736328125, 0.047247886657714844, 0.05426597595214844, 0.06128406524658203, 0.06830215454101562, 0.07532024383544922, 0.08233833312988281, 0.0893564224243164, 0.09637451171875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 12.0, 31.0, 79.0, 123.0, 321.0, 1191.0, 84105.0, 4106574.0, 1421.0, 250.0, 83.0, 45.0, 27.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.201904296875, -7.05224609375, -6.902587890625, -6.7529296875, -6.603271484375, -6.45361328125, -6.303955078125, -6.154296875, -6.004638671875, -5.85498046875, -5.705322265625, -5.5556640625, -5.406005859375, -5.25634765625, -5.106689453125, -4.95703125, -4.807373046875, -4.65771484375, -4.508056640625, -4.3583984375, -4.208740234375, -4.05908203125, -3.909423828125, -3.759765625, -3.610107421875, -3.46044921875, -3.310791015625, -3.1611328125, -3.011474609375, -2.86181640625, -2.712158203125, -2.5625, -2.412841796875, -2.26318359375, -2.113525390625, -1.9638671875, -1.814208984375, -1.66455078125, -1.514892578125, -1.365234375, -1.215576171875, -1.06591796875, -0.916259765625, -0.7666015625, -0.616943359375, -0.46728515625, -0.317626953125, -0.16796875, -0.018310546875, 0.13134765625, 0.281005859375, 0.4306640625, 0.580322265625, 0.72998046875, 0.879638671875, 1.029296875, 1.178955078125, 1.32861328125, 1.478271484375, 1.6279296875, 1.777587890625, 1.92724609375, 2.076904296875, 2.2265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 12.0, 42.0, 94.0, 508.0, 3076.0, 232.0, 53.0, 26.0, 13.0, 9.0, 4.0, 1.0, 2.0, 3.0], "bins": [-0.8466796875, -0.8310966491699219, -0.8155136108398438, -0.7999305725097656, -0.7843475341796875, -0.7687644958496094, -0.7531814575195312, -0.7375984191894531, -0.722015380859375, -0.7064323425292969, -0.6908493041992188, -0.6752662658691406, -0.6596832275390625, -0.6441001892089844, -0.6285171508789062, -0.6129341125488281, -0.59735107421875, -0.5817680358886719, -0.5661849975585938, -0.5506019592285156, -0.5350189208984375, -0.5194358825683594, -0.5038528442382812, -0.4882698059082031, -0.472686767578125, -0.4571037292480469, -0.44152069091796875, -0.4259376525878906, -0.4103546142578125, -0.3947715759277344, -0.37918853759765625, -0.3636054992675781, -0.3480224609375, -0.3324394226074219, -0.31685638427734375, -0.3012733459472656, -0.2856903076171875, -0.2701072692871094, -0.25452423095703125, -0.23894119262695312, -0.223358154296875, -0.20777511596679688, -0.19219207763671875, -0.17660903930664062, -0.1610260009765625, -0.14544296264648438, -0.12985992431640625, -0.11427688598632812, -0.09869384765625, -0.08311080932617188, -0.06752777099609375, -0.051944732666015625, -0.0363616943359375, -0.020778656005859375, -0.00519561767578125, 0.010387420654296875, 0.025970458984375, 0.041553497314453125, 0.05713653564453125, 0.07271957397460938, 0.0883026123046875, 0.10388565063476562, 0.11946868896484375, 0.13505172729492188, 0.150634765625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 3.0, 8.0, 15.0, 63.0, 303.0, 457.0, 116.0, 21.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8174827098846436, -3.7092814445495605, -3.6010801792144775, -3.4928789138793945, -3.3846778869628906, -3.2764766216278076, -3.1682753562927246, -3.0600740909576416, -2.9518728256225586, -2.8436715602874756, -2.7354702949523926, -2.6272692680358887, -2.5190680027008057, -2.4108667373657227, -2.3026654720306396, -2.1944642066955566, -2.0862631797790527, -1.9780619144439697, -1.8698607683181763, -1.7616595029830933, -1.6534582376480103, -1.5452570915222168, -1.4370558261871338, -1.3288545608520508, -1.2206532955169678, -1.1124520301818848, -1.0042508840560913, -0.8960496187210083, -0.7878483533859253, -0.6796471476554871, -0.5714459419250488, -0.4632446765899658, -0.3550434112548828, -0.2468421757221222, -0.13864095509052277, -0.03043973445892334, 0.07776150107383728, 0.1859627366065979, 0.29416394233703613, 0.40236520767211914, 0.5105664134025574, 0.6187676191329956, 0.7269688844680786, 0.8351700901985168, 0.9433712959289551, 1.051572561264038, 1.159773826599121, 1.267975091934204, 1.3761762380599976, 1.4843775033950806, 1.592578649520874, 1.700779914855957, 1.80898118019104, 1.917182445526123, 2.025383472442627, 2.133584976196289, 2.241786003112793, 2.349987268447876, 2.458188533782959, 2.566389560699463, 2.674590826034546, 2.782792091369629, 2.890993356704712, 2.999194622039795, 3.107395887374878]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 12.0, 29.0, 44.0, 58.0, 79.0, 81.0, 98.0, 142.0, 113.0, 78.0, 91.0, 57.0, 43.0, 37.0, 15.0, 9.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1972384452819824, -2.1311795711517334, -2.0651204586029053, -1.9990615844726562, -1.9330027103424072, -1.8669437170028687, -1.80088472366333, -1.734825849533081, -1.668766975402832, -1.6027079820632935, -1.5366491079330444, -1.4705901145935059, -1.4045312404632568, -1.3384722471237183, -1.2724132537841797, -1.2063543796539307, -1.140295386314392, -1.0742363929748535, -1.0081775188446045, -0.9421185255050659, -0.8760596513748169, -0.8100006580352783, -0.7439417243003845, -0.6778827905654907, -0.6118238568305969, -0.5457649230957031, -0.4797059893608093, -0.41364702582359314, -0.34758809208869934, -0.28152915835380554, -0.21547019481658936, -0.14941126108169556, -0.08335232734680176, -0.017293386161327362, 0.048765555024147034, 0.11482450366020203, 0.18088343739509583, 0.24694237112998962, 0.3130013346672058, 0.3790602684020996, 0.4451192021369934, 0.5111781358718872, 0.577237069606781, 0.6432960033416748, 0.7093549966812134, 0.7754138708114624, 0.841472864151001, 0.9075317978858948, 0.9735907316207886, 1.0396497249603271, 1.1057085990905762, 1.1717675924301147, 1.2378264665603638, 1.3038854598999023, 1.3699443340301514, 1.43600332736969, 1.5020623207092285, 1.568121314048767, 1.6341801881790161, 1.7002391815185547, 1.7662980556488037, 1.8323570489883423, 1.8984160423278809, 1.9644749164581299, 2.030533790588379]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 11.0, 16.0, 9.0, 19.0, 36.0, 33.0, 51.0, 81.0, 106.0, 189.0, 359.0, 583.0, 1276.0, 3682.0, 14768.0, 102571.0, 758103.0, 140754.0, 18553.0, 4271.0, 1469.0, 653.0, 332.0, 213.0, 120.0, 75.0, 55.0, 37.0, 31.0, 28.0, 10.0, 16.0, 8.0, 5.0, 7.0, 8.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.85546875, -0.830718994140625, -0.80596923828125, -0.781219482421875, -0.7564697265625, -0.731719970703125, -0.70697021484375, -0.682220458984375, -0.657470703125, -0.632720947265625, -0.60797119140625, -0.583221435546875, -0.5584716796875, -0.533721923828125, -0.50897216796875, -0.484222412109375, -0.45947265625, -0.434722900390625, -0.40997314453125, -0.385223388671875, -0.3604736328125, -0.335723876953125, -0.31097412109375, -0.286224365234375, -0.261474609375, -0.236724853515625, -0.21197509765625, -0.187225341796875, -0.1624755859375, -0.137725830078125, -0.11297607421875, -0.088226318359375, -0.0634765625, -0.038726806640625, -0.01397705078125, 0.010772705078125, 0.0355224609375, 0.060272216796875, 0.08502197265625, 0.109771728515625, 0.134521484375, 0.159271240234375, 0.18402099609375, 0.208770751953125, 0.2335205078125, 0.258270263671875, 0.28302001953125, 0.307769775390625, 0.33251953125, 0.357269287109375, 0.38201904296875, 0.406768798828125, 0.4315185546875, 0.456268310546875, 0.48101806640625, 0.505767822265625, 0.530517578125, 0.555267333984375, 0.58001708984375, 0.604766845703125, 0.6295166015625, 0.654266357421875, 0.67901611328125, 0.703765869140625, 0.728515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 15.0, 28.0, 58.0, 73.0, 90.0, 103.0, 129.0, 125.0, 99.0, 98.0, 62.0, 44.0, 24.0, 16.0, 9.0, 4.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.358154296875, -0.35033416748046875, -0.3425140380859375, -0.33469390869140625, -0.326873779296875, -0.31905364990234375, -0.3112335205078125, -0.30341339111328125, -0.29559326171875, -0.28777313232421875, -0.2799530029296875, -0.27213287353515625, -0.264312744140625, -0.25649261474609375, -0.2486724853515625, -0.24085235595703125, -0.2330322265625, -0.22521209716796875, -0.2173919677734375, -0.20957183837890625, -0.201751708984375, -0.19393157958984375, -0.1861114501953125, -0.17829132080078125, -0.17047119140625, -0.16265106201171875, -0.1548309326171875, -0.14701080322265625, -0.139190673828125, -0.13137054443359375, -0.1235504150390625, -0.11573028564453125, -0.10791015625, -0.10009002685546875, -0.0922698974609375, -0.08444976806640625, -0.076629638671875, -0.06880950927734375, -0.0609893798828125, -0.05316925048828125, -0.04534912109375, -0.03752899169921875, -0.0297088623046875, -0.02188873291015625, -0.014068603515625, -0.00624847412109375, 0.0015716552734375, 0.00939178466796875, 0.0172119140625, 0.02503204345703125, 0.0328521728515625, 0.04067230224609375, 0.048492431640625, 0.05631256103515625, 0.0641326904296875, 0.07195281982421875, 0.07977294921875, 0.08759307861328125, 0.0954132080078125, 0.10323333740234375, 0.111053466796875, 0.11887359619140625, 0.1266937255859375, 0.13451385498046875, 0.142333984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 8.0, 8.0, 7.0, 8.0, 14.0, 27.0, 25.0, 47.0, 101.0, 158.0, 336.0, 795.0, 2299.0, 7868.0, 38259.0, 407027.0, 529414.0, 48386.0, 9239.0, 2754.0, 928.0, 390.0, 175.0, 99.0, 51.0, 27.0, 20.0, 17.0, 17.0, 7.0, 3.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5732421875, -0.5547866821289062, -0.5363311767578125, -0.5178756713867188, -0.499420166015625, -0.48096466064453125, -0.4625091552734375, -0.44405364990234375, -0.42559814453125, -0.40714263916015625, -0.3886871337890625, -0.37023162841796875, -0.351776123046875, -0.33332061767578125, -0.3148651123046875, -0.29640960693359375, -0.2779541015625, -0.25949859619140625, -0.2410430908203125, -0.22258758544921875, -0.204132080078125, -0.18567657470703125, -0.1672210693359375, -0.14876556396484375, -0.13031005859375, -0.11185455322265625, -0.0933990478515625, -0.07494354248046875, -0.056488037109375, -0.03803253173828125, -0.0195770263671875, -0.00112152099609375, 0.017333984375, 0.03578948974609375, 0.0542449951171875, 0.07270050048828125, 0.091156005859375, 0.10961151123046875, 0.1280670166015625, 0.14652252197265625, 0.16497802734375, 0.18343353271484375, 0.2018890380859375, 0.22034454345703125, 0.238800048828125, 0.25725555419921875, 0.2757110595703125, 0.29416656494140625, 0.3126220703125, 0.33107757568359375, 0.3495330810546875, 0.36798858642578125, 0.386444091796875, 0.40489959716796875, 0.4233551025390625, 0.44181060791015625, 0.46026611328125, 0.47872161865234375, 0.4971771240234375, 0.5156326293945312, 0.534088134765625, 0.5525436401367188, 0.5709991455078125, 0.5894546508789062, 0.60791015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 10.0, 4.0, 9.0, 9.0, 12.0, 7.0, 22.0, 18.0, 34.0, 29.0, 44.0, 46.0, 52.0, 51.0, 54.0, 44.0, 71.0, 57.0, 74.0, 60.0, 47.0, 30.0, 37.0, 34.0, 25.0, 18.0, 20.0, 7.0, 13.0, 14.0, 5.0, 5.0, 5.0, 9.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.5009765625, -0.48497772216796875, -0.4689788818359375, -0.45298004150390625, -0.436981201171875, -0.42098236083984375, -0.4049835205078125, -0.38898468017578125, -0.37298583984375, -0.35698699951171875, -0.3409881591796875, -0.32498931884765625, -0.308990478515625, -0.29299163818359375, -0.2769927978515625, -0.26099395751953125, -0.2449951171875, -0.22899627685546875, -0.2129974365234375, -0.19699859619140625, -0.180999755859375, -0.16500091552734375, -0.1490020751953125, -0.13300323486328125, -0.11700439453125, -0.10100555419921875, -0.0850067138671875, -0.06900787353515625, -0.053009033203125, -0.03701019287109375, -0.0210113525390625, -0.00501251220703125, 0.010986328125, 0.02698516845703125, 0.0429840087890625, 0.05898284912109375, 0.074981689453125, 0.09098052978515625, 0.1069793701171875, 0.12297821044921875, 0.13897705078125, 0.15497589111328125, 0.1709747314453125, 0.18697357177734375, 0.202972412109375, 0.21897125244140625, 0.2349700927734375, 0.25096893310546875, 0.2669677734375, 0.28296661376953125, 0.2989654541015625, 0.31496429443359375, 0.330963134765625, 0.34696197509765625, 0.3629608154296875, 0.37895965576171875, 0.39495849609375, 0.41095733642578125, 0.4269561767578125, 0.44295501708984375, 0.458953857421875, 0.47495269775390625, 0.4909515380859375, 0.5069503784179688, 0.52294921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 4.0, 6.0, 3.0, 3.0, 6.0, 3.0, 12.0, 8.0, 17.0, 24.0, 47.0, 62.0, 94.0, 207.0, 412.0, 967.0, 2486.0, 7692.0, 39571.0, 739279.0, 232314.0, 17601.0, 4726.0, 1629.0, 685.0, 293.0, 159.0, 84.0, 43.0, 29.0, 20.0, 11.0, 13.0, 7.0, 9.0, 2.0, 9.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337158203125, -0.3265533447265625, -0.315948486328125, -0.3053436279296875, -0.29473876953125, -0.2841339111328125, -0.273529052734375, -0.2629241943359375, -0.2523193359375, -0.2417144775390625, -0.231109619140625, -0.2205047607421875, -0.20989990234375, -0.1992950439453125, -0.188690185546875, -0.1780853271484375, -0.16748046875, -0.1568756103515625, -0.146270751953125, -0.1356658935546875, -0.12506103515625, -0.1144561767578125, -0.103851318359375, -0.0932464599609375, -0.0826416015625, -0.0720367431640625, -0.061431884765625, -0.0508270263671875, -0.04022216796875, -0.0296173095703125, -0.019012451171875, -0.0084075927734375, 0.002197265625, 0.0128021240234375, 0.023406982421875, 0.0340118408203125, 0.04461669921875, 0.0552215576171875, 0.065826416015625, 0.0764312744140625, 0.0870361328125, 0.0976409912109375, 0.108245849609375, 0.1188507080078125, 0.12945556640625, 0.1400604248046875, 0.150665283203125, 0.1612701416015625, 0.171875, 0.1824798583984375, 0.193084716796875, 0.2036895751953125, 0.21429443359375, 0.2248992919921875, 0.235504150390625, 0.2461090087890625, 0.2567138671875, 0.2673187255859375, 0.277923583984375, 0.2885284423828125, 0.29913330078125, 0.3097381591796875, 0.320343017578125, 0.3309478759765625, 0.341552734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 5.0, 9.0, 9.0, 23.0, 27.0, 28.0, 39.0, 52.0, 60.0, 81.0, 100.0, 102.0, 121.0, 80.0, 52.0, 43.0, 45.0, 19.0, 17.0, 20.0, 17.0, 13.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020074844360351562, -0.00019417330622673035, -0.00018759816884994507, -0.0001810230314731598, -0.0001744478940963745, -0.00016787275671958923, -0.00016129761934280396, -0.00015472248196601868, -0.0001481473445892334, -0.00014157220721244812, -0.00013499706983566284, -0.00012842193245887756, -0.00012184679508209229, -0.00011527165770530701, -0.00010869652032852173, -0.00010212138295173645, -9.554624557495117e-05, -8.89711081981659e-05, -8.239597082138062e-05, -7.582083344459534e-05, -6.924569606781006e-05, -6.267055869102478e-05, -5.60954213142395e-05, -4.9520283937454224e-05, -4.2945146560668945e-05, -3.637000918388367e-05, -2.979487180709839e-05, -2.321973443031311e-05, -1.6644597053527832e-05, -1.0069459676742554e-05, -3.4943222999572754e-06, 3.080815076828003e-06, 9.655952453613281e-06, 1.623108983039856e-05, 2.2806227207183838e-05, 2.9381364583969116e-05, 3.5956501960754395e-05, 4.253163933753967e-05, 4.910677671432495e-05, 5.568191409111023e-05, 6.225705146789551e-05, 6.883218884468079e-05, 7.540732622146606e-05, 8.198246359825134e-05, 8.855760097503662e-05, 9.51327383518219e-05, 0.00010170787572860718, 0.00010828301310539246, 0.00011485815048217773, 0.00012143328785896301, 0.0001280084252357483, 0.00013458356261253357, 0.00014115869998931885, 0.00014773383736610413, 0.0001543089747428894, 0.00016088411211967468, 0.00016745924949645996, 0.00017403438687324524, 0.00018060952425003052, 0.0001871846616268158, 0.00019375979900360107, 0.00020033493638038635, 0.00020691007375717163, 0.0002134852111339569, 0.0002200603485107422]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 2.0, 9.0, 10.0, 7.0, 5.0, 20.0, 27.0, 29.0, 64.0, 62.0, 93.0, 157.0, 233.0, 363.0, 681.0, 1137.0, 2168.0, 4105.0, 8915.0, 29630.0, 224974.0, 659007.0, 86581.0, 16838.0, 6391.0, 3094.0, 1643.0, 871.0, 515.0, 319.0, 190.0, 105.0, 81.0, 47.0, 36.0, 23.0, 33.0, 27.0, 12.0, 13.0, 6.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2147216796875, -0.20827293395996094, -0.20182418823242188, -0.1953754425048828, -0.18892669677734375, -0.1824779510498047, -0.17602920532226562, -0.16958045959472656, -0.1631317138671875, -0.15668296813964844, -0.15023422241210938, -0.1437854766845703, -0.13733673095703125, -0.1308879852294922, -0.12443923950195312, -0.11799049377441406, -0.111541748046875, -0.10509300231933594, -0.09864425659179688, -0.09219551086425781, -0.08574676513671875, -0.07929801940917969, -0.07284927368164062, -0.06640052795410156, -0.0599517822265625, -0.05350303649902344, -0.047054290771484375, -0.04060554504394531, -0.03415679931640625, -0.027708053588867188, -0.021259307861328125, -0.014810562133789062, -0.00836181640625, -0.0019130706787109375, 0.004535675048828125, 0.010984420776367188, 0.01743316650390625, 0.023881912231445312, 0.030330657958984375, 0.03677940368652344, 0.0432281494140625, 0.04967689514160156, 0.056125640869140625, 0.06257438659667969, 0.06902313232421875, 0.07547187805175781, 0.08192062377929688, 0.08836936950683594, 0.094818115234375, 0.10126686096191406, 0.10771560668945312, 0.11416435241699219, 0.12061309814453125, 0.1270618438720703, 0.13351058959960938, 0.13995933532714844, 0.1464080810546875, 0.15285682678222656, 0.15930557250976562, 0.1657543182373047, 0.17220306396484375, 0.1786518096923828, 0.18510055541992188, 0.19154930114746094, 0.197998046875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 8.0, 10.0, 10.0, 23.0, 44.0, 63.0, 89.0, 142.0, 180.0, 149.0, 99.0, 57.0, 38.0, 25.0, 15.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.19840049743652344, -0.19233322143554688, -0.1862659454345703, -0.18019866943359375, -0.1741313934326172, -0.16806411743164062, -0.16199684143066406, -0.1559295654296875, -0.14986228942871094, -0.14379501342773438, -0.1377277374267578, -0.13166046142578125, -0.1255931854248047, -0.11952590942382812, -0.11345863342285156, -0.107391357421875, -0.10132408142089844, -0.09525680541992188, -0.08918952941894531, -0.08312225341796875, -0.07705497741699219, -0.07098770141601562, -0.06492042541503906, -0.0588531494140625, -0.05278587341308594, -0.046718597412109375, -0.04065132141113281, -0.03458404541015625, -0.028516769409179688, -0.022449493408203125, -0.016382217407226562, -0.01031494140625, -0.0042476654052734375, 0.001819610595703125, 0.007886886596679688, 0.01395416259765625, 0.020021438598632812, 0.026088714599609375, 0.03215599060058594, 0.0382232666015625, 0.04429054260253906, 0.050357818603515625, 0.05642509460449219, 0.06249237060546875, 0.06855964660644531, 0.07462692260742188, 0.08069419860839844, 0.086761474609375, 0.09282875061035156, 0.09889602661132812, 0.10496330261230469, 0.11103057861328125, 0.11709785461425781, 0.12316513061523438, 0.12923240661621094, 0.1352996826171875, 0.14136695861816406, 0.14743423461914062, 0.1535015106201172, 0.15956878662109375, 0.1656360626220703, 0.17170333862304688, 0.17777061462402344, 0.183837890625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 27.0, 52.0, 88.0, 158.0, 219.0, 190.0, 107.0, 57.0, 30.0, 12.0, 14.0, 4.0, 9.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4275474548339844, -3.336244821548462, -3.2449419498443604, -3.153639316558838, -3.0623364448547363, -2.971033811569214, -2.8797311782836914, -2.78842830657959, -2.6971256732940674, -2.605823040008545, -2.5145201683044434, -2.423217535018921, -2.3319146633148193, -2.240612030029297, -2.1493091583251953, -2.058006525039673, -1.9667037725448608, -1.8754010200500488, -1.7840982675552368, -1.6927955150604248, -1.6014928817749023, -1.5101901292800903, -1.4188873767852783, -1.3275847434997559, -1.2362818717956543, -1.1449791193008423, -1.0536763668060303, -0.962373673915863, -0.8710709810256958, -0.7797682285308838, -0.6884654760360718, -0.5971627831459045, -0.5058600902557373, -0.4145573675632477, -0.32325464487075806, -0.23195189237594604, -0.14064916968345642, -0.0493464469909668, 0.041956305503845215, 0.13325899839401245, 0.22456175088882446, 0.3158644735813141, 0.4071671962738037, 0.4984699487686157, 0.5897727012634277, 0.681075394153595, 0.772378146648407, 0.8636808395385742, 0.9549835920333862, 1.0462863445281982, 1.1375890970230103, 1.2288918495178223, 1.3201944828033447, 1.4114972352981567, 1.5027999877929688, 1.5941026210784912, 1.6854054927825928, 1.7767082452774048, 1.8680109977722168, 1.9593136310577393, 2.050616502761841, 2.1419191360473633, 2.233222007751465, 2.3245246410369873, 2.4158272743225098]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 3.0, 2.0, 10.0, 6.0, 7.0, 15.0, 21.0, 15.0, 19.0, 26.0, 27.0, 29.0, 34.0, 43.0, 33.0, 38.0, 43.0, 47.0, 38.0, 47.0, 42.0, 44.0, 42.0, 37.0, 43.0, 51.0, 33.0, 28.0, 20.0, 29.0, 23.0, 12.0, 16.0, 12.0, 12.0, 7.0, 12.0, 7.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.403439521789551, -2.3265132904052734, -2.249587059020996, -2.1726608276367188, -2.0957345962524414, -2.018808364868164, -1.9418822526931763, -1.864956021308899, -1.7880297899246216, -1.7111035585403442, -1.634177327156067, -1.5572510957717896, -1.4803249835968018, -1.4033987522125244, -1.326472520828247, -1.2495462894439697, -1.1726200580596924, -1.095693826675415, -1.0187675952911377, -0.9418414235115051, -0.8649151921272278, -0.7879889607429504, -0.7110627889633179, -0.6341365575790405, -0.5572103261947632, -0.48028409481048584, -0.4033578932285309, -0.3264316916465759, -0.24950546026229858, -0.17257922887802124, -0.09565302729606628, -0.018726825714111328, 0.058199405670166016, 0.13512562215328217, 0.21205183863639832, 0.28897804021835327, 0.3659042716026306, 0.44283050298690796, 0.5197566747665405, 0.5966829061508179, 0.6736091375350952, 0.7505353689193726, 0.8274616003036499, 0.9043877720832825, 0.9813140034675598, 1.0582401752471924, 1.1351664066314697, 1.212092638015747, 1.2890188694000244, 1.3659451007843018, 1.442871332168579, 1.5197975635528564, 1.5967237949371338, 1.6736500263214111, 1.750576138496399, 1.8275023698806763, 1.9044286012649536, 1.981354832649231, 2.0582809448242188, 2.135207176208496, 2.2121334075927734, 2.289059638977051, 2.365985870361328, 2.4429121017456055, 2.519838333129883]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 8.0, 5.0, 13.0, 10.0, 18.0, 18.0, 37.0, 37.0, 55.0, 65.0, 96.0, 131.0, 195.0, 282.0, 522.0, 1033.0, 2577.0, 8856.0, 54036.0, 3771524.0, 322194.0, 24179.0, 5139.0, 1719.0, 724.0, 363.0, 195.0, 97.0, 57.0, 29.0, 20.0, 18.0, 8.0, 5.0, 1.0, 0.0, 5.0, 2.0], "bins": [-1.498046875, -1.46533203125, -1.4326171875, -1.39990234375, -1.3671875, -1.33447265625, -1.3017578125, -1.26904296875, -1.236328125, -1.20361328125, -1.1708984375, -1.13818359375, -1.10546875, -1.07275390625, -1.0400390625, -1.00732421875, -0.974609375, -0.94189453125, -0.9091796875, -0.87646484375, -0.84375, -0.81103515625, -0.7783203125, -0.74560546875, -0.712890625, -0.68017578125, -0.6474609375, -0.61474609375, -0.58203125, -0.54931640625, -0.5166015625, -0.48388671875, -0.451171875, -0.41845703125, -0.3857421875, -0.35302734375, -0.3203125, -0.28759765625, -0.2548828125, -0.22216796875, -0.189453125, -0.15673828125, -0.1240234375, -0.09130859375, -0.05859375, -0.02587890625, 0.0068359375, 0.03955078125, 0.072265625, 0.10498046875, 0.1376953125, 0.17041015625, 0.203125, 0.23583984375, 0.2685546875, 0.30126953125, 0.333984375, 0.36669921875, 0.3994140625, 0.43212890625, 0.46484375, 0.49755859375, 0.5302734375, 0.56298828125, 0.595703125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 11.0, 29.0, 42.0, 76.0, 99.0, 96.0, 107.0, 126.0, 100.0, 82.0, 89.0, 47.0, 25.0, 22.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.364990234375, -0.3570709228515625, -0.349151611328125, -0.3412322998046875, -0.33331298828125, -0.3253936767578125, -0.317474365234375, -0.3095550537109375, -0.3016357421875, -0.2937164306640625, -0.285797119140625, -0.2778778076171875, -0.26995849609375, -0.2620391845703125, -0.254119873046875, -0.2462005615234375, -0.23828125, -0.2303619384765625, -0.222442626953125, -0.2145233154296875, -0.20660400390625, -0.1986846923828125, -0.190765380859375, -0.1828460693359375, -0.1749267578125, -0.1670074462890625, -0.159088134765625, -0.1511688232421875, -0.14324951171875, -0.1353302001953125, -0.127410888671875, -0.1194915771484375, -0.111572265625, -0.1036529541015625, -0.095733642578125, -0.0878143310546875, -0.07989501953125, -0.0719757080078125, -0.064056396484375, -0.0561370849609375, -0.0482177734375, -0.0402984619140625, -0.032379150390625, -0.0244598388671875, -0.01654052734375, -0.0086212158203125, -0.000701904296875, 0.0072174072265625, 0.01513671875, 0.0230560302734375, 0.030975341796875, 0.0388946533203125, 0.04681396484375, 0.0547332763671875, 0.062652587890625, 0.0705718994140625, 0.0784912109375, 0.0864105224609375, 0.094329833984375, 0.1022491455078125, 0.11016845703125, 0.1180877685546875, 0.126007080078125, 0.1339263916015625, 0.141845703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 10.0, 42.0, 46.0, 136.0, 245.0, 549.0, 2116.0, 30431.0, 4116669.0, 40785.0, 2206.0, 603.0, 267.0, 94.0, 39.0, 18.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.46484375, -1.41839599609375, -1.3719482421875, -1.32550048828125, -1.279052734375, -1.23260498046875, -1.1861572265625, -1.13970947265625, -1.09326171875, -1.04681396484375, -1.0003662109375, -0.95391845703125, -0.907470703125, -0.86102294921875, -0.8145751953125, -0.76812744140625, -0.7216796875, -0.67523193359375, -0.6287841796875, -0.58233642578125, -0.535888671875, -0.48944091796875, -0.4429931640625, -0.39654541015625, -0.35009765625, -0.30364990234375, -0.2572021484375, -0.21075439453125, -0.164306640625, -0.11785888671875, -0.0714111328125, -0.02496337890625, 0.021484375, 0.06793212890625, 0.1143798828125, 0.16082763671875, 0.207275390625, 0.25372314453125, 0.3001708984375, 0.34661865234375, 0.39306640625, 0.43951416015625, 0.4859619140625, 0.53240966796875, 0.578857421875, 0.62530517578125, 0.6717529296875, 0.71820068359375, 0.7646484375, 0.81109619140625, 0.8575439453125, 0.90399169921875, 0.950439453125, 0.99688720703125, 1.0433349609375, 1.08978271484375, 1.13623046875, 1.18267822265625, 1.2291259765625, 1.27557373046875, 1.322021484375, 1.36846923828125, 1.4149169921875, 1.46136474609375, 1.5078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 9.0, 7.0, 5.0, 13.0, 21.0, 43.0, 111.0, 347.0, 2571.0, 686.0, 146.0, 62.0, 28.0, 5.0, 14.0, 12.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.256103515625, -0.24776077270507812, -0.23941802978515625, -0.23107528686523438, -0.2227325439453125, -0.21438980102539062, -0.20604705810546875, -0.19770431518554688, -0.189361572265625, -0.18101882934570312, -0.17267608642578125, -0.16433334350585938, -0.1559906005859375, -0.14764785766601562, -0.13930511474609375, -0.13096237182617188, -0.12261962890625, -0.11427688598632812, -0.10593414306640625, -0.09759140014648438, -0.0892486572265625, -0.08090591430664062, -0.07256317138671875, -0.06422042846679688, -0.055877685546875, -0.047534942626953125, -0.03919219970703125, -0.030849456787109375, -0.0225067138671875, -0.014163970947265625, -0.00582122802734375, 0.002521514892578125, 0.0108642578125, 0.019207000732421875, 0.02754974365234375, 0.035892486572265625, 0.0442352294921875, 0.052577972412109375, 0.06092071533203125, 0.06926345825195312, 0.077606201171875, 0.08594894409179688, 0.09429168701171875, 0.10263442993164062, 0.1109771728515625, 0.11931991577148438, 0.12766265869140625, 0.13600540161132812, 0.14434814453125, 0.15269088745117188, 0.16103363037109375, 0.16937637329101562, 0.1777191162109375, 0.18606185913085938, 0.19440460205078125, 0.20274734497070312, 0.211090087890625, 0.21943283081054688, 0.22777557373046875, 0.23611831665039062, 0.2444610595703125, 0.2528038024902344, 0.26114654541015625, 0.2694892883300781, 0.27783203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 10.0, 14.0, 90.0, 527.0, 329.0, 28.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.754229545593262, -4.660699844360352, -4.5671706199646, -4.4736409187316895, -4.3801116943359375, -4.286581993103027, -4.193052768707275, -4.099523067474365, -4.005993843078613, -3.9124643802642822, -3.818934917449951, -3.72540545463562, -3.631875991821289, -3.538346529006958, -3.444817066192627, -3.351287603378296, -3.257758140563965, -3.164228677749634, -3.0706992149353027, -2.9771697521209717, -2.8836402893066406, -2.7901108264923096, -2.6965813636779785, -2.6030519008636475, -2.5095221996307373, -2.4159927368164062, -2.322463274002075, -2.228933811187744, -2.135404348373413, -2.041874885559082, -1.948345422744751, -1.85481595993042, -1.7612864971160889, -1.6677570343017578, -1.5742275714874268, -1.4806981086730957, -1.3871686458587646, -1.2936391830444336, -1.2001097202301025, -1.1065802574157715, -1.0130507946014404, -0.9195213317871094, -0.8259918689727783, -0.7324624061584473, -0.6389329433441162, -0.5454034805297852, -0.4518739581108093, -0.35834449529647827, -0.26481497287750244, -0.1712855100631714, -0.07775603234767914, 0.01577344536781311, 0.10930290818214417, 0.20283237099647522, 0.29636186361312866, 0.3898913264274597, 0.48342078924179077, 0.5769502520561218, 0.6704797148704529, 0.7640092372894287, 0.8575387001037598, 0.9510681629180908, 1.0445976257324219, 1.138127088546753, 1.231656551361084]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 6.0, 15.0, 18.0, 14.0, 24.0, 29.0, 25.0, 25.0, 45.0, 47.0, 63.0, 62.0, 52.0, 64.0, 53.0, 60.0, 59.0, 37.0, 51.0, 32.0, 36.0, 35.0, 36.0, 20.0, 15.0, 14.0, 9.0, 3.0, 10.0, 7.0, 8.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5759319067001343, -0.5590312480926514, -0.5421305298805237, -0.5252298712730408, -0.5083291530609131, -0.4914284944534302, -0.4745278060436249, -0.4576271176338196, -0.4407264292240143, -0.423825740814209, -0.4069250524044037, -0.3900243639945984, -0.3731237053871155, -0.3562229871749878, -0.3393223285675049, -0.3224216401576996, -0.3055209517478943, -0.288620263338089, -0.2717195749282837, -0.2548188865184784, -0.2379182130098343, -0.221017524600029, -0.2041168510913849, -0.1872161626815796, -0.1703154742717743, -0.153414785861969, -0.1365140974521637, -0.11961342394351959, -0.1027127355337143, -0.085812047123909, -0.0689113661646843, -0.052010685205459595, -0.0351099967956543, -0.018209312111139297, -0.001308627426624298, 0.015592057257890701, 0.0324927419424057, 0.049393430352211, 0.0662941113114357, 0.0831947922706604, 0.1000954806804657, 0.116996169090271, 0.1338968575000763, 0.1507975310087204, 0.1676982194185257, 0.184598907828331, 0.2014995813369751, 0.2184002697467804, 0.2353009581565857, 0.252201646566391, 0.2691023349761963, 0.2860030233860016, 0.3029037117958069, 0.3198043704032898, 0.3367050588130951, 0.3536057472229004, 0.3705064356327057, 0.387407124042511, 0.4043078124523163, 0.4212085008621216, 0.4381091594696045, 0.4550098776817322, 0.4719105362892151, 0.4888112246990204, 0.5057119131088257]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 8.0, 16.0, 24.0, 33.0, 45.0, 64.0, 109.0, 182.0, 326.0, 728.0, 1666.0, 5611.0, 30722.0, 406472.0, 551782.0, 40587.0, 6510.0, 1963.0, 802.0, 361.0, 202.0, 108.0, 60.0, 55.0, 35.0, 24.0, 12.0, 14.0, 6.0, 10.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9697265625, -0.9420700073242188, -0.9144134521484375, -0.8867568969726562, -0.859100341796875, -0.8314437866210938, -0.8037872314453125, -0.7761306762695312, -0.74847412109375, -0.7208175659179688, -0.6931610107421875, -0.6655044555664062, -0.637847900390625, -0.6101913452148438, -0.5825347900390625, -0.5548782348632812, -0.5272216796875, -0.49956512451171875, -0.4719085693359375, -0.44425201416015625, -0.416595458984375, -0.38893890380859375, -0.3612823486328125, -0.33362579345703125, -0.30596923828125, -0.27831268310546875, -0.2506561279296875, -0.22299957275390625, -0.195343017578125, -0.16768646240234375, -0.1400299072265625, -0.11237335205078125, -0.084716796875, -0.05706024169921875, -0.0294036865234375, -0.00174713134765625, 0.025909423828125, 0.05356597900390625, 0.0812225341796875, 0.10887908935546875, 0.13653564453125, 0.16419219970703125, 0.1918487548828125, 0.21950531005859375, 0.247161865234375, 0.27481842041015625, 0.3024749755859375, 0.33013153076171875, 0.3577880859375, 0.38544464111328125, 0.4131011962890625, 0.44075775146484375, 0.468414306640625, 0.49607086181640625, 0.5237274169921875, 0.5513839721679688, 0.57904052734375, 0.6066970825195312, 0.6343536376953125, 0.6620101928710938, 0.689666748046875, 0.7173233032226562, 0.7449798583984375, 0.7726364135742188, 0.80029296875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 11.0, 19.0, 39.0, 54.0, 77.0, 83.0, 114.0, 113.0, 106.0, 101.0, 72.0, 77.0, 44.0, 33.0, 20.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.3544921875, -0.346588134765625, -0.33868408203125, -0.330780029296875, -0.3228759765625, -0.314971923828125, -0.30706787109375, -0.299163818359375, -0.291259765625, -0.283355712890625, -0.27545166015625, -0.267547607421875, -0.2596435546875, -0.251739501953125, -0.24383544921875, -0.235931396484375, -0.22802734375, -0.220123291015625, -0.21221923828125, -0.204315185546875, -0.1964111328125, -0.188507080078125, -0.18060302734375, -0.172698974609375, -0.164794921875, -0.156890869140625, -0.14898681640625, -0.141082763671875, -0.1331787109375, -0.125274658203125, -0.11737060546875, -0.109466552734375, -0.1015625, -0.093658447265625, -0.08575439453125, -0.077850341796875, -0.0699462890625, -0.062042236328125, -0.05413818359375, -0.046234130859375, -0.038330078125, -0.030426025390625, -0.02252197265625, -0.014617919921875, -0.0067138671875, 0.001190185546875, 0.00909423828125, 0.016998291015625, 0.02490234375, 0.032806396484375, 0.04071044921875, 0.048614501953125, 0.0565185546875, 0.064422607421875, 0.07232666015625, 0.080230712890625, 0.088134765625, 0.096038818359375, 0.10394287109375, 0.111846923828125, 0.1197509765625, 0.127655029296875, 0.13555908203125, 0.143463134765625, 0.1513671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 13.0, 20.0, 30.0, 51.0, 82.0, 163.0, 358.0, 861.0, 2932.0, 14276.0, 166386.0, 790330.0, 62244.0, 7750.0, 1852.0, 636.0, 246.0, 127.0, 62.0, 39.0, 21.0, 13.0, 10.0, 9.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.021484375, -0.9948348999023438, -0.9681854248046875, -0.9415359497070312, -0.914886474609375, -0.8882369995117188, -0.8615875244140625, -0.8349380493164062, -0.80828857421875, -0.7816390991210938, -0.7549896240234375, -0.7283401489257812, -0.701690673828125, -0.6750411987304688, -0.6483917236328125, -0.6217422485351562, -0.5950927734375, -0.5684432983398438, -0.5417938232421875, -0.5151443481445312, -0.488494873046875, -0.46184539794921875, -0.4351959228515625, -0.40854644775390625, -0.38189697265625, -0.35524749755859375, -0.3285980224609375, -0.30194854736328125, -0.275299072265625, -0.24864959716796875, -0.2220001220703125, -0.19535064697265625, -0.168701171875, -0.14205169677734375, -0.1154022216796875, -0.08875274658203125, -0.062103271484375, -0.03545379638671875, -0.0088043212890625, 0.01784515380859375, 0.04449462890625, 0.07114410400390625, 0.0977935791015625, 0.12444305419921875, 0.151092529296875, 0.17774200439453125, 0.2043914794921875, 0.23104095458984375, 0.2576904296875, 0.28433990478515625, 0.3109893798828125, 0.33763885498046875, 0.364288330078125, 0.39093780517578125, 0.4175872802734375, 0.44423675537109375, 0.47088623046875, 0.49753570556640625, 0.5241851806640625, 0.5508346557617188, 0.577484130859375, 0.6041336059570312, 0.6307830810546875, 0.6574325561523438, 0.68408203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 18.0, 15.0, 22.0, 33.0, 34.0, 61.0, 51.0, 63.0, 72.0, 78.0, 75.0, 94.0, 87.0, 50.0, 52.0, 41.0, 38.0, 21.0, 25.0, 10.0, 10.0, 7.0, 8.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.99755859375, -0.9715118408203125, -0.945465087890625, -0.9194183349609375, -0.89337158203125, -0.8673248291015625, -0.841278076171875, -0.8152313232421875, -0.7891845703125, -0.7631378173828125, -0.737091064453125, -0.7110443115234375, -0.68499755859375, -0.6589508056640625, -0.632904052734375, -0.6068572998046875, -0.580810546875, -0.5547637939453125, -0.528717041015625, -0.5026702880859375, -0.47662353515625, -0.4505767822265625, -0.424530029296875, -0.3984832763671875, -0.3724365234375, -0.3463897705078125, -0.320343017578125, -0.2942962646484375, -0.26824951171875, -0.2422027587890625, -0.216156005859375, -0.1901092529296875, -0.1640625, -0.1380157470703125, -0.111968994140625, -0.0859222412109375, -0.05987548828125, -0.0338287353515625, -0.007781982421875, 0.0182647705078125, 0.0443115234375, 0.0703582763671875, 0.096405029296875, 0.1224517822265625, 0.14849853515625, 0.1745452880859375, 0.200592041015625, 0.2266387939453125, 0.252685546875, 0.2787322998046875, 0.304779052734375, 0.3308258056640625, 0.35687255859375, 0.3829193115234375, 0.408966064453125, 0.4350128173828125, 0.4610595703125, 0.4871063232421875, 0.513153076171875, 0.5391998291015625, 0.56524658203125, 0.5912933349609375, 0.617340087890625, 0.6433868408203125, 0.66943359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 10.0, 13.0, 14.0, 45.0, 59.0, 155.0, 327.0, 830.0, 3206.0, 24965.0, 657966.0, 343261.0, 14333.0, 2206.0, 636.0, 248.0, 119.0, 64.0, 36.0, 23.0, 8.0, 8.0, 7.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.474853515625, -0.46378135681152344, -0.4527091979980469, -0.4416370391845703, -0.43056488037109375, -0.4194927215576172, -0.4084205627441406, -0.39734840393066406, -0.3862762451171875, -0.37520408630371094, -0.3641319274902344, -0.3530597686767578, -0.34198760986328125, -0.3309154510498047, -0.3198432922363281, -0.30877113342285156, -0.297698974609375, -0.28662681579589844, -0.2755546569824219, -0.2644824981689453, -0.25341033935546875, -0.2423381805419922, -0.23126602172851562, -0.22019386291503906, -0.2091217041015625, -0.19804954528808594, -0.18697738647460938, -0.1759052276611328, -0.16483306884765625, -0.1537609100341797, -0.14268875122070312, -0.13161659240722656, -0.12054443359375, -0.10947227478027344, -0.09840011596679688, -0.08732795715332031, -0.07625579833984375, -0.06518363952636719, -0.054111480712890625, -0.04303932189941406, -0.0319671630859375, -0.020895004272460938, -0.009822845458984375, 0.0012493133544921875, 0.01232147216796875, 0.023393630981445312, 0.034465789794921875, 0.04553794860839844, 0.056610107421875, 0.06768226623535156, 0.07875442504882812, 0.08982658386230469, 0.10089874267578125, 0.11197090148925781, 0.12304306030273438, 0.13411521911621094, 0.1451873779296875, 0.15625953674316406, 0.16733169555664062, 0.1784038543701172, 0.18947601318359375, 0.2005481719970703, 0.21162033081054688, 0.22269248962402344, 0.2337646484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 21.0, 11.0, 24.0, 37.0, 47.0, 63.0, 93.0, 117.0, 144.0, 125.0, 94.0, 72.0, 43.0, 37.0, 24.0, 12.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002193450927734375, -0.00021189451217651367, -0.00020444393157958984, -0.00019699335098266602, -0.0001895427703857422, -0.00018209218978881836, -0.00017464160919189453, -0.0001671910285949707, -0.00015974044799804688, -0.00015228986740112305, -0.00014483928680419922, -0.0001373887062072754, -0.00012993812561035156, -0.00012248754501342773, -0.0001150369644165039, -0.00010758638381958008, -0.00010013580322265625, -9.268522262573242e-05, -8.52346420288086e-05, -7.778406143188477e-05, -7.033348083496094e-05, -6.288290023803711e-05, -5.543231964111328e-05, -4.798173904418945e-05, -4.0531158447265625e-05, -3.30805778503418e-05, -2.562999725341797e-05, -1.817941665649414e-05, -1.0728836059570312e-05, -3.2782554626464844e-06, 4.172325134277344e-06, 1.1622905731201172e-05, 1.9073486328125e-05, 2.6524066925048828e-05, 3.3974647521972656e-05, 4.1425228118896484e-05, 4.887580871582031e-05, 5.632638931274414e-05, 6.377696990966797e-05, 7.12275505065918e-05, 7.867813110351562e-05, 8.612871170043945e-05, 9.357929229736328e-05, 0.00010102987289428711, 0.00010848045349121094, 0.00011593103408813477, 0.0001233816146850586, 0.00013083219528198242, 0.00013828277587890625, 0.00014573335647583008, 0.0001531839370727539, 0.00016063451766967773, 0.00016808509826660156, 0.0001755356788635254, 0.00018298625946044922, 0.00019043684005737305, 0.00019788742065429688, 0.0002053380012512207, 0.00021278858184814453, 0.00022023916244506836, 0.0002276897430419922, 0.00023514032363891602, 0.00024259090423583984, 0.00025004148483276367, 0.0002574920654296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 9.0, 15.0, 21.0, 29.0, 45.0, 81.0, 160.0, 292.0, 636.0, 1443.0, 3893.0, 15761.0, 128755.0, 724536.0, 148430.0, 17272.0, 4249.0, 1508.0, 644.0, 347.0, 165.0, 91.0, 51.0, 44.0, 25.0, 11.0, 13.0, 7.0, 6.0, 3.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20214271545410156, -0.19505691528320312, -0.1879711151123047, -0.18088531494140625, -0.1737995147705078, -0.16671371459960938, -0.15962791442871094, -0.1525421142578125, -0.14545631408691406, -0.13837051391601562, -0.1312847137451172, -0.12419891357421875, -0.11711311340332031, -0.11002731323242188, -0.10294151306152344, -0.095855712890625, -0.08876991271972656, -0.08168411254882812, -0.07459831237792969, -0.06751251220703125, -0.06042671203613281, -0.053340911865234375, -0.04625511169433594, -0.0391693115234375, -0.03208351135253906, -0.024997711181640625, -0.017911911010742188, -0.01082611083984375, -0.0037403106689453125, 0.003345489501953125, 0.010431289672851562, 0.01751708984375, 0.024602890014648438, 0.031688690185546875, 0.03877449035644531, 0.04586029052734375, 0.05294609069824219, 0.060031890869140625, 0.06711769104003906, 0.0742034912109375, 0.08128929138183594, 0.08837509155273438, 0.09546089172363281, 0.10254669189453125, 0.10963249206542969, 0.11671829223632812, 0.12380409240722656, 0.130889892578125, 0.13797569274902344, 0.14506149291992188, 0.1521472930908203, 0.15923309326171875, 0.1663188934326172, 0.17340469360351562, 0.18049049377441406, 0.1875762939453125, 0.19466209411621094, 0.20174789428710938, 0.2088336944580078, 0.21591949462890625, 0.2230052947998047, 0.23009109497070312, 0.23717689514160156, 0.2442626953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 28.0, 35.0, 60.0, 119.0, 146.0, 136.0, 142.0, 121.0, 72.0, 40.0, 23.0, 17.0, 11.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2012939453125, -0.19450759887695312, -0.18772125244140625, -0.18093490600585938, -0.1741485595703125, -0.16736221313476562, -0.16057586669921875, -0.15378952026367188, -0.147003173828125, -0.14021682739257812, -0.13343048095703125, -0.12664413452148438, -0.1198577880859375, -0.11307144165039062, -0.10628509521484375, -0.09949874877929688, -0.09271240234375, -0.08592605590820312, -0.07913970947265625, -0.07235336303710938, -0.0655670166015625, -0.058780670166015625, -0.05199432373046875, -0.045207977294921875, -0.038421630859375, -0.031635284423828125, -0.02484893798828125, -0.018062591552734375, -0.0112762451171875, -0.004489898681640625, 0.00229644775390625, 0.009082794189453125, 0.015869140625, 0.022655487060546875, 0.02944183349609375, 0.036228179931640625, 0.0430145263671875, 0.049800872802734375, 0.05658721923828125, 0.06337356567382812, 0.070159912109375, 0.07694625854492188, 0.08373260498046875, 0.09051895141601562, 0.0973052978515625, 0.10409164428710938, 0.11087799072265625, 0.11766433715820312, 0.12445068359375, 0.13123703002929688, 0.13802337646484375, 0.14480972290039062, 0.1515960693359375, 0.15838241577148438, 0.16516876220703125, 0.17195510864257812, 0.178741455078125, 0.18552780151367188, 0.19231414794921875, 0.19910049438476562, 0.2058868408203125, 0.21267318725585938, 0.21945953369140625, 0.22624588012695312, 0.2330322265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 24.0, 113.0, 350.0, 324.0, 122.0, 47.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.79746150970459, -11.58298110961914, -11.368501663208008, -11.154021263122559, -10.93954086303711, -10.72506046295166, -10.510580062866211, -10.296100616455078, -10.081620216369629, -9.86713981628418, -9.652660369873047, -9.438179969787598, -9.223699569702148, -9.0092191696167, -8.79473876953125, -8.580259323120117, -8.365778923034668, -8.151298522949219, -7.936818599700928, -7.722338676452637, -7.5078582763671875, -7.293377876281738, -7.078897953033447, -6.864418029785156, -6.649937629699707, -6.435457229614258, -6.220977306365967, -6.006497383117676, -5.792016983032227, -5.577536582946777, -5.363056659698486, -5.148576736450195, -4.934096336364746, -4.719615936279297, -4.505136013031006, -4.290656089782715, -4.076175689697266, -3.8616955280303955, -3.6472153663635254, -3.4327352046966553, -3.2182552814483643, -3.003775119781494, -2.789294958114624, -2.574814796447754, -2.360334634780884, -2.1458544731140137, -1.9313743114471436, -1.7168941497802734, -1.5024139881134033, -1.2879338264465332, -1.073453664779663, -0.858973503112793, -0.6444933414459229, -0.43001317977905273, -0.21553301811218262, -0.0010528564453125, 0.21342730522155762, 0.42790746688842773, 0.6423876285552979, 0.856867790222168, 1.071347951889038, 1.2858281135559082, 1.5003082752227783, 1.7147884368896484, 1.9292685985565186]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 4.0, 3.0, 9.0, 16.0, 13.0, 19.0, 21.0, 19.0, 21.0, 24.0, 29.0, 34.0, 39.0, 54.0, 48.0, 47.0, 42.0, 53.0, 53.0, 44.0, 47.0, 56.0, 43.0, 45.0, 37.0, 38.0, 26.0, 20.0, 12.0, 18.0, 10.0, 10.0, 6.0, 11.0, 6.0, 3.0, 2.0, 7.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6948161125183105, -2.5970306396484375, -2.4992451667785645, -2.4014594554901123, -2.3036739826202393, -2.205888509750366, -2.108102798461914, -2.010317325592041, -1.912531852722168, -1.814746379852295, -1.7169607877731323, -1.6191751956939697, -1.5213897228240967, -1.4236042499542236, -1.325818657875061, -1.2280330657958984, -1.1302475929260254, -1.0324621200561523, -0.9346765279769897, -0.8368909955024719, -0.7391054630279541, -0.6413199305534363, -0.5435343980789185, -0.44574886560440063, -0.3479633331298828, -0.250177800655365, -0.15239226818084717, -0.054606735706329346, 0.04317879676818848, 0.1409643292427063, 0.23874986171722412, 0.33653539419174194, 0.43432092666625977, 0.5321064591407776, 0.6298919916152954, 0.7276775240898132, 0.825463056564331, 0.9232485890388489, 1.0210341215133667, 1.1188197135925293, 1.2166051864624023, 1.3143906593322754, 1.412176251411438, 1.5099618434906006, 1.6077473163604736, 1.7055327892303467, 1.8033183813095093, 1.9011039733886719, 1.998889446258545, 2.096674919128418, 2.194460391998291, 2.292246103286743, 2.390031576156616, 2.4878170490264893, 2.5856027603149414, 2.6833882331848145, 2.7811737060546875, 2.8789591789245605, 2.9767446517944336, 3.0745303630828857, 3.172315835952759, 3.270101308822632, 3.367887020111084, 3.465672492980957, 3.56345796585083]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 10.0, 12.0, 9.0, 8.0, 12.0, 25.0, 31.0, 47.0, 57.0, 90.0, 104.0, 166.0, 299.0, 520.0, 1062.0, 2196.0, 6392.0, 31391.0, 762183.0, 3329656.0, 46896.0, 8400.0, 2612.0, 1083.0, 482.0, 228.0, 115.0, 63.0, 44.0, 29.0, 15.0, 8.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.7333984375, -1.6940765380859375, -1.654754638671875, -1.6154327392578125, -1.57611083984375, -1.5367889404296875, -1.497467041015625, -1.4581451416015625, -1.4188232421875, -1.3795013427734375, -1.340179443359375, -1.3008575439453125, -1.26153564453125, -1.2222137451171875, -1.182891845703125, -1.1435699462890625, -1.104248046875, -1.0649261474609375, -1.025604248046875, -0.9862823486328125, -0.94696044921875, -0.9076385498046875, -0.868316650390625, -0.8289947509765625, -0.7896728515625, -0.7503509521484375, -0.711029052734375, -0.6717071533203125, -0.63238525390625, -0.5930633544921875, -0.553741455078125, -0.5144195556640625, -0.47509765625, -0.4357757568359375, -0.396453857421875, -0.3571319580078125, -0.31781005859375, -0.2784881591796875, -0.239166259765625, -0.1998443603515625, -0.1605224609375, -0.1212005615234375, -0.081878662109375, -0.0425567626953125, -0.00323486328125, 0.0360870361328125, 0.075408935546875, 0.1147308349609375, 0.154052734375, 0.1933746337890625, 0.232696533203125, 0.2720184326171875, 0.31134033203125, 0.3506622314453125, 0.389984130859375, 0.4293060302734375, 0.4686279296875, 0.5079498291015625, 0.547271728515625, 0.5865936279296875, 0.62591552734375, 0.6652374267578125, 0.704559326171875, 0.7438812255859375, 0.783203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 13.0, 18.0, 29.0, 49.0, 57.0, 94.0, 96.0, 121.0, 112.0, 102.0, 81.0, 71.0, 54.0, 47.0, 21.0, 15.0, 11.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3553581237792969, -0.34694671630859375, -0.3385353088378906, -0.3301239013671875, -0.3217124938964844, -0.31330108642578125, -0.3048896789550781, -0.296478271484375, -0.2880668640136719, -0.27965545654296875, -0.2712440490722656, -0.2628326416015625, -0.2544212341308594, -0.24600982666015625, -0.23759841918945312, -0.22918701171875, -0.22077560424804688, -0.21236419677734375, -0.20395278930664062, -0.1955413818359375, -0.18712997436523438, -0.17871856689453125, -0.17030715942382812, -0.161895751953125, -0.15348434448242188, -0.14507293701171875, -0.13666152954101562, -0.1282501220703125, -0.11983871459960938, -0.11142730712890625, -0.10301589965820312, -0.0946044921875, -0.08619308471679688, -0.07778167724609375, -0.06937026977539062, -0.0609588623046875, -0.052547454833984375, -0.04413604736328125, -0.035724639892578125, -0.027313232421875, -0.018901824951171875, -0.01049041748046875, -0.002079010009765625, 0.0063323974609375, 0.014743804931640625, 0.02315521240234375, 0.031566619873046875, 0.03997802734375, 0.048389434814453125, 0.05680084228515625, 0.06521224975585938, 0.0736236572265625, 0.08203506469726562, 0.09044647216796875, 0.09885787963867188, 0.107269287109375, 0.11568069458007812, 0.12409210205078125, 0.13250350952148438, 0.1409149169921875, 0.14932632446289062, 0.15773773193359375, 0.16614913940429688, 0.174560546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 7.0, 17.0, 14.0, 29.0, 31.0, 38.0, 92.0, 176.0, 367.0, 888.0, 2922.0, 18616.0, 4103116.0, 62271.0, 4185.0, 951.0, 305.0, 118.0, 56.0, 36.0, 20.0, 8.0, 5.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.9110565185546875, -2.835784912109375, -2.7605133056640625, -2.68524169921875, -2.6099700927734375, -2.534698486328125, -2.4594268798828125, -2.3841552734375, -2.3088836669921875, -2.233612060546875, -2.1583404541015625, -2.08306884765625, -2.0077972412109375, -1.932525634765625, -1.8572540283203125, -1.781982421875, -1.7067108154296875, -1.631439208984375, -1.5561676025390625, -1.48089599609375, -1.4056243896484375, -1.330352783203125, -1.2550811767578125, -1.1798095703125, -1.1045379638671875, -1.029266357421875, -0.9539947509765625, -0.87872314453125, -0.8034515380859375, -0.728179931640625, -0.6529083251953125, -0.57763671875, -0.5023651123046875, -0.427093505859375, -0.3518218994140625, -0.27655029296875, -0.2012786865234375, -0.126007080078125, -0.0507354736328125, 0.0245361328125, 0.0998077392578125, 0.175079345703125, 0.2503509521484375, 0.32562255859375, 0.4008941650390625, 0.476165771484375, 0.5514373779296875, 0.626708984375, 0.7019805908203125, 0.777252197265625, 0.8525238037109375, 0.92779541015625, 1.0030670166015625, 1.078338623046875, 1.1536102294921875, 1.2288818359375, 1.3041534423828125, 1.379425048828125, 1.4546966552734375, 1.52996826171875, 1.6052398681640625, 1.680511474609375, 1.7557830810546875, 1.8310546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 6.0, 7.0, 25.0, 32.0, 93.0, 421.0, 3057.0, 317.0, 63.0, 26.0, 4.0, 5.0, 4.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4033203125, -1.37548828125, -1.34765625, -1.31982421875, -1.2919921875, -1.26416015625, -1.236328125, -1.20849609375, -1.1806640625, -1.15283203125, -1.125, -1.09716796875, -1.0693359375, -1.04150390625, -1.013671875, -0.98583984375, -0.9580078125, -0.93017578125, -0.90234375, -0.87451171875, -0.8466796875, -0.81884765625, -0.791015625, -0.76318359375, -0.7353515625, -0.70751953125, -0.6796875, -0.65185546875, -0.6240234375, -0.59619140625, -0.568359375, -0.54052734375, -0.5126953125, -0.48486328125, -0.45703125, -0.42919921875, -0.4013671875, -0.37353515625, -0.345703125, -0.31787109375, -0.2900390625, -0.26220703125, -0.234375, -0.20654296875, -0.1787109375, -0.15087890625, -0.123046875, -0.09521484375, -0.0673828125, -0.03955078125, -0.01171875, 0.01611328125, 0.0439453125, 0.07177734375, 0.099609375, 0.12744140625, 0.1552734375, 0.18310546875, 0.2109375, 0.23876953125, 0.2666015625, 0.29443359375, 0.322265625, 0.35009765625, 0.3779296875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 15.0, 40.0, 102.0, 289.0, 297.0, 159.0, 49.0, 18.0, 8.0, 3.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7295894622802734, -3.623584032058716, -3.517578601837158, -3.4115729331970215, -3.305567502975464, -3.1995620727539062, -3.0935564041137695, -2.987550973892212, -2.8815455436706543, -2.7755401134490967, -2.669534683227539, -2.5635290145874023, -2.4575235843658447, -2.351518154144287, -2.2455124855041504, -2.1395070552825928, -2.033501625061035, -1.9274961948394775, -1.8214906454086304, -1.7154850959777832, -1.6094796657562256, -1.503474235534668, -1.3974686861038208, -1.2914631366729736, -1.185457706451416, -1.0794522762298584, -0.9734467267990112, -0.8674412369728088, -0.7614357471466064, -0.655430257320404, -0.5494247674942017, -0.44341927766799927, -0.3374135494232178, -0.23140805959701538, -0.125402569770813, -0.019397079944610596, 0.0866084098815918, 0.1926138997077942, 0.2986193895339966, 0.404624879360199, 0.5106303691864014, 0.6166358590126038, 0.7226413488388062, 0.8286468386650085, 0.9346523284912109, 1.0406577587127686, 1.1466633081436157, 1.252668857574463, 1.3586742877960205, 1.4646797180175781, 1.5706852674484253, 1.6766908168792725, 1.78269624710083, 1.8887016773223877, 1.9947072267532349, 2.100712776184082, 2.2067182064056396, 2.3127236366271973, 2.418729305267334, 2.5247347354888916, 2.630740165710449, 2.736745595932007, 2.8427510261535645, 2.948756694793701, 3.054762125015259]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 15.0, 20.0, 40.0, 72.0, 108.0, 139.0, 155.0, 168.0, 129.0, 79.0, 42.0, 22.0, 6.0, 9.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.620720863342285, -4.48499870300293, -4.349277019500732, -4.213555335998535, -4.07783317565918, -3.9421112537384033, -3.806389331817627, -3.6706674098968506, -3.534945487976074, -3.399223566055298, -3.2635016441345215, -3.127779722213745, -2.9920578002929688, -2.8563358783721924, -2.720613956451416, -2.5848920345306396, -2.4491701126098633, -2.313448190689087, -2.1777262687683105, -2.042004346847534, -1.9062824249267578, -1.7705605030059814, -1.634838581085205, -1.4991166591644287, -1.3633947372436523, -1.227672815322876, -1.0919508934020996, -0.9562289714813232, -0.8205070495605469, -0.6847851276397705, -0.5490632057189941, -0.4133412837982178, -0.2776193618774414, -0.14189743995666504, -0.006175518035888672, 0.1295464038848877, 0.26526832580566406, 0.40099024772644043, 0.5367121696472168, 0.6724340915679932, 0.8081560134887695, 0.9438779354095459, 1.0795998573303223, 1.2153217792510986, 1.351043701171875, 1.4867656230926514, 1.6224875450134277, 1.758209466934204, 1.8939313888549805, 2.029653310775757, 2.165375232696533, 2.3010971546173096, 2.436819076538086, 2.5725409984588623, 2.7082629203796387, 2.843984842300415, 2.9797067642211914, 3.1154286861419678, 3.251150608062744, 3.3868725299835205, 3.522594451904297, 3.6583163738250732, 3.7940382957458496, 3.929760217666626, 4.065482139587402]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 11.0, 21.0, 33.0, 29.0, 80.0, 106.0, 150.0, 216.0, 377.0, 699.0, 1444.0, 4138.0, 19291.0, 191988.0, 731609.0, 82082.0, 10860.0, 2765.0, 1125.0, 600.0, 301.0, 196.0, 127.0, 80.0, 59.0, 32.0, 24.0, 22.0, 18.0, 7.0, 6.0, 11.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.94384765625, -0.9171371459960938, -0.8904266357421875, -0.8637161254882812, -0.837005615234375, -0.8102951049804688, -0.7835845947265625, -0.7568740844726562, -0.73016357421875, -0.7034530639648438, -0.6767425537109375, -0.6500320434570312, -0.623321533203125, -0.5966110229492188, -0.5699005126953125, -0.5431900024414062, -0.5164794921875, -0.48976898193359375, -0.4630584716796875, -0.43634796142578125, -0.409637451171875, -0.38292694091796875, -0.3562164306640625, -0.32950592041015625, -0.30279541015625, -0.27608489990234375, -0.2493743896484375, -0.22266387939453125, -0.195953369140625, -0.16924285888671875, -0.1425323486328125, -0.11582183837890625, -0.089111328125, -0.06240081787109375, -0.0356903076171875, -0.00897979736328125, 0.017730712890625, 0.04444122314453125, 0.0711517333984375, 0.09786224365234375, 0.12457275390625, 0.15128326416015625, 0.1779937744140625, 0.20470428466796875, 0.231414794921875, 0.25812530517578125, 0.2848358154296875, 0.31154632568359375, 0.3382568359375, 0.36496734619140625, 0.3916778564453125, 0.41838836669921875, 0.445098876953125, 0.47180938720703125, 0.4985198974609375, 0.5252304077148438, 0.55194091796875, 0.5786514282226562, 0.6053619384765625, 0.6320724487304688, 0.658782958984375, 0.6854934692382812, 0.7122039794921875, 0.7389144897460938, 0.765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 14.0, 34.0, 64.0, 100.0, 118.0, 124.0, 135.0, 122.0, 108.0, 81.0, 42.0, 27.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.4297676086425781, -0.41910552978515625, -0.4084434509277344, -0.3977813720703125, -0.3871192932128906, -0.37645721435546875, -0.3657951354980469, -0.355133056640625, -0.3444709777832031, -0.33380889892578125, -0.3231468200683594, -0.3124847412109375, -0.3018226623535156, -0.29116058349609375, -0.2804985046386719, -0.26983642578125, -0.2591743469238281, -0.24851226806640625, -0.23785018920898438, -0.2271881103515625, -0.21652603149414062, -0.20586395263671875, -0.19520187377929688, -0.184539794921875, -0.17387771606445312, -0.16321563720703125, -0.15255355834960938, -0.1418914794921875, -0.13122940063476562, -0.12056732177734375, -0.10990524291992188, -0.0992431640625, -0.08858108520507812, -0.07791900634765625, -0.06725692749023438, -0.0565948486328125, -0.045932769775390625, -0.03527069091796875, -0.024608612060546875, -0.013946533203125, -0.003284454345703125, 0.00737762451171875, 0.018039703369140625, 0.0287017822265625, 0.039363861083984375, 0.05002593994140625, 0.060688018798828125, 0.07135009765625, 0.08201217651367188, 0.09267425537109375, 0.10333633422851562, 0.1139984130859375, 0.12466049194335938, 0.13532257080078125, 0.14598464965820312, 0.156646728515625, 0.16730880737304688, 0.17797088623046875, 0.18863296508789062, 0.1992950439453125, 0.20995712280273438, 0.22061920166015625, 0.23128128051757812, 0.241943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 8.0, 7.0, 9.0, 10.0, 19.0, 23.0, 31.0, 39.0, 50.0, 102.0, 126.0, 244.0, 338.0, 651.0, 1249.0, 2422.0, 5140.0, 11745.0, 29731.0, 85057.0, 274067.0, 407830.0, 148878.0, 48188.0, 18120.0, 7442.0, 3299.0, 1628.0, 821.0, 494.0, 274.0, 158.0, 90.0, 68.0, 49.0, 41.0, 24.0, 21.0, 13.0, 11.0, 7.0, 7.0, 3.0, 6.0, 7.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.278076171875, -0.2694511413574219, -0.26082611083984375, -0.2522010803222656, -0.2435760498046875, -0.23495101928710938, -0.22632598876953125, -0.21770095825195312, -0.209075927734375, -0.20045089721679688, -0.19182586669921875, -0.18320083618164062, -0.1745758056640625, -0.16595077514648438, -0.15732574462890625, -0.14870071411132812, -0.14007568359375, -0.13145065307617188, -0.12282562255859375, -0.11420059204101562, -0.1055755615234375, -0.09695053100585938, -0.08832550048828125, -0.07970046997070312, -0.071075439453125, -0.062450408935546875, -0.05382537841796875, -0.045200347900390625, -0.0365753173828125, -0.027950286865234375, -0.01932525634765625, -0.010700225830078125, -0.0020751953125, 0.006549835205078125, 0.01517486572265625, 0.023799896240234375, 0.0324249267578125, 0.041049957275390625, 0.04967498779296875, 0.058300018310546875, 0.066925048828125, 0.07555007934570312, 0.08417510986328125, 0.09280014038085938, 0.1014251708984375, 0.11005020141601562, 0.11867523193359375, 0.12730026245117188, 0.13592529296875, 0.14455032348632812, 0.15317535400390625, 0.16180038452148438, 0.1704254150390625, 0.17905044555664062, 0.18767547607421875, 0.19630050659179688, 0.204925537109375, 0.21355056762695312, 0.22217559814453125, 0.23080062866210938, 0.2394256591796875, 0.24805068969726562, 0.25667572021484375, 0.2653007507324219, 0.27392578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 14.0, 9.0, 11.0, 16.0, 13.0, 18.0, 23.0, 15.0, 26.0, 30.0, 32.0, 48.0, 27.0, 37.0, 53.0, 43.0, 53.0, 50.0, 47.0, 31.0, 34.0, 34.0, 51.0, 32.0, 33.0, 35.0, 24.0, 23.0, 27.0, 21.0, 15.0, 11.0, 8.0, 5.0, 10.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.483154296875, -0.4691314697265625, -0.455108642578125, -0.4410858154296875, -0.42706298828125, -0.4130401611328125, -0.399017333984375, -0.3849945068359375, -0.3709716796875, -0.3569488525390625, -0.342926025390625, -0.3289031982421875, -0.31488037109375, -0.3008575439453125, -0.286834716796875, -0.2728118896484375, -0.2587890625, -0.2447662353515625, -0.230743408203125, -0.2167205810546875, -0.20269775390625, -0.1886749267578125, -0.174652099609375, -0.1606292724609375, -0.1466064453125, -0.1325836181640625, -0.118560791015625, -0.1045379638671875, -0.09051513671875, -0.0764923095703125, -0.062469482421875, -0.0484466552734375, -0.034423828125, -0.0204010009765625, -0.006378173828125, 0.0076446533203125, 0.02166748046875, 0.0356903076171875, 0.049713134765625, 0.0637359619140625, 0.0777587890625, 0.0917816162109375, 0.105804443359375, 0.1198272705078125, 0.13385009765625, 0.1478729248046875, 0.161895751953125, 0.1759185791015625, 0.18994140625, 0.2039642333984375, 0.217987060546875, 0.2320098876953125, 0.24603271484375, 0.2600555419921875, 0.274078369140625, 0.2881011962890625, 0.3021240234375, 0.3161468505859375, 0.330169677734375, 0.3441925048828125, 0.35821533203125, 0.3722381591796875, 0.386260986328125, 0.4002838134765625, 0.414306640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 21.0, 20.0, 28.0, 38.0, 56.0, 112.0, 161.0, 298.0, 625.0, 1429.0, 4028.0, 15148.0, 79477.0, 474381.0, 393613.0, 61034.0, 12310.0, 3314.0, 1244.0, 543.0, 250.0, 150.0, 92.0, 64.0, 26.0, 20.0, 14.0, 9.0, 5.0, 3.0, 9.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1937255859375, -0.18833351135253906, -0.18294143676757812, -0.1775493621826172, -0.17215728759765625, -0.1667652130126953, -0.16137313842773438, -0.15598106384277344, -0.1505889892578125, -0.14519691467285156, -0.13980484008789062, -0.1344127655029297, -0.12902069091796875, -0.12362861633300781, -0.11823654174804688, -0.11284446716308594, -0.107452392578125, -0.10206031799316406, -0.09666824340820312, -0.09127616882324219, -0.08588409423828125, -0.08049201965332031, -0.07509994506835938, -0.06970787048339844, -0.0643157958984375, -0.05892372131347656, -0.053531646728515625, -0.04813957214355469, -0.04274749755859375, -0.03735542297363281, -0.031963348388671875, -0.026571273803710938, -0.02117919921875, -0.015787124633789062, -0.010395050048828125, -0.0050029754638671875, 0.00038909912109375, 0.0057811737060546875, 0.011173248291015625, 0.016565322875976562, 0.0219573974609375, 0.027349472045898438, 0.032741546630859375, 0.03813362121582031, 0.04352569580078125, 0.04891777038574219, 0.054309844970703125, 0.05970191955566406, 0.065093994140625, 0.07048606872558594, 0.07587814331054688, 0.08127021789550781, 0.08666229248046875, 0.09205436706542969, 0.09744644165039062, 0.10283851623535156, 0.1082305908203125, 0.11362266540527344, 0.11901473999023438, 0.12440681457519531, 0.12979888916015625, 0.1351909637451172, 0.14058303833007812, 0.14597511291503906, 0.1513671875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 12.0, 7.0, 12.0, 13.0, 30.0, 22.0, 50.0, 44.0, 69.0, 71.0, 104.0, 116.0, 103.0, 78.0, 69.0, 49.0, 38.0, 22.0, 17.0, 21.0, 7.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001614093780517578, -0.0001561492681503296, -0.00015088915824890137, -0.00014562904834747314, -0.00014036893844604492, -0.0001351088285446167, -0.00012984871864318848, -0.00012458860874176025, -0.00011932849884033203, -0.00011406838893890381, -0.00010880827903747559, -0.00010354816913604736, -9.828805923461914e-05, -9.302794933319092e-05, -8.77678394317627e-05, -8.250772953033447e-05, -7.724761962890625e-05, -7.198750972747803e-05, -6.67273998260498e-05, -6.146728992462158e-05, -5.620718002319336e-05, -5.094707012176514e-05, -4.5686960220336914e-05, -4.042685031890869e-05, -3.516674041748047e-05, -2.9906630516052246e-05, -2.4646520614624023e-05, -1.93864107131958e-05, -1.4126300811767578e-05, -8.866190910339355e-06, -3.606081008911133e-06, 1.6540288925170898e-06, 6.9141387939453125e-06, 1.2174248695373535e-05, 1.7434358596801758e-05, 2.269446849822998e-05, 2.7954578399658203e-05, 3.3214688301086426e-05, 3.847479820251465e-05, 4.373490810394287e-05, 4.8995018005371094e-05, 5.4255127906799316e-05, 5.951523780822754e-05, 6.477534770965576e-05, 7.003545761108398e-05, 7.529556751251221e-05, 8.055567741394043e-05, 8.581578731536865e-05, 9.107589721679688e-05, 9.63360071182251e-05, 0.00010159611701965332, 0.00010685622692108154, 0.00011211633682250977, 0.00011737644672393799, 0.0001226365566253662, 0.00012789666652679443, 0.00013315677642822266, 0.00013841688632965088, 0.0001436769962310791, 0.00014893710613250732, 0.00015419721603393555, 0.00015945732593536377, 0.000164717435836792, 0.00016997754573822021, 0.00017523765563964844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 10.0, 11.0, 9.0, 21.0, 26.0, 41.0, 44.0, 56.0, 104.0, 163.0, 246.0, 377.0, 789.0, 1296.0, 2456.0, 5540.0, 14503.0, 47602.0, 205329.0, 494967.0, 202286.0, 47179.0, 14448.0, 5588.0, 2415.0, 1229.0, 654.0, 406.0, 257.0, 142.0, 109.0, 82.0, 48.0, 34.0, 27.0, 14.0, 10.0, 8.0, 6.0, 11.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1253662109375, -0.12138557434082031, -0.11740493774414062, -0.11342430114746094, -0.10944366455078125, -0.10546302795410156, -0.10148239135742188, -0.09750175476074219, -0.0935211181640625, -0.08954048156738281, -0.08555984497070312, -0.08157920837402344, -0.07759857177734375, -0.07361793518066406, -0.06963729858398438, -0.06565666198730469, -0.061676025390625, -0.05769538879394531, -0.053714752197265625, -0.04973411560058594, -0.04575347900390625, -0.04177284240722656, -0.037792205810546875, -0.03381156921386719, -0.0298309326171875, -0.025850296020507812, -0.021869659423828125, -0.017889022827148438, -0.01390838623046875, -0.009927749633789062, -0.005947113037109375, -0.0019664764404296875, 0.00201416015625, 0.0059947967529296875, 0.009975433349609375, 0.013956069946289062, 0.01793670654296875, 0.021917343139648438, 0.025897979736328125, 0.029878616333007812, 0.0338592529296875, 0.03783988952636719, 0.041820526123046875, 0.04580116271972656, 0.04978179931640625, 0.05376243591308594, 0.057743072509765625, 0.06172370910644531, 0.065704345703125, 0.06968498229980469, 0.07366561889648438, 0.07764625549316406, 0.08162689208984375, 0.08560752868652344, 0.08958816528320312, 0.09356880187988281, 0.0975494384765625, 0.10153007507324219, 0.10551071166992188, 0.10949134826660156, 0.11347198486328125, 0.11745262145996094, 0.12143325805664062, 0.1254138946533203, 0.12939453125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 6.0, 8.0, 10.0, 15.0, 11.0, 18.0, 41.0, 44.0, 66.0, 70.0, 90.0, 113.0, 140.0, 80.0, 80.0, 47.0, 37.0, 35.0, 26.0, 16.0, 14.0, 12.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.123291015625, -0.11836624145507812, -0.11344146728515625, -0.10851669311523438, -0.1035919189453125, -0.09866714477539062, -0.09374237060546875, -0.08881759643554688, -0.083892822265625, -0.07896804809570312, -0.07404327392578125, -0.06911849975585938, -0.0641937255859375, -0.059268951416015625, -0.05434417724609375, -0.049419403076171875, -0.04449462890625, -0.039569854736328125, -0.03464508056640625, -0.029720306396484375, -0.0247955322265625, -0.019870758056640625, -0.01494598388671875, -0.010021209716796875, -0.005096435546875, -0.000171661376953125, 0.00475311279296875, 0.009677886962890625, 0.0146026611328125, 0.019527435302734375, 0.02445220947265625, 0.029376983642578125, 0.0343017578125, 0.039226531982421875, 0.04415130615234375, 0.049076080322265625, 0.0540008544921875, 0.058925628662109375, 0.06385040283203125, 0.06877517700195312, 0.073699951171875, 0.07862472534179688, 0.08354949951171875, 0.08847427368164062, 0.0933990478515625, 0.09832382202148438, 0.10324859619140625, 0.10817337036132812, 0.11309814453125, 0.11802291870117188, 0.12294769287109375, 0.12787246704101562, 0.1327972412109375, 0.13772201538085938, 0.14264678955078125, 0.14757156372070312, 0.152496337890625, 0.15742111206054688, 0.16234588623046875, 0.16727066040039062, 0.1721954345703125, 0.17712020874023438, 0.18204498291015625, 0.18696975708007812, 0.19189453125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 31.0, 101.0, 358.0, 320.0, 117.0, 40.0, 17.0, 11.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8362627029418945, -4.6495041847229, -4.462745666503906, -4.275987148284912, -4.089228630065918, -3.902470111846924, -3.7157113552093506, -3.5289528369903564, -3.3421943187713623, -3.155435800552368, -2.968677282333374, -2.781918525695801, -2.5951600074768066, -2.4084014892578125, -2.2216429710388184, -2.034884452819824, -1.84812593460083, -1.661367416381836, -1.4746088981628418, -1.287850260734558, -1.101091742515564, -0.9143332242965698, -0.7275745868682861, -0.540816068649292, -0.35405755043029785, -0.16729900240898132, 0.019459545612335205, 0.20621812343597412, 0.39297664165496826, 0.5797351598739624, 0.7664937973022461, 0.9532523155212402, 1.1400108337402344, 1.3267693519592285, 1.5135278701782227, 1.7002865076065063, 1.8870450258255005, 2.073803424835205, 2.2605621814727783, 2.4473206996917725, 2.6340792179107666, 2.8208377361297607, 3.007596254348755, 3.194355010986328, 3.3811135292053223, 3.5678720474243164, 3.7546305656433105, 3.9413890838623047, 4.128147602081299, 4.314906120300293, 4.501664638519287, 4.688423156738281, 4.875181674957275, 5.0619401931762695, 5.248699188232422, 5.435457229614258, 5.62221622467041, 5.808974742889404, 5.995733261108398, 6.182491779327393, 6.369250297546387, 6.556008815765381, 6.742767333984375, 6.929526329040527, 7.116284370422363]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 5.0, 10.0, 7.0, 12.0, 14.0, 25.0, 24.0, 29.0, 37.0, 35.0, 40.0, 51.0, 54.0, 63.0, 50.0, 68.0, 62.0, 59.0, 49.0, 44.0, 56.0, 38.0, 37.0, 24.0, 30.0, 27.0, 11.0, 12.0, 7.0, 7.0, 5.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.413717269897461, -3.3074533939361572, -3.2011895179748535, -3.09492564201355, -2.988661766052246, -2.8823978900909424, -2.7761340141296387, -2.669869899749756, -2.5636062622070312, -2.4573423862457275, -2.351078510284424, -2.24481463432312, -2.1385507583618164, -2.0322868824005127, -1.9260228872299194, -1.8197590112686157, -1.7134950160980225, -1.6072311401367188, -1.500967264175415, -1.3947033882141113, -1.2884395122528076, -1.182175636291504, -1.0759116411209106, -0.9696477651596069, -0.8633838891983032, -0.7571200132369995, -0.6508561372756958, -0.5445922017097473, -0.4383283257484436, -0.3320644497871399, -0.2258005142211914, -0.1195366382598877, -0.013273000717163086, 0.09299089014530182, 0.19925478100776672, 0.3055186867713928, 0.41178256273269653, 0.5180464386940002, 0.6243103742599487, 0.7305742502212524, 0.8368381261825562, 0.9431020021438599, 1.0493658781051636, 1.1556298732757568, 1.2618937492370605, 1.3681576251983643, 1.474421501159668, 1.5806853771209717, 1.6869492530822754, 1.793213129043579, 1.8994770050048828, 2.0057408809661865, 2.1120047569274902, 2.218268632888794, 2.3245325088500977, 2.4307966232299805, 2.537060260772705, 2.643324136734009, 2.7495880126953125, 2.855851888656616, 2.96211576461792, 3.0683796405792236, 3.1746435165405273, 3.28090763092041, 3.387171506881714]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 10.0, 16.0, 14.0, 26.0, 45.0, 81.0, 144.0, 248.0, 605.0, 1633.0, 9947.0, 3670741.0, 501257.0, 7440.0, 1253.0, 427.0, 184.0, 103.0, 46.0, 19.0, 14.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.9803924560546875, -1.929534912109375, -1.8786773681640625, -1.82781982421875, -1.7769622802734375, -1.726104736328125, -1.6752471923828125, -1.6243896484375, -1.5735321044921875, -1.522674560546875, -1.4718170166015625, -1.42095947265625, -1.3701019287109375, -1.319244384765625, -1.2683868408203125, -1.217529296875, -1.1666717529296875, -1.115814208984375, -1.0649566650390625, -1.01409912109375, -0.9632415771484375, -0.912384033203125, -0.8615264892578125, -0.8106689453125, -0.7598114013671875, -0.708953857421875, -0.6580963134765625, -0.60723876953125, -0.5563812255859375, -0.505523681640625, -0.4546661376953125, -0.40380859375, -0.3529510498046875, -0.302093505859375, -0.2512359619140625, -0.20037841796875, -0.1495208740234375, -0.098663330078125, -0.0478057861328125, 0.0030517578125, 0.0539093017578125, 0.104766845703125, 0.1556243896484375, 0.20648193359375, 0.2573394775390625, 0.308197021484375, 0.3590545654296875, 0.409912109375, 0.4607696533203125, 0.511627197265625, 0.5624847412109375, 0.61334228515625, 0.6641998291015625, 0.715057373046875, 0.7659149169921875, 0.8167724609375, 0.8676300048828125, 0.918487548828125, 0.9693450927734375, 1.02020263671875, 1.0710601806640625, 1.121917724609375, 1.1727752685546875, 1.2236328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 4.0, 13.0, 31.0, 47.0, 80.0, 75.0, 116.0, 136.0, 138.0, 107.0, 85.0, 73.0, 53.0, 23.0, 10.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.452392578125, -0.4413566589355469, -0.43032073974609375, -0.4192848205566406, -0.4082489013671875, -0.3972129821777344, -0.38617706298828125, -0.3751411437988281, -0.364105224609375, -0.3530693054199219, -0.34203338623046875, -0.3309974670410156, -0.3199615478515625, -0.3089256286621094, -0.29788970947265625, -0.2868537902832031, -0.27581787109375, -0.2647819519042969, -0.25374603271484375, -0.24271011352539062, -0.2316741943359375, -0.22063827514648438, -0.20960235595703125, -0.19856643676757812, -0.187530517578125, -0.17649459838867188, -0.16545867919921875, -0.15442276000976562, -0.1433868408203125, -0.13235092163085938, -0.12131500244140625, -0.11027908325195312, -0.0992431640625, -0.08820724487304688, -0.07717132568359375, -0.06613540649414062, -0.0550994873046875, -0.044063568115234375, -0.03302764892578125, -0.021991729736328125, -0.010955810546875, 8.0108642578125e-05, 0.01111602783203125, 0.022151947021484375, 0.0331878662109375, 0.044223785400390625, 0.05525970458984375, 0.06629562377929688, 0.07733154296875, 0.08836746215820312, 0.09940338134765625, 0.11043930053710938, 0.1214752197265625, 0.13251113891601562, 0.14354705810546875, 0.15458297729492188, 0.165618896484375, 0.17665481567382812, 0.18769073486328125, 0.19872665405273438, 0.2097625732421875, 0.22079849243164062, 0.23183441162109375, 0.24287033081054688, 0.25390625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 14.0, 16.0, 32.0, 46.0, 68.0, 129.0, 208.0, 389.0, 841.0, 1830.0, 4684.0, 14722.0, 75574.0, 3310519.0, 717788.0, 48770.0, 11340.0, 3948.0, 1573.0, 769.0, 402.0, 231.0, 139.0, 77.0, 57.0, 35.0, 26.0, 13.0, 12.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.38558197021484375, -0.3717498779296875, -0.35791778564453125, -0.344085693359375, -0.33025360107421875, -0.3164215087890625, -0.30258941650390625, -0.28875732421875, -0.27492523193359375, -0.2610931396484375, -0.24726104736328125, -0.233428955078125, -0.21959686279296875, -0.2057647705078125, -0.19193267822265625, -0.1781005859375, -0.16426849365234375, -0.1504364013671875, -0.13660430908203125, -0.122772216796875, -0.10894012451171875, -0.0951080322265625, -0.08127593994140625, -0.06744384765625, -0.05361175537109375, -0.0397796630859375, -0.02594757080078125, -0.012115478515625, 0.00171661376953125, 0.0155487060546875, 0.02938079833984375, 0.043212890625, 0.05704498291015625, 0.0708770751953125, 0.08470916748046875, 0.098541259765625, 0.11237335205078125, 0.1262054443359375, 0.14003753662109375, 0.15386962890625, 0.16770172119140625, 0.1815338134765625, 0.19536590576171875, 0.209197998046875, 0.22303009033203125, 0.2368621826171875, 0.25069427490234375, 0.2645263671875, 0.27835845947265625, 0.2921905517578125, 0.30602264404296875, 0.319854736328125, 0.33368682861328125, 0.3475189208984375, 0.36135101318359375, 0.37518310546875, 0.38901519775390625, 0.4028472900390625, 0.41667938232421875, 0.430511474609375, 0.44434356689453125, 0.4581756591796875, 0.47200775146484375, 0.48583984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 8.0, 24.0, 34.0, 64.0, 102.0, 324.0, 2099.0, 906.0, 220.0, 108.0, 52.0, 39.0, 25.0, 10.0, 15.0, 6.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.1454315185546875, -0.138763427734375, -0.1320953369140625, -0.12542724609375, -0.1187591552734375, -0.112091064453125, -0.1054229736328125, -0.0987548828125, -0.0920867919921875, -0.085418701171875, -0.0787506103515625, -0.07208251953125, -0.0654144287109375, -0.058746337890625, -0.0520782470703125, -0.04541015625, -0.0387420654296875, -0.032073974609375, -0.0254058837890625, -0.01873779296875, -0.0120697021484375, -0.005401611328125, 0.0012664794921875, 0.0079345703125, 0.0146026611328125, 0.021270751953125, 0.0279388427734375, 0.03460693359375, 0.0412750244140625, 0.047943115234375, 0.0546112060546875, 0.061279296875, 0.0679473876953125, 0.074615478515625, 0.0812835693359375, 0.08795166015625, 0.0946197509765625, 0.101287841796875, 0.1079559326171875, 0.1146240234375, 0.1212921142578125, 0.127960205078125, 0.1346282958984375, 0.14129638671875, 0.1479644775390625, 0.154632568359375, 0.1613006591796875, 0.16796875, 0.1746368408203125, 0.181304931640625, 0.1879730224609375, 0.19464111328125, 0.2013092041015625, 0.207977294921875, 0.2146453857421875, 0.2213134765625, 0.2279815673828125, 0.234649658203125, 0.2413177490234375, 0.24798583984375, 0.2546539306640625, 0.261322021484375, 0.2679901123046875, 0.274658203125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 10.0, 15.0, 33.0, 169.0, 364.0, 248.0, 112.0, 36.0, 11.0, 8.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5575941801071167, -0.4986702799797058, -0.4397464096546173, -0.3808225393295288, -0.3218986392021179, -0.26297473907470703, -0.20405086874961853, -0.14512699842453003, -0.08620309829711914, -0.027279213070869446, 0.03164467215538025, 0.09056855738162994, 0.14949244260787964, 0.20841634273529053, 0.26734021306037903, 0.32626408338546753, 0.3851879835128784, 0.4441118836402893, 0.5030357837677002, 0.5619596242904663, 0.6208835244178772, 0.6798074245452881, 0.7387312650680542, 0.7976551651954651, 0.856579065322876, 0.9155029654502869, 0.9744268655776978, 1.0333507061004639, 1.0922746658325195, 1.1511985063552856, 1.2101223468780518, 1.2690463066101074, 1.327970266342163, 1.3868941068649292, 1.4458180665969849, 1.504741907119751, 1.5636658668518066, 1.6225897073745728, 1.6815135478973389, 1.7404375076293945, 1.7993613481521606, 1.8582851886749268, 1.9172091484069824, 1.9761329889297485, 2.0350568294525146, 2.0939807891845703, 2.152904748916626, 2.2118284702301025, 2.270752429962158, 2.329676389694214, 2.3886001110076904, 2.447524070739746, 2.5064480304718018, 2.5653719902038574, 2.624295711517334, 2.6832196712493896, 2.7421436309814453, 2.801067590713501, 2.8599913120269775, 2.918915271759033, 2.977839231491089, 3.0367631912231445, 3.095686912536621, 3.1546108722686768, 3.2135345935821533]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 6.0, 10.0, 12.0, 22.0, 22.0, 20.0, 33.0, 33.0, 48.0, 43.0, 44.0, 45.0, 54.0, 40.0, 54.0, 45.0, 65.0, 66.0, 50.0, 40.0, 35.0, 32.0, 37.0, 33.0, 21.0, 19.0, 18.0, 16.0, 9.0, 3.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4308505058288574, -0.41090407967567444, -0.39095762372016907, -0.3710111975669861, -0.3510647714138031, -0.3311183452606201, -0.31117188930511475, -0.29122546315193176, -0.2712790369987488, -0.2513326108455658, -0.23138616979122162, -0.21143972873687744, -0.19149330258369446, -0.17154686152935028, -0.1516004204750061, -0.13165399432182312, -0.11170753836631775, -0.09176110476255417, -0.07181467115879059, -0.05186823010444641, -0.03192179650068283, -0.01197536289691925, 0.007971078157424927, 0.02791750431060791, 0.04786394536495209, 0.06781037896871567, 0.08775681257247925, 0.10770325362682343, 0.1276496946811676, 0.14759612083435059, 0.16754256188869476, 0.18748898804187775, 0.20743542909622192, 0.2273818701505661, 0.24732829630374908, 0.26727473735809326, 0.28722116351127625, 0.30716758966445923, 0.3271140456199646, 0.3470604717731476, 0.36700689792633057, 0.38695332407951355, 0.4068997800350189, 0.4268462061882019, 0.4467926323413849, 0.46673905849456787, 0.48668551445007324, 0.5066319704055786, 0.526578426361084, 0.5465248823165894, 0.56647127866745, 0.5864177346229553, 0.6063641905784607, 0.6263105869293213, 0.6462570428848267, 0.666203498840332, 0.6861498951911926, 0.706096351146698, 0.7260427474975586, 0.745989203453064, 0.7659356594085693, 0.7858820557594299, 0.8058285117149353, 0.8257749080657959, 0.8457213640213013]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 13.0, 14.0, 17.0, 25.0, 50.0, 50.0, 85.0, 127.0, 208.0, 338.0, 632.0, 1293.0, 3692.0, 16874.0, 131496.0, 713623.0, 153844.0, 19066.0, 4106.0, 1410.0, 665.0, 327.0, 197.0, 137.0, 74.0, 47.0, 37.0, 24.0, 22.0, 15.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.733306884765625, -0.70928955078125, -0.685272216796875, -0.6612548828125, -0.637237548828125, -0.61322021484375, -0.589202880859375, -0.565185546875, -0.541168212890625, -0.51715087890625, -0.493133544921875, -0.4691162109375, -0.445098876953125, -0.42108154296875, -0.397064208984375, -0.373046875, -0.349029541015625, -0.32501220703125, -0.300994873046875, -0.2769775390625, -0.252960205078125, -0.22894287109375, -0.204925537109375, -0.180908203125, -0.156890869140625, -0.13287353515625, -0.108856201171875, -0.0848388671875, -0.060821533203125, -0.03680419921875, -0.012786865234375, 0.01123046875, 0.035247802734375, 0.05926513671875, 0.083282470703125, 0.1072998046875, 0.131317138671875, 0.15533447265625, 0.179351806640625, 0.203369140625, 0.227386474609375, 0.25140380859375, 0.275421142578125, 0.2994384765625, 0.323455810546875, 0.34747314453125, 0.371490478515625, 0.3955078125, 0.419525146484375, 0.44354248046875, 0.467559814453125, 0.4915771484375, 0.515594482421875, 0.53961181640625, 0.563629150390625, 0.587646484375, 0.611663818359375, 0.63568115234375, 0.659698486328125, 0.6837158203125, 0.707733154296875, 0.73175048828125, 0.755767822265625, 0.77978515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 23.0, 30.0, 49.0, 75.0, 88.0, 130.0, 126.0, 134.0, 102.0, 85.0, 66.0, 47.0, 21.0, 9.0, 3.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.420654296875, -0.4100799560546875, -0.399505615234375, -0.3889312744140625, -0.37835693359375, -0.3677825927734375, -0.357208251953125, -0.3466339111328125, -0.3360595703125, -0.3254852294921875, -0.314910888671875, -0.3043365478515625, -0.29376220703125, -0.2831878662109375, -0.272613525390625, -0.2620391845703125, -0.25146484375, -0.2408905029296875, -0.230316162109375, -0.2197418212890625, -0.20916748046875, -0.1985931396484375, -0.188018798828125, -0.1774444580078125, -0.1668701171875, -0.1562957763671875, -0.145721435546875, -0.1351470947265625, -0.12457275390625, -0.1139984130859375, -0.103424072265625, -0.0928497314453125, -0.082275390625, -0.0717010498046875, -0.061126708984375, -0.0505523681640625, -0.03997802734375, -0.0294036865234375, -0.018829345703125, -0.0082550048828125, 0.0023193359375, 0.0128936767578125, 0.023468017578125, 0.0340423583984375, 0.04461669921875, 0.0551910400390625, 0.065765380859375, 0.0763397216796875, 0.0869140625, 0.0974884033203125, 0.108062744140625, 0.1186370849609375, 0.12921142578125, 0.1397857666015625, 0.150360107421875, 0.1609344482421875, 0.1715087890625, 0.1820831298828125, 0.192657470703125, 0.2032318115234375, 0.21380615234375, 0.2243804931640625, 0.234954833984375, 0.2455291748046875, 0.256103515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 10.0, 17.0, 24.0, 29.0, 39.0, 57.0, 81.0, 132.0, 182.0, 303.0, 454.0, 661.0, 1180.0, 2073.0, 3965.0, 8000.0, 17180.0, 39089.0, 99579.0, 277468.0, 358159.0, 142243.0, 53462.0, 22550.0, 10247.0, 5019.0, 2620.0, 1466.0, 788.0, 511.0, 290.0, 188.0, 152.0, 111.0, 60.0, 46.0, 26.0, 25.0, 22.0, 8.0, 11.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0], "bins": [-0.2724609375, -0.2642478942871094, -0.25603485107421875, -0.24782180786132812, -0.2396087646484375, -0.23139572143554688, -0.22318267822265625, -0.21496963500976562, -0.206756591796875, -0.19854354858398438, -0.19033050537109375, -0.18211746215820312, -0.1739044189453125, -0.16569137573242188, -0.15747833251953125, -0.14926528930664062, -0.14105224609375, -0.13283920288085938, -0.12462615966796875, -0.11641311645507812, -0.1082000732421875, -0.09998703002929688, -0.09177398681640625, -0.08356094360351562, -0.075347900390625, -0.06713485717773438, -0.05892181396484375, -0.050708770751953125, -0.0424957275390625, -0.034282684326171875, -0.02606964111328125, -0.017856597900390625, -0.0096435546875, -0.001430511474609375, 0.00678253173828125, 0.014995574951171875, 0.0232086181640625, 0.031421661376953125, 0.03963470458984375, 0.047847747802734375, 0.056060791015625, 0.06427383422851562, 0.07248687744140625, 0.08069992065429688, 0.0889129638671875, 0.09712600708007812, 0.10533905029296875, 0.11355209350585938, 0.12176513671875, 0.12997817993164062, 0.13819122314453125, 0.14640426635742188, 0.1546173095703125, 0.16283035278320312, 0.17104339599609375, 0.17925643920898438, 0.187469482421875, 0.19568252563476562, 0.20389556884765625, 0.21210861206054688, 0.2203216552734375, 0.22853469848632812, 0.23674774169921875, 0.24496078491210938, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 3.0, 9.0, 11.0, 10.0, 18.0, 8.0, 13.0, 19.0, 14.0, 23.0, 35.0, 33.0, 46.0, 35.0, 41.0, 52.0, 49.0, 47.0, 39.0, 45.0, 41.0, 42.0, 39.0, 30.0, 30.0, 36.0, 34.0, 25.0, 24.0, 28.0, 25.0, 17.0, 19.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.5048751831054688, -0.4882659912109375, -0.47165679931640625, -0.455047607421875, -0.43843841552734375, -0.4218292236328125, -0.40522003173828125, -0.38861083984375, -0.37200164794921875, -0.3553924560546875, -0.33878326416015625, -0.322174072265625, -0.30556488037109375, -0.2889556884765625, -0.27234649658203125, -0.2557373046875, -0.23912811279296875, -0.2225189208984375, -0.20590972900390625, -0.189300537109375, -0.17269134521484375, -0.1560821533203125, -0.13947296142578125, -0.12286376953125, -0.10625457763671875, -0.0896453857421875, -0.07303619384765625, -0.056427001953125, -0.03981781005859375, -0.0232086181640625, -0.00659942626953125, 0.010009765625, 0.02661895751953125, 0.0432281494140625, 0.05983734130859375, 0.076446533203125, 0.09305572509765625, 0.1096649169921875, 0.12627410888671875, 0.14288330078125, 0.15949249267578125, 0.1761016845703125, 0.19271087646484375, 0.209320068359375, 0.22592926025390625, 0.2425384521484375, 0.25914764404296875, 0.2757568359375, 0.29236602783203125, 0.3089752197265625, 0.32558441162109375, 0.342193603515625, 0.35880279541015625, 0.3754119873046875, 0.39202117919921875, 0.40863037109375, 0.42523956298828125, 0.4418487548828125, 0.45845794677734375, 0.475067138671875, 0.49167633056640625, 0.5082855224609375, 0.5248947143554688, 0.54150390625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 6.0, 8.0, 12.0, 23.0, 37.0, 83.0, 185.0, 500.0, 1630.0, 8541.0, 148824.0, 816337.0, 64992.0, 5475.0, 1229.0, 358.0, 150.0, 68.0, 41.0, 16.0, 12.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.31298828125, -0.3041419982910156, -0.29529571533203125, -0.2864494323730469, -0.2776031494140625, -0.2687568664550781, -0.25991058349609375, -0.2510643005371094, -0.242218017578125, -0.23337173461914062, -0.22452545166015625, -0.21567916870117188, -0.2068328857421875, -0.19798660278320312, -0.18914031982421875, -0.18029403686523438, -0.17144775390625, -0.16260147094726562, -0.15375518798828125, -0.14490890502929688, -0.1360626220703125, -0.12721633911132812, -0.11837005615234375, -0.10952377319335938, -0.100677490234375, -0.09183120727539062, -0.08298492431640625, -0.07413864135742188, -0.0652923583984375, -0.056446075439453125, -0.04759979248046875, -0.038753509521484375, -0.0299072265625, -0.021060943603515625, -0.01221466064453125, -0.003368377685546875, 0.0054779052734375, 0.014324188232421875, 0.02317047119140625, 0.032016754150390625, 0.040863037109375, 0.049709320068359375, 0.05855560302734375, 0.06740188598632812, 0.0762481689453125, 0.08509445190429688, 0.09394073486328125, 0.10278701782226562, 0.11163330078125, 0.12047958374023438, 0.12932586669921875, 0.13817214965820312, 0.1470184326171875, 0.15586471557617188, 0.16471099853515625, 0.17355728149414062, 0.182403564453125, 0.19124984741210938, 0.20009613037109375, 0.20894241333007812, 0.2177886962890625, 0.22663497924804688, 0.23548126220703125, 0.24432754516601562, 0.253173828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 2.0, 5.0, 11.0, 5.0, 11.0, 9.0, 16.0, 16.0, 13.0, 29.0, 27.0, 40.0, 40.0, 62.0, 91.0, 80.0, 102.0, 98.0, 63.0, 57.0, 39.0, 25.0, 32.0, 23.0, 20.0, 21.0, 14.0, 10.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001633167266845703, -0.00015808828175067902, -0.00015285983681678772, -0.00014763139188289642, -0.00014240294694900513, -0.00013717450201511383, -0.00013194605708122253, -0.00012671761214733124, -0.00012148916721343994, -0.00011626072227954865, -0.00011103227734565735, -0.00010580383241176605, -0.00010057538747787476, -9.534694254398346e-05, -9.011849761009216e-05, -8.489005267620087e-05, -7.966160774230957e-05, -7.443316280841827e-05, -6.920471787452698e-05, -6.397627294063568e-05, -5.8747828006744385e-05, -5.351938307285309e-05, -4.829093813896179e-05, -4.3062493205070496e-05, -3.78340482711792e-05, -3.26056033372879e-05, -2.7377158403396606e-05, -2.214871346950531e-05, -1.6920268535614014e-05, -1.1691823601722717e-05, -6.463378667831421e-06, -1.2349337339401245e-06, 3.993511199951172e-06, 9.221956133842468e-06, 1.4450401067733765e-05, 1.967884600162506e-05, 2.4907290935516357e-05, 3.0135735869407654e-05, 3.536418080329895e-05, 4.0592625737190247e-05, 4.582107067108154e-05, 5.104951560497284e-05, 5.6277960538864136e-05, 6.150640547275543e-05, 6.673485040664673e-05, 7.196329534053802e-05, 7.719174027442932e-05, 8.242018520832062e-05, 8.764863014221191e-05, 9.287707507610321e-05, 9.810552000999451e-05, 0.0001033339649438858, 0.0001085624098777771, 0.0001137908548116684, 0.00011901929974555969, 0.000124247744679451, 0.00012947618961334229, 0.00013470463454723358, 0.00013993307948112488, 0.00014516152441501617, 0.00015038996934890747, 0.00015561841428279877, 0.00016084685921669006, 0.00016607530415058136, 0.00017130374908447266]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 9.0, 9.0, 15.0, 16.0, 38.0, 66.0, 97.0, 157.0, 335.0, 620.0, 1280.0, 2850.0, 7101.0, 23549.0, 118359.0, 485917.0, 324171.0, 60573.0, 14382.0, 4917.0, 2064.0, 941.0, 450.0, 274.0, 136.0, 85.0, 44.0, 32.0, 15.0, 18.0, 8.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1473388671875, -0.14298057556152344, -0.13862228393554688, -0.1342639923095703, -0.12990570068359375, -0.1255474090576172, -0.12118911743164062, -0.11683082580566406, -0.1124725341796875, -0.10811424255371094, -0.10375595092773438, -0.09939765930175781, -0.09503936767578125, -0.09068107604980469, -0.08632278442382812, -0.08196449279785156, -0.077606201171875, -0.07324790954589844, -0.06888961791992188, -0.06453132629394531, -0.06017303466796875, -0.05581474304199219, -0.051456451416015625, -0.04709815979003906, -0.0427398681640625, -0.03838157653808594, -0.034023284912109375, -0.029664993286132812, -0.02530670166015625, -0.020948410034179688, -0.016590118408203125, -0.012231826782226562, -0.00787353515625, -0.0035152435302734375, 0.000843048095703125, 0.0052013397216796875, 0.00955963134765625, 0.013917922973632812, 0.018276214599609375, 0.022634506225585938, 0.0269927978515625, 0.03135108947753906, 0.035709381103515625, 0.04006767272949219, 0.04442596435546875, 0.04878425598144531, 0.053142547607421875, 0.05750083923339844, 0.061859130859375, 0.06621742248535156, 0.07057571411132812, 0.07493400573730469, 0.07929229736328125, 0.08365058898925781, 0.08800888061523438, 0.09236717224121094, 0.0967254638671875, 0.10108375549316406, 0.10544204711914062, 0.10980033874511719, 0.11415863037109375, 0.11851692199707031, 0.12287521362304688, 0.12723350524902344, 0.131591796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 6.0, 12.0, 12.0, 25.0, 30.0, 44.0, 50.0, 70.0, 72.0, 92.0, 103.0, 90.0, 88.0, 83.0, 50.0, 40.0, 33.0, 31.0, 20.0, 15.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1859130859375, -0.18097305297851562, -0.17603302001953125, -0.17109298706054688, -0.1661529541015625, -0.16121292114257812, -0.15627288818359375, -0.15133285522460938, -0.146392822265625, -0.14145278930664062, -0.13651275634765625, -0.13157272338867188, -0.1266326904296875, -0.12169265747070312, -0.11675262451171875, -0.11181259155273438, -0.10687255859375, -0.10193252563476562, -0.09699249267578125, -0.09205245971679688, -0.0871124267578125, -0.08217239379882812, -0.07723236083984375, -0.07229232788085938, -0.067352294921875, -0.062412261962890625, -0.05747222900390625, -0.052532196044921875, -0.0475921630859375, -0.042652130126953125, -0.03771209716796875, -0.032772064208984375, -0.02783203125, -0.022891998291015625, -0.01795196533203125, -0.013011932373046875, -0.0080718994140625, -0.003131866455078125, 0.00180816650390625, 0.006748199462890625, 0.011688232421875, 0.016628265380859375, 0.02156829833984375, 0.026508331298828125, 0.0314483642578125, 0.036388397216796875, 0.04132843017578125, 0.046268463134765625, 0.05120849609375, 0.056148529052734375, 0.06108856201171875, 0.06602859497070312, 0.0709686279296875, 0.07590866088867188, 0.08084869384765625, 0.08578872680664062, 0.090728759765625, 0.09566879272460938, 0.10060882568359375, 0.10554885864257812, 0.1104888916015625, 0.11542892456054688, 0.12036895751953125, 0.12530899047851562, 0.1302490234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 38.0, 182.0, 546.0, 177.0, 36.0, 19.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.51819610595703, -16.19015884399414, -15.862123489379883, -15.534086227416992, -15.206049919128418, -14.878013610839844, -14.549976348876953, -14.221940040588379, -13.893903732299805, -13.56586742401123, -13.237831115722656, -12.909793853759766, -12.581757545471191, -12.253721237182617, -11.925683975219727, -11.597647666931152, -11.269611358642578, -10.941575050354004, -10.61353874206543, -10.285501480102539, -9.957465171813965, -9.62942886352539, -9.3013916015625, -8.973355293273926, -8.645318984985352, -8.317282676696777, -7.989245891571045, -7.6612091064453125, -7.333172798156738, -7.005136489868164, -6.677099704742432, -6.349062919616699, -6.021025657653809, -5.692989349365234, -5.364952564239502, -5.0369157791137695, -4.708879470825195, -4.380843162536621, -4.052806377410889, -3.7247698307037354, -3.396733283996582, -3.0686967372894287, -2.7406601905822754, -2.412623643875122, -2.0845870971679688, -1.7565505504608154, -1.428514003753662, -1.1004774570465088, -0.7724409103393555, -0.44440436363220215, -0.11636781692504883, 0.2116687297821045, 0.5397052764892578, 0.8677418231964111, 1.1957783699035645, 1.5238149166107178, 1.851851463317871, 2.1798880100250244, 2.5079245567321777, 2.835961103439331, 3.1639976501464844, 3.4920341968536377, 3.820070743560791, 4.148107528686523, 4.476143836975098]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 4.0, 7.0, 5.0, 7.0, 5.0, 7.0, 7.0, 16.0, 11.0, 18.0, 22.0, 19.0, 29.0, 23.0, 32.0, 27.0, 41.0, 29.0, 35.0, 48.0, 46.0, 39.0, 37.0, 33.0, 43.0, 36.0, 35.0, 31.0, 39.0, 34.0, 34.0, 22.0, 24.0, 24.0, 12.0, 27.0, 13.0, 14.0, 17.0, 11.0, 6.0, 4.0, 11.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.781054973602295, -2.69256591796875, -2.604076862335205, -2.51558780670166, -2.4270989894866943, -2.3386099338531494, -2.2501208782196045, -2.1616318225860596, -2.0731427669525146, -1.9846537113189697, -1.8961647748947144, -1.8076757192611694, -1.7191866636276245, -1.6306977272033691, -1.5422086715698242, -1.4537196159362793, -1.365230679512024, -1.276741623878479, -1.1882526874542236, -1.0997636318206787, -1.0112745761871338, -0.9227855801582336, -0.8342965841293335, -0.7458075284957886, -0.6573185324668884, -0.5688295364379883, -0.48034048080444336, -0.3918514847755432, -0.3033624589443207, -0.21487343311309814, -0.126384437084198, -0.037895381450653076, 0.05059361457824707, 0.1390826404094696, 0.22757165133953094, 0.3160606622695923, 0.4045496881008148, 0.49303871393203735, 0.5815277099609375, 0.6700167655944824, 0.7585057616233826, 0.8469947576522827, 0.9354838132858276, 1.023972749710083, 1.112461805343628, 1.2009508609771729, 1.2894399166107178, 1.3779289722442627, 1.466417908668518, 1.554906964302063, 1.6433959007263184, 1.7318849563598633, 1.8203740119934082, 1.9088630676269531, 1.9973520040512085, 2.085841178894043, 2.174329996109009, 2.2628190517425537, 2.3513081073760986, 2.4397969245910645, 2.5282859802246094, 2.6167750358581543, 2.705264091491699, 2.793753147125244, 2.882242202758789]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 7.0, 13.0, 10.0, 25.0, 47.0, 82.0, 153.0, 352.0, 974.0, 4399.0, 97005.0, 4074987.0, 13397.0, 1883.0, 516.0, 213.0, 110.0, 45.0, 21.0, 13.0, 9.0, 8.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.267578125, -2.2013702392578125, -2.135162353515625, -2.0689544677734375, -2.00274658203125, -1.9365386962890625, -1.870330810546875, -1.8041229248046875, -1.7379150390625, -1.6717071533203125, -1.605499267578125, -1.5392913818359375, -1.47308349609375, -1.4068756103515625, -1.340667724609375, -1.2744598388671875, -1.208251953125, -1.1420440673828125, -1.075836181640625, -1.0096282958984375, -0.94342041015625, -0.8772125244140625, -0.811004638671875, -0.7447967529296875, -0.6785888671875, -0.6123809814453125, -0.546173095703125, -0.4799652099609375, -0.41375732421875, -0.3475494384765625, -0.281341552734375, -0.2151336669921875, -0.14892578125, -0.0827178955078125, -0.016510009765625, 0.0496978759765625, 0.11590576171875, 0.1821136474609375, 0.248321533203125, 0.3145294189453125, 0.3807373046875, 0.4469451904296875, 0.513153076171875, 0.5793609619140625, 0.64556884765625, 0.7117767333984375, 0.777984619140625, 0.8441925048828125, 0.910400390625, 0.9766082763671875, 1.042816162109375, 1.1090240478515625, 1.17523193359375, 1.2414398193359375, 1.307647705078125, 1.3738555908203125, 1.4400634765625, 1.5062713623046875, 1.572479248046875, 1.6386871337890625, 1.70489501953125, 1.7711029052734375, 1.837310791015625, 1.9035186767578125, 1.9697265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 19.0, 42.0, 55.0, 57.0, 84.0, 101.0, 94.0, 90.0, 90.0, 96.0, 76.0, 61.0, 45.0, 25.0, 15.0, 15.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39404296875, -0.38376617431640625, -0.3734893798828125, -0.36321258544921875, -0.352935791015625, -0.34265899658203125, -0.3323822021484375, -0.32210540771484375, -0.31182861328125, -0.30155181884765625, -0.2912750244140625, -0.28099822998046875, -0.270721435546875, -0.26044464111328125, -0.2501678466796875, -0.23989105224609375, -0.2296142578125, -0.21933746337890625, -0.2090606689453125, -0.19878387451171875, -0.188507080078125, -0.17823028564453125, -0.1679534912109375, -0.15767669677734375, -0.14739990234375, -0.13712310791015625, -0.1268463134765625, -0.11656951904296875, -0.106292724609375, -0.09601593017578125, -0.0857391357421875, -0.07546234130859375, -0.065185546875, -0.05490875244140625, -0.0446319580078125, -0.03435516357421875, -0.024078369140625, -0.01380157470703125, -0.0035247802734375, 0.00675201416015625, 0.01702880859375, 0.02730560302734375, 0.0375823974609375, 0.04785919189453125, 0.058135986328125, 0.06841278076171875, 0.0786895751953125, 0.08896636962890625, 0.0992431640625, 0.10951995849609375, 0.1197967529296875, 0.13007354736328125, 0.140350341796875, 0.15062713623046875, 0.1609039306640625, 0.17118072509765625, 0.18145751953125, 0.19173431396484375, 0.2020111083984375, 0.21228790283203125, 0.222564697265625, 0.23284149169921875, 0.2431182861328125, 0.25339508056640625, 0.263671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 4.0, 7.0, 13.0, 14.0, 29.0, 41.0, 41.0, 66.0, 104.0, 149.0, 235.0, 304.0, 628.0, 1121.0, 2502.0, 6753.0, 29823.0, 321798.0, 3713541.0, 94094.0, 14738.0, 4243.0, 1819.0, 857.0, 489.0, 327.0, 190.0, 125.0, 64.0, 70.0, 36.0, 19.0, 14.0, 10.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.546875, -0.5293960571289062, -0.5119171142578125, -0.49443817138671875, -0.476959228515625, -0.45948028564453125, -0.4420013427734375, -0.42452239990234375, -0.40704345703125, -0.38956451416015625, -0.3720855712890625, -0.35460662841796875, -0.337127685546875, -0.31964874267578125, -0.3021697998046875, -0.28469085693359375, -0.2672119140625, -0.24973297119140625, -0.2322540283203125, -0.21477508544921875, -0.197296142578125, -0.17981719970703125, -0.1623382568359375, -0.14485931396484375, -0.12738037109375, -0.10990142822265625, -0.0924224853515625, -0.07494354248046875, -0.057464599609375, -0.03998565673828125, -0.0225067138671875, -0.00502777099609375, 0.012451171875, 0.02993011474609375, 0.0474090576171875, 0.06488800048828125, 0.082366943359375, 0.09984588623046875, 0.1173248291015625, 0.13480377197265625, 0.15228271484375, 0.16976165771484375, 0.1872406005859375, 0.20471954345703125, 0.222198486328125, 0.23967742919921875, 0.2571563720703125, 0.27463531494140625, 0.2921142578125, 0.30959320068359375, 0.3270721435546875, 0.34455108642578125, 0.362030029296875, 0.37950897216796875, 0.3969879150390625, 0.41446685791015625, 0.43194580078125, 0.44942474365234375, 0.4669036865234375, 0.48438262939453125, 0.501861572265625, 0.5193405151367188, 0.5368194580078125, 0.5542984008789062, 0.57177734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 5.0, 12.0, 21.0, 45.0, 53.0, 108.0, 346.0, 2418.0, 706.0, 175.0, 71.0, 39.0, 26.0, 14.0, 8.0, 6.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4052734375, -0.3936004638671875, -0.381927490234375, -0.3702545166015625, -0.35858154296875, -0.3469085693359375, -0.335235595703125, -0.3235626220703125, -0.3118896484375, -0.3002166748046875, -0.288543701171875, -0.2768707275390625, -0.26519775390625, -0.2535247802734375, -0.241851806640625, -0.2301788330078125, -0.218505859375, -0.2068328857421875, -0.195159912109375, -0.1834869384765625, -0.17181396484375, -0.1601409912109375, -0.148468017578125, -0.1367950439453125, -0.1251220703125, -0.1134490966796875, -0.101776123046875, -0.0901031494140625, -0.07843017578125, -0.0667572021484375, -0.055084228515625, -0.0434112548828125, -0.03173828125, -0.0200653076171875, -0.008392333984375, 0.0032806396484375, 0.01495361328125, 0.0266265869140625, 0.038299560546875, 0.0499725341796875, 0.0616455078125, 0.0733184814453125, 0.084991455078125, 0.0966644287109375, 0.10833740234375, 0.1200103759765625, 0.131683349609375, 0.1433563232421875, 0.155029296875, 0.1667022705078125, 0.178375244140625, 0.1900482177734375, 0.20172119140625, 0.2133941650390625, 0.225067138671875, 0.2367401123046875, 0.2484130859375, 0.2600860595703125, 0.271759033203125, 0.2834320068359375, 0.29510498046875, 0.3067779541015625, 0.318450927734375, 0.3301239013671875, 0.341796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 11.0, 26.0, 92.0, 423.0, 365.0, 64.0, 13.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2928340435028076, -1.173526406288147, -1.0542187690734863, -0.9349111914634705, -0.8156035542488098, -0.6962959170341492, -0.5769883394241333, -0.45768070220947266, -0.338373064994812, -0.21906544268131256, -0.09975782036781311, 0.019549787044525146, 0.1388574242591858, 0.25816506147384644, 0.3774726390838623, 0.49678027629852295, 0.6160879135131836, 0.7353955507278442, 0.8547031879425049, 0.9740107655525208, 1.0933184623718262, 1.2126259803771973, 1.331933617591858, 1.4512412548065186, 1.5705488920211792, 1.6898565292358398, 1.8091641664505005, 1.9284718036651611, 2.0477793216705322, 2.1670870780944824, 2.2863945960998535, 2.4057021141052246, 2.5250096321105957, 2.644317150115967, 2.763624906539917, 2.882932424545288, 3.0022401809692383, 3.1215476989746094, 3.2408552169799805, 3.3601629734039307, 3.479470729827881, 3.598778247833252, 3.718086004257202, 3.8373935222625732, 3.9567012786865234, 4.0760087966918945, 4.195316314697266, 4.314623832702637, 4.433931350708008, 4.553238868713379, 4.67254638671875, 4.791854381561279, 4.91116189956665, 5.0304694175720215, 5.149776935577393, 5.269084930419922, 5.388392448425293, 5.507699966430664, 5.627007484436035, 5.7463154792785645, 5.8656229972839355, 5.984930515289307, 6.104238033294678, 6.223546028137207, 6.342853546142578]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 14.0, 10.0, 13.0, 20.0, 25.0, 20.0, 34.0, 27.0, 44.0, 52.0, 42.0, 56.0, 63.0, 59.0, 67.0, 59.0, 42.0, 47.0, 56.0, 36.0, 41.0, 28.0, 29.0, 28.0, 16.0, 16.0, 14.0, 5.0, 4.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7749946117401123, -0.7453752756118774, -0.7157559394836426, -0.6861366033554077, -0.6565172076225281, -0.6268978714942932, -0.5972785353660583, -0.5676591992378235, -0.5380398035049438, -0.508420467376709, -0.47880110144615173, -0.44918176531791687, -0.4195623993873596, -0.38994306325912476, -0.3603237271308899, -0.33070439100265503, -0.30108505487442017, -0.2714657187461853, -0.24184635281562805, -0.2122270166873932, -0.18260766565799713, -0.15298831462860107, -0.12336897850036621, -0.09374962747097015, -0.0641302764415741, -0.03451092913746834, -0.004891581833362579, 0.02472776174545288, 0.05434711277484894, 0.083966463804245, 0.11358579993247986, 0.14320515096187592, 0.17282450199127197, 0.20244385302066803, 0.2320632040500641, 0.26168254017829895, 0.2913019061088562, 0.32092124223709106, 0.3505405783653259, 0.3801599144935608, 0.40977928042411804, 0.4393986165523529, 0.46901798248291016, 0.498637318611145, 0.5282566547393799, 0.5578759908676147, 0.5874953269958496, 0.6171147227287292, 0.6467340588569641, 0.676353394985199, 0.7059727311134338, 0.7355921268463135, 0.7652114629745483, 0.7948307991027832, 0.8244501352310181, 0.8540694713592529, 0.8836888074874878, 0.9133081436157227, 0.9429274797439575, 0.9725468158721924, 1.0021661520004272, 1.031785488128662, 1.0614049434661865, 1.0910242795944214, 1.1206436157226562]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 15.0, 11.0, 14.0, 37.0, 50.0, 67.0, 119.0, 183.0, 358.0, 707.0, 1474.0, 3799.0, 12692.0, 66878.0, 626939.0, 288250.0, 34036.0, 7868.0, 2706.0, 1079.0, 514.0, 284.0, 141.0, 102.0, 62.0, 45.0, 31.0, 19.0, 11.0, 11.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87646484375, -0.8505477905273438, -0.8246307373046875, -0.7987136840820312, -0.772796630859375, -0.7468795776367188, -0.7209625244140625, -0.6950454711914062, -0.66912841796875, -0.6432113647460938, -0.6172943115234375, -0.5913772583007812, -0.565460205078125, -0.5395431518554688, -0.5136260986328125, -0.48770904541015625, -0.4617919921875, -0.43587493896484375, -0.4099578857421875, -0.38404083251953125, -0.358123779296875, -0.33220672607421875, -0.3062896728515625, -0.28037261962890625, -0.25445556640625, -0.22853851318359375, -0.2026214599609375, -0.17670440673828125, -0.150787353515625, -0.12487030029296875, -0.0989532470703125, -0.07303619384765625, -0.047119140625, -0.02120208740234375, 0.0047149658203125, 0.03063201904296875, 0.056549072265625, 0.08246612548828125, 0.1083831787109375, 0.13430023193359375, 0.16021728515625, 0.18613433837890625, 0.2120513916015625, 0.23796844482421875, 0.263885498046875, 0.28980255126953125, 0.3157196044921875, 0.34163665771484375, 0.3675537109375, 0.39347076416015625, 0.4193878173828125, 0.44530487060546875, 0.471221923828125, 0.49713897705078125, 0.5230560302734375, 0.5489730834960938, 0.57489013671875, 0.6008071899414062, 0.6267242431640625, 0.6526412963867188, 0.678558349609375, 0.7044754028320312, 0.7303924560546875, 0.7563095092773438, 0.7822265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 5.0, 20.0, 23.0, 46.0, 44.0, 58.0, 77.0, 89.0, 98.0, 84.0, 96.0, 87.0, 75.0, 64.0, 51.0, 30.0, 12.0, 18.0, 9.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36962890625, -0.35974884033203125, -0.3498687744140625, -0.33998870849609375, -0.330108642578125, -0.32022857666015625, -0.3103485107421875, -0.30046844482421875, -0.29058837890625, -0.28070831298828125, -0.2708282470703125, -0.26094818115234375, -0.251068115234375, -0.24118804931640625, -0.2313079833984375, -0.22142791748046875, -0.2115478515625, -0.20166778564453125, -0.1917877197265625, -0.18190765380859375, -0.172027587890625, -0.16214752197265625, -0.1522674560546875, -0.14238739013671875, -0.13250732421875, -0.12262725830078125, -0.1127471923828125, -0.10286712646484375, -0.092987060546875, -0.08310699462890625, -0.0732269287109375, -0.06334686279296875, -0.053466796875, -0.04358673095703125, -0.0337066650390625, -0.02382659912109375, -0.013946533203125, -0.00406646728515625, 0.0058135986328125, 0.01569366455078125, 0.02557373046875, 0.03545379638671875, 0.0453338623046875, 0.05521392822265625, 0.065093994140625, 0.07497406005859375, 0.0848541259765625, 0.09473419189453125, 0.1046142578125, 0.11449432373046875, 0.1243743896484375, 0.13425445556640625, 0.144134521484375, 0.15401458740234375, 0.1638946533203125, 0.17377471923828125, 0.18365478515625, 0.19353485107421875, 0.2034149169921875, 0.21329498291015625, 0.223175048828125, 0.23305511474609375, 0.2429351806640625, 0.25281524658203125, 0.2626953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 7.0, 2.0, 10.0, 2.0, 11.0, 15.0, 18.0, 12.0, 29.0, 45.0, 56.0, 65.0, 127.0, 164.0, 297.0, 544.0, 1086.0, 2266.0, 5964.0, 19651.0, 92381.0, 552460.0, 304100.0, 49119.0, 12053.0, 4251.0, 1753.0, 797.0, 466.0, 245.0, 147.0, 118.0, 85.0, 58.0, 34.0, 29.0, 18.0, 16.0, 10.0, 14.0, 7.0, 4.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-0.5439453125, -0.5287551879882812, -0.5135650634765625, -0.49837493896484375, -0.483184814453125, -0.46799468994140625, -0.4528045654296875, -0.43761444091796875, -0.42242431640625, -0.40723419189453125, -0.3920440673828125, -0.37685394287109375, -0.361663818359375, -0.34647369384765625, -0.3312835693359375, -0.31609344482421875, -0.3009033203125, -0.28571319580078125, -0.2705230712890625, -0.25533294677734375, -0.240142822265625, -0.22495269775390625, -0.2097625732421875, -0.19457244873046875, -0.17938232421875, -0.16419219970703125, -0.1490020751953125, -0.13381195068359375, -0.118621826171875, -0.10343170166015625, -0.0882415771484375, -0.07305145263671875, -0.057861328125, -0.04267120361328125, -0.0274810791015625, -0.01229095458984375, 0.002899169921875, 0.01808929443359375, 0.0332794189453125, 0.04846954345703125, 0.06365966796875, 0.07884979248046875, 0.0940399169921875, 0.10923004150390625, 0.124420166015625, 0.13961029052734375, 0.1548004150390625, 0.16999053955078125, 0.1851806640625, 0.20037078857421875, 0.2155609130859375, 0.23075103759765625, 0.245941162109375, 0.26113128662109375, 0.2763214111328125, 0.29151153564453125, 0.30670166015625, 0.32189178466796875, 0.3370819091796875, 0.35227203369140625, 0.367462158203125, 0.38265228271484375, 0.3978424072265625, 0.41303253173828125, 0.42822265625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 5.0, 9.0, 6.0, 12.0, 13.0, 17.0, 13.0, 26.0, 18.0, 35.0, 35.0, 31.0, 49.0, 39.0, 48.0, 48.0, 57.0, 52.0, 52.0, 45.0, 42.0, 43.0, 43.0, 32.0, 41.0, 41.0, 24.0, 17.0, 21.0, 18.0, 19.0, 12.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.6298828125, -0.608551025390625, -0.58721923828125, -0.565887451171875, -0.5445556640625, -0.523223876953125, -0.50189208984375, -0.480560302734375, -0.459228515625, -0.437896728515625, -0.41656494140625, -0.395233154296875, -0.3739013671875, -0.352569580078125, -0.33123779296875, -0.309906005859375, -0.28857421875, -0.267242431640625, -0.24591064453125, -0.224578857421875, -0.2032470703125, -0.181915283203125, -0.16058349609375, -0.139251708984375, -0.117919921875, -0.096588134765625, -0.07525634765625, -0.053924560546875, -0.0325927734375, -0.011260986328125, 0.01007080078125, 0.031402587890625, 0.052734375, 0.074066162109375, 0.09539794921875, 0.116729736328125, 0.1380615234375, 0.159393310546875, 0.18072509765625, 0.202056884765625, 0.223388671875, 0.244720458984375, 0.26605224609375, 0.287384033203125, 0.3087158203125, 0.330047607421875, 0.35137939453125, 0.372711181640625, 0.39404296875, 0.415374755859375, 0.43670654296875, 0.458038330078125, 0.4793701171875, 0.500701904296875, 0.52203369140625, 0.543365478515625, 0.564697265625, 0.586029052734375, 0.60736083984375, 0.628692626953125, 0.6500244140625, 0.671356201171875, 0.69268798828125, 0.714019775390625, 0.7353515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 8.0, 4.0, 14.0, 22.0, 75.0, 264.0, 1369.0, 819029.0, 226354.0, 1075.0, 224.0, 68.0, 20.0, 13.0, 12.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1201171875, -1.08270263671875, -1.0452880859375, -1.00787353515625, -0.970458984375, -0.93304443359375, -0.8956298828125, -0.85821533203125, -0.82080078125, -0.78338623046875, -0.7459716796875, -0.70855712890625, -0.671142578125, -0.63372802734375, -0.5963134765625, -0.55889892578125, -0.521484375, -0.48406982421875, -0.4466552734375, -0.40924072265625, -0.371826171875, -0.33441162109375, -0.2969970703125, -0.25958251953125, -0.22216796875, -0.18475341796875, -0.1473388671875, -0.10992431640625, -0.072509765625, -0.03509521484375, 0.0023193359375, 0.03973388671875, 0.0771484375, 0.11456298828125, 0.1519775390625, 0.18939208984375, 0.226806640625, 0.26422119140625, 0.3016357421875, 0.33905029296875, 0.37646484375, 0.41387939453125, 0.4512939453125, 0.48870849609375, 0.526123046875, 0.56353759765625, 0.6009521484375, 0.63836669921875, 0.67578125, 0.71319580078125, 0.7506103515625, 0.78802490234375, 0.825439453125, 0.86285400390625, 0.9002685546875, 0.93768310546875, 0.97509765625, 1.01251220703125, 1.0499267578125, 1.08734130859375, 1.124755859375, 1.16217041015625, 1.1995849609375, 1.23699951171875, 1.2744140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 9.0, 23.0, 94.0, 455.0, 341.0, 57.0, 18.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0020198822021484375, -0.001982402056455612, -0.0019449219107627869, -0.0019074417650699615, -0.0018699616193771362, -0.001832481473684311, -0.0017950013279914856, -0.0017575211822986603, -0.001720041036605835, -0.0016825608909130096, -0.0016450807452201843, -0.001607600599527359, -0.0015701204538345337, -0.0015326403081417084, -0.001495160162448883, -0.0014576800167560577, -0.0014201998710632324, -0.001382719725370407, -0.0013452395796775818, -0.0013077594339847565, -0.0012702792882919312, -0.0012327991425991058, -0.0011953189969062805, -0.0011578388512134552, -0.0011203587055206299, -0.0010828785598278046, -0.0010453984141349792, -0.001007918268442154, -0.0009704381227493286, -0.0009329579770565033, -0.000895477831363678, -0.0008579976856708527, -0.0008205175399780273, -0.000783037394285202, -0.0007455572485923767, -0.0007080771028995514, -0.0006705969572067261, -0.0006331168115139008, -0.0005956366658210754, -0.0005581565201282501, -0.0005206763744354248, -0.0004831962287425995, -0.00044571608304977417, -0.00040823593735694885, -0.00037075579166412354, -0.0003332756459712982, -0.0002957955002784729, -0.0002583153545856476, -0.00022083520889282227, -0.00018335506319999695, -0.00014587491750717163, -0.00010839477181434631, -7.0914626121521e-05, -3.343448042869568e-05, 4.045665264129639e-06, 4.1525810956954956e-05, 7.900595664978027e-05, 0.00011648610234260559, 0.0001539662480354309, 0.00019144639372825623, 0.00022892653942108154, 0.00026640668511390686, 0.0003038868308067322, 0.0003413669764995575, 0.0003788471221923828]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 6.0, 12.0, 34.0, 59.0, 120.0, 223.0, 1086.0, 781437.0, 264365.0, 786.0, 234.0, 82.0, 49.0, 27.0, 13.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.564453125, -1.5242919921875, -1.484130859375, -1.4439697265625, -1.40380859375, -1.3636474609375, -1.323486328125, -1.2833251953125, -1.2431640625, -1.2030029296875, -1.162841796875, -1.1226806640625, -1.08251953125, -1.0423583984375, -1.002197265625, -0.9620361328125, -0.921875, -0.8817138671875, -0.841552734375, -0.8013916015625, -0.76123046875, -0.7210693359375, -0.680908203125, -0.6407470703125, -0.6005859375, -0.5604248046875, -0.520263671875, -0.4801025390625, -0.43994140625, -0.3997802734375, -0.359619140625, -0.3194580078125, -0.279296875, -0.2391357421875, -0.198974609375, -0.1588134765625, -0.11865234375, -0.0784912109375, -0.038330078125, 0.0018310546875, 0.0419921875, 0.0821533203125, 0.122314453125, 0.1624755859375, 0.20263671875, 0.2427978515625, 0.282958984375, 0.3231201171875, 0.36328125, 0.4034423828125, 0.443603515625, 0.4837646484375, 0.52392578125, 0.5640869140625, 0.604248046875, 0.6444091796875, 0.6845703125, 0.7247314453125, 0.764892578125, 0.8050537109375, 0.84521484375, 0.8853759765625, 0.925537109375, 0.9656982421875, 1.005859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 10.0, 47.0, 387.0, 487.0, 67.0, 12.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.668212890625, -1.62548828125, -1.582763671875, -1.5400390625, -1.497314453125, -1.45458984375, -1.411865234375, -1.369140625, -1.326416015625, -1.28369140625, -1.240966796875, -1.1982421875, -1.155517578125, -1.11279296875, -1.070068359375, -1.02734375, -0.984619140625, -0.94189453125, -0.899169921875, -0.8564453125, -0.813720703125, -0.77099609375, -0.728271484375, -0.685546875, -0.642822265625, -0.60009765625, -0.557373046875, -0.5146484375, -0.471923828125, -0.42919921875, -0.386474609375, -0.34375, -0.301025390625, -0.25830078125, -0.215576171875, -0.1728515625, -0.130126953125, -0.08740234375, -0.044677734375, -0.001953125, 0.040771484375, 0.08349609375, 0.126220703125, 0.1689453125, 0.211669921875, 0.25439453125, 0.297119140625, 0.33984375, 0.382568359375, 0.42529296875, 0.468017578125, 0.5107421875, 0.553466796875, 0.59619140625, 0.638916015625, 0.681640625, 0.724365234375, 0.76708984375, 0.809814453125, 0.8525390625, 0.895263671875, 0.93798828125, 0.980712890625, 1.0234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 15.0, 208.0, 558.0, 167.0, 39.0, 11.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.039624214172363, -13.681843757629395, -13.324064254760742, -12.966283798217773, -12.608504295349121, -12.250723838806152, -11.8929443359375, -11.535163879394531, -11.177383422851562, -10.819602966308594, -10.461823463439941, -10.104043006896973, -9.74626350402832, -9.388483047485352, -9.030702590942383, -8.67292308807373, -8.315143585205078, -7.957363605499268, -7.599583625793457, -7.241803169250488, -6.884023666381836, -6.526243209838867, -6.168463230133057, -5.810683250427246, -5.4529032707214355, -5.095123291015625, -4.7373433113098145, -4.379563331604004, -4.021782875061035, -3.6640031337738037, -3.306222915649414, -2.9484429359436035, -2.5906620025634766, -2.232882022857666, -1.875101923942566, -1.5173218250274658, -1.1595418453216553, -0.8017618656158447, -0.4439816474914551, -0.08620166778564453, 0.271578311920166, 0.6293583512306213, 0.9871383905410767, 1.3449184894561768, 1.7026984691619873, 2.060478448867798, 2.4182586669921875, 2.776038646697998, 3.1338186264038086, 3.491598606109619, 3.8493785858154297, 4.207159042358398, 4.564938545227051, 4.9227190017700195, 5.28049898147583, 5.638278961181641, 5.996058940887451, 6.353838920593262, 6.711618900299072, 7.069398880004883, 7.427179336547852, 7.784958839416504, 8.142739295959473, 8.500518798828125, 8.858299255371094]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 7.0, 12.0, 6.0, 6.0, 17.0, 15.0, 18.0, 16.0, 18.0, 20.0, 29.0, 21.0, 20.0, 28.0, 41.0, 30.0, 42.0, 28.0, 39.0, 43.0, 32.0, 42.0, 52.0, 45.0, 47.0, 38.0, 38.0, 26.0, 23.0, 34.0, 26.0, 28.0, 11.0, 14.0, 14.0, 12.0, 12.0, 10.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.8073842525482178, -2.716726779937744, -2.6260693073272705, -2.535411834716797, -2.444754123687744, -2.3540966510772705, -2.263439178466797, -2.1727817058563232, -2.0821242332458496, -1.991466760635376, -1.9008092880249023, -1.8101516962051392, -1.7194942235946655, -1.628836750984192, -1.5381791591644287, -1.447521686553955, -1.3568642139434814, -1.2662067413330078, -1.1755492687225342, -1.084891676902771, -0.9942342042922974, -0.9035767316818237, -0.8129191994667053, -0.7222616672515869, -0.6316041946411133, -0.5409467220306396, -0.45028918981552124, -0.3596316874027252, -0.2689741849899292, -0.17831668257713318, -0.08765918016433716, 0.00299835205078125, 0.09365558624267578, 0.1843130886554718, 0.2749705910682678, 0.36562809348106384, 0.45628559589385986, 0.5469430685043335, 0.6376006007194519, 0.7282581329345703, 0.818915605545044, 0.9095730781555176, 1.0002305507659912, 1.0908881425857544, 1.181545615196228, 1.2722030878067017, 1.3628606796264648, 1.4535181522369385, 1.544175624847412, 1.6348330974578857, 1.7254905700683594, 1.8161481618881226, 1.9068056344985962, 1.9974631071090698, 2.088120698928833, 2.1787781715393066, 2.2694356441497803, 2.360093116760254, 2.4507505893707275, 2.541408061981201, 2.632065773010254, 2.7227232456207275, 2.813380718231201, 2.904038190841675, 2.9946956634521484]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 2.0, 3.0, 11.0, 12.0, 7.0, 26.0, 37.0, 55.0, 82.0, 118.0, 191.0, 386.0, 816.0, 2295.0, 9424.0, 100956.0, 4014250.0, 55652.0, 6811.0, 1747.0, 658.0, 326.0, 185.0, 102.0, 52.0, 24.0, 17.0, 13.0, 13.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94189453125, -0.9087295532226562, -0.8755645751953125, -0.8423995971679688, -0.809234619140625, -0.7760696411132812, -0.7429046630859375, -0.7097396850585938, -0.67657470703125, -0.6434097290039062, -0.6102447509765625, -0.5770797729492188, -0.543914794921875, -0.5107498168945312, -0.4775848388671875, -0.44441986083984375, -0.4112548828125, -0.37808990478515625, -0.3449249267578125, -0.31175994873046875, -0.278594970703125, -0.24542999267578125, -0.2122650146484375, -0.17910003662109375, -0.14593505859375, -0.11277008056640625, -0.0796051025390625, -0.04644012451171875, -0.013275146484375, 0.01988983154296875, 0.0530548095703125, 0.08621978759765625, 0.119384765625, 0.15254974365234375, 0.1857147216796875, 0.21887969970703125, 0.252044677734375, 0.28520965576171875, 0.3183746337890625, 0.35153961181640625, 0.38470458984375, 0.41786956787109375, 0.4510345458984375, 0.48419952392578125, 0.517364501953125, 0.5505294799804688, 0.5836944580078125, 0.6168594360351562, 0.6500244140625, 0.6831893920898438, 0.7163543701171875, 0.7495193481445312, 0.782684326171875, 0.8158493041992188, 0.8490142822265625, 0.8821792602539062, 0.91534423828125, 0.9485092163085938, 0.9816741943359375, 1.0148391723632812, 1.048004150390625, 1.0811691284179688, 1.1143341064453125, 1.1474990844726562, 1.1806640625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 7.0, 10.0, 14.0, 27.0, 34.0, 34.0, 51.0, 58.0, 57.0, 78.0, 99.0, 90.0, 87.0, 72.0, 77.0, 55.0, 53.0, 32.0, 25.0, 17.0, 18.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.36423492431640625, -0.3542022705078125, -0.34416961669921875, -0.334136962890625, -0.32410430908203125, -0.3140716552734375, -0.30403900146484375, -0.29400634765625, -0.28397369384765625, -0.2739410400390625, -0.26390838623046875, -0.253875732421875, -0.24384307861328125, -0.2338104248046875, -0.22377777099609375, -0.2137451171875, -0.20371246337890625, -0.1936798095703125, -0.18364715576171875, -0.173614501953125, -0.16358184814453125, -0.1535491943359375, -0.14351654052734375, -0.13348388671875, -0.12345123291015625, -0.1134185791015625, -0.10338592529296875, -0.093353271484375, -0.08332061767578125, -0.0732879638671875, -0.06325531005859375, -0.05322265625, -0.04319000244140625, -0.0331573486328125, -0.02312469482421875, -0.013092041015625, -0.00305938720703125, 0.0069732666015625, 0.01700592041015625, 0.02703857421875, 0.03707122802734375, 0.0471038818359375, 0.05713653564453125, 0.067169189453125, 0.07720184326171875, 0.0872344970703125, 0.09726715087890625, 0.1072998046875, 0.11733245849609375, 0.1273651123046875, 0.13739776611328125, 0.147430419921875, 0.15746307373046875, 0.1674957275390625, 0.17752838134765625, 0.18756103515625, 0.19759368896484375, 0.2076263427734375, 0.21765899658203125, 0.227691650390625, 0.23772430419921875, 0.2477569580078125, 0.25778961181640625, 0.267822265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 8.0, 12.0, 9.0, 10.0, 9.0, 20.0, 18.0, 29.0, 38.0, 58.0, 67.0, 100.0, 172.0, 271.0, 544.0, 1136.0, 2979.0, 11607.0, 128478.0, 3969921.0, 65629.0, 8463.0, 2468.0, 1040.0, 483.0, 246.0, 160.0, 103.0, 60.0, 41.0, 29.0, 16.0, 11.0, 16.0, 12.0, 12.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86474609375, -0.8403167724609375, -0.815887451171875, -0.7914581298828125, -0.76702880859375, -0.7425994873046875, -0.718170166015625, -0.6937408447265625, -0.6693115234375, -0.6448822021484375, -0.620452880859375, -0.5960235595703125, -0.57159423828125, -0.5471649169921875, -0.522735595703125, -0.4983062744140625, -0.473876953125, -0.4494476318359375, -0.425018310546875, -0.4005889892578125, -0.37615966796875, -0.3517303466796875, -0.327301025390625, -0.3028717041015625, -0.2784423828125, -0.2540130615234375, -0.229583740234375, -0.2051544189453125, -0.18072509765625, -0.1562957763671875, -0.131866455078125, -0.1074371337890625, -0.0830078125, -0.0585784912109375, -0.034149169921875, -0.0097198486328125, 0.01470947265625, 0.0391387939453125, 0.063568115234375, 0.0879974365234375, 0.1124267578125, 0.1368560791015625, 0.161285400390625, 0.1857147216796875, 0.21014404296875, 0.2345733642578125, 0.259002685546875, 0.2834320068359375, 0.307861328125, 0.3322906494140625, 0.356719970703125, 0.3811492919921875, 0.40557861328125, 0.4300079345703125, 0.454437255859375, 0.4788665771484375, 0.5032958984375, 0.5277252197265625, 0.552154541015625, 0.5765838623046875, 0.60101318359375, 0.6254425048828125, 0.649871826171875, 0.6743011474609375, 0.69873046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 12.0, 18.0, 24.0, 56.0, 235.0, 2617.0, 867.0, 142.0, 48.0, 19.0, 14.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.697265625, -0.6826953887939453, -0.6681251525878906, -0.6535549163818359, -0.6389846801757812, -0.6244144439697266, -0.6098442077636719, -0.5952739715576172, -0.5807037353515625, -0.5661334991455078, -0.5515632629394531, -0.5369930267333984, -0.5224227905273438, -0.5078525543212891, -0.4932823181152344, -0.4787120819091797, -0.464141845703125, -0.4495716094970703, -0.4350013732910156, -0.42043113708496094, -0.40586090087890625, -0.39129066467285156, -0.3767204284667969, -0.3621501922607422, -0.3475799560546875, -0.3330097198486328, -0.3184394836425781, -0.30386924743652344, -0.28929901123046875, -0.27472877502441406, -0.2601585388183594, -0.2455883026123047, -0.23101806640625, -0.2164478302001953, -0.20187759399414062, -0.18730735778808594, -0.17273712158203125, -0.15816688537597656, -0.14359664916992188, -0.1290264129638672, -0.1144561767578125, -0.09988594055175781, -0.08531570434570312, -0.07074546813964844, -0.05617523193359375, -0.04160499572753906, -0.027034759521484375, -0.012464523315429688, 0.002105712890625, 0.016675949096679688, 0.031246185302734375, 0.04581642150878906, 0.06038665771484375, 0.07495689392089844, 0.08952713012695312, 0.10409736633300781, 0.1186676025390625, 0.1332378387451172, 0.14780807495117188, 0.16237831115722656, 0.17694854736328125, 0.19151878356933594, 0.20608901977539062, 0.2206592559814453, 0.2352294921875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 10.0, 16.0, 44.0, 100.0, 210.0, 298.0, 196.0, 75.0, 29.0, 5.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5799061059951782, -1.5246837139129639, -1.469461441040039, -1.4142390489578247, -1.3590166568756104, -1.303794264793396, -1.2485718727111816, -1.1933495998382568, -1.1381272077560425, -1.0829048156738281, -1.0276825428009033, -0.972460150718689, -0.9172377586364746, -0.8620153665542603, -0.8067930340766907, -0.7515707015991211, -0.6963483095169067, -0.6411259174346924, -0.5859035849571228, -0.5306812524795532, -0.47545886039733887, -0.4202364981174469, -0.36501413583755493, -0.30979177355766296, -0.254569411277771, -0.19934704899787903, -0.14412468671798706, -0.08890232443809509, -0.033679962158203125, 0.021542400121688843, 0.07676476240158081, 0.13198712468147278, 0.1872096061706543, 0.24243196845054626, 0.29765433073043823, 0.3528766930103302, 0.40809905529022217, 0.46332141757011414, 0.5185437798500061, 0.5737661123275757, 0.62898850440979, 0.6842108964920044, 0.739433228969574, 0.7946555614471436, 0.8498779535293579, 0.9051003456115723, 0.9603226780891418, 1.0155450105667114, 1.0707674026489258, 1.1259897947311401, 1.1812121868133545, 1.2364344596862793, 1.2916568517684937, 1.346879243850708, 1.4021015167236328, 1.4573239088058472, 1.5125463008880615, 1.5677686929702759, 1.6229910850524902, 1.678213357925415, 1.7334357500076294, 1.7886581420898438, 1.8438804149627686, 1.899102807044983, 1.9543251991271973]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 4.0, 3.0, 4.0, 6.0, 20.0, 14.0, 22.0, 34.0, 32.0, 40.0, 40.0, 43.0, 60.0, 70.0, 57.0, 58.0, 55.0, 56.0, 62.0, 51.0, 51.0, 45.0, 44.0, 31.0, 17.0, 18.0, 16.0, 7.0, 15.0, 6.0, 8.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.018858790397644, -0.9912204742431641, -0.9635821580886841, -0.9359437823295593, -0.9083054661750793, -0.8806671500205994, -0.8530288338661194, -0.8253904581069946, -0.7977521419525146, -0.7701138257980347, -0.7424755096435547, -0.7148371338844299, -0.68719881772995, -0.65956050157547, -0.63192218542099, -0.6042838096618652, -0.5766454935073853, -0.5490071773529053, -0.5213688611984253, -0.4937305152416229, -0.46609216928482056, -0.4384538531303406, -0.4108155369758606, -0.3831771910190582, -0.35553890466690063, -0.32790058851242065, -0.3002622425556183, -0.2726239264011383, -0.24498558044433594, -0.21734726428985596, -0.18970893323421478, -0.1620706021785736, -0.13443225622177124, -0.10679392516613007, -0.07915559411048889, -0.051517270505428314, -0.02387893944978714, 0.0037593841552734375, 0.03139771521091461, 0.059036046266555786, 0.08667437732219696, 0.11431270837783813, 0.1419510394334793, 0.16958937048912048, 0.19722768664360046, 0.22486601769924164, 0.2525043487548828, 0.2801426649093628, 0.30778101086616516, 0.33541932702064514, 0.3630576729774475, 0.3906959891319275, 0.41833433508872986, 0.44597265124320984, 0.4736109972000122, 0.5012493133544922, 0.5288876295089722, 0.5565259456634521, 0.5841642618179321, 0.6118026375770569, 0.6394409537315369, 0.6670792698860168, 0.6947175860404968, 0.7223559617996216, 0.7499942779541016]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 9.0, 4.0, 3.0, 15.0, 16.0, 20.0, 41.0, 76.0, 132.0, 205.0, 402.0, 842.0, 2593.0, 12676.0, 103998.0, 770211.0, 136763.0, 15650.0, 3002.0, 1009.0, 375.0, 208.0, 107.0, 78.0, 53.0, 31.0, 16.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96435546875, -0.9356155395507812, -0.9068756103515625, -0.8781356811523438, -0.849395751953125, -0.8206558227539062, -0.7919158935546875, -0.7631759643554688, -0.73443603515625, -0.7056961059570312, -0.6769561767578125, -0.6482162475585938, -0.619476318359375, -0.5907363891601562, -0.5619964599609375, -0.5332565307617188, -0.5045166015625, -0.47577667236328125, -0.4470367431640625, -0.41829681396484375, -0.389556884765625, -0.36081695556640625, -0.3320770263671875, -0.30333709716796875, -0.27459716796875, -0.24585723876953125, -0.2171173095703125, -0.18837738037109375, -0.159637451171875, -0.13089752197265625, -0.1021575927734375, -0.07341766357421875, -0.044677734375, -0.01593780517578125, 0.0128021240234375, 0.04154205322265625, 0.070281982421875, 0.09902191162109375, 0.1277618408203125, 0.15650177001953125, 0.18524169921875, 0.21398162841796875, 0.2427215576171875, 0.27146148681640625, 0.300201416015625, 0.32894134521484375, 0.3576812744140625, 0.38642120361328125, 0.4151611328125, 0.44390106201171875, 0.4726409912109375, 0.5013809204101562, 0.530120849609375, 0.5588607788085938, 0.5876007080078125, 0.6163406372070312, 0.64508056640625, 0.6738204956054688, 0.7025604248046875, 0.7313003540039062, 0.760040283203125, 0.7887802124023438, 0.8175201416015625, 0.8462600708007812, 0.875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 13.0, 19.0, 25.0, 41.0, 46.0, 57.0, 67.0, 75.0, 106.0, 103.0, 74.0, 91.0, 70.0, 68.0, 50.0, 33.0, 30.0, 16.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.38896942138671875, -0.3782806396484375, -0.36759185791015625, -0.356903076171875, -0.34621429443359375, -0.3355255126953125, -0.32483673095703125, -0.31414794921875, -0.30345916748046875, -0.2927703857421875, -0.28208160400390625, -0.271392822265625, -0.26070404052734375, -0.2500152587890625, -0.23932647705078125, -0.2286376953125, -0.21794891357421875, -0.2072601318359375, -0.19657135009765625, -0.185882568359375, -0.17519378662109375, -0.1645050048828125, -0.15381622314453125, -0.14312744140625, -0.13243865966796875, -0.1217498779296875, -0.11106109619140625, -0.100372314453125, -0.08968353271484375, -0.0789947509765625, -0.06830596923828125, -0.0576171875, -0.04692840576171875, -0.0362396240234375, -0.02555084228515625, -0.014862060546875, -0.00417327880859375, 0.0065155029296875, 0.01720428466796875, 0.02789306640625, 0.03858184814453125, 0.0492706298828125, 0.05995941162109375, 0.070648193359375, 0.08133697509765625, 0.0920257568359375, 0.10271453857421875, 0.1134033203125, 0.12409210205078125, 0.1347808837890625, 0.14546966552734375, 0.156158447265625, 0.16684722900390625, 0.1775360107421875, 0.18822479248046875, 0.19891357421875, 0.20960235595703125, 0.2202911376953125, 0.23097991943359375, 0.241668701171875, 0.25235748291015625, 0.2630462646484375, 0.27373504638671875, 0.284423828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 8.0, 3.0, 9.0, 9.0, 5.0, 14.0, 18.0, 40.0, 57.0, 68.0, 107.0, 166.0, 277.0, 492.0, 1132.0, 3168.0, 10520.0, 47042.0, 306125.0, 558289.0, 94188.0, 18367.0, 4950.0, 1797.0, 707.0, 356.0, 181.0, 135.0, 80.0, 57.0, 38.0, 46.0, 31.0, 17.0, 8.0, 7.0, 9.0, 5.0, 3.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46533203125, -0.45041656494140625, -0.4355010986328125, -0.42058563232421875, -0.405670166015625, -0.39075469970703125, -0.3758392333984375, -0.36092376708984375, -0.34600830078125, -0.33109283447265625, -0.3161773681640625, -0.30126190185546875, -0.286346435546875, -0.27143096923828125, -0.2565155029296875, -0.24160003662109375, -0.2266845703125, -0.21176910400390625, -0.1968536376953125, -0.18193817138671875, -0.167022705078125, -0.15210723876953125, -0.1371917724609375, -0.12227630615234375, -0.10736083984375, -0.09244537353515625, -0.0775299072265625, -0.06261444091796875, -0.047698974609375, -0.03278350830078125, -0.0178680419921875, -0.00295257568359375, 0.011962890625, 0.02687835693359375, 0.0417938232421875, 0.05670928955078125, 0.071624755859375, 0.08654022216796875, 0.1014556884765625, 0.11637115478515625, 0.13128662109375, 0.14620208740234375, 0.1611175537109375, 0.17603302001953125, 0.190948486328125, 0.20586395263671875, 0.2207794189453125, 0.23569488525390625, 0.2506103515625, 0.26552581787109375, 0.2804412841796875, 0.29535675048828125, 0.310272216796875, 0.32518768310546875, 0.3401031494140625, 0.35501861572265625, 0.36993408203125, 0.38484954833984375, 0.3997650146484375, 0.41468048095703125, 0.429595947265625, 0.44451141357421875, 0.4594268798828125, 0.47434234619140625, 0.4892578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 3.0, 7.0, 9.0, 15.0, 13.0, 9.0, 21.0, 20.0, 22.0, 30.0, 36.0, 43.0, 33.0, 52.0, 40.0, 37.0, 46.0, 53.0, 40.0, 54.0, 49.0, 41.0, 41.0, 47.0, 28.0, 36.0, 25.0, 21.0, 27.0, 19.0, 17.0, 11.0, 15.0, 10.0, 3.0, 10.0, 9.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.629425048828125, -0.60845947265625, -0.587493896484375, -0.5665283203125, -0.545562744140625, -0.52459716796875, -0.503631591796875, -0.482666015625, -0.461700439453125, -0.44073486328125, -0.419769287109375, -0.3988037109375, -0.377838134765625, -0.35687255859375, -0.335906982421875, -0.31494140625, -0.293975830078125, -0.27301025390625, -0.252044677734375, -0.2310791015625, -0.210113525390625, -0.18914794921875, -0.168182373046875, -0.147216796875, -0.126251220703125, -0.10528564453125, -0.084320068359375, -0.0633544921875, -0.042388916015625, -0.02142333984375, -0.000457763671875, 0.0205078125, 0.041473388671875, 0.06243896484375, 0.083404541015625, 0.1043701171875, 0.125335693359375, 0.14630126953125, 0.167266845703125, 0.188232421875, 0.209197998046875, 0.23016357421875, 0.251129150390625, 0.2720947265625, 0.293060302734375, 0.31402587890625, 0.334991455078125, 0.35595703125, 0.376922607421875, 0.39788818359375, 0.418853759765625, 0.4398193359375, 0.460784912109375, 0.48175048828125, 0.502716064453125, 0.523681640625, 0.544647216796875, 0.56561279296875, 0.586578369140625, 0.6075439453125, 0.628509521484375, 0.64947509765625, 0.670440673828125, 0.69140625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 6.0, 14.0, 25.0, 30.0, 43.0, 52.0, 75.0, 114.0, 130.0, 282.0, 479.0, 1260.0, 5710.0, 59262.0, 704925.0, 256334.0, 15674.0, 2383.0, 790.0, 380.0, 209.0, 116.0, 82.0, 53.0, 45.0, 21.0, 16.0, 7.0, 7.0, 4.0, 10.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193603515625, -0.18686866760253906, -0.18013381958007812, -0.1733989715576172, -0.16666412353515625, -0.1599292755126953, -0.15319442749023438, -0.14645957946777344, -0.1397247314453125, -0.13298988342285156, -0.12625503540039062, -0.11952018737792969, -0.11278533935546875, -0.10605049133300781, -0.09931564331054688, -0.09258079528808594, -0.085845947265625, -0.07911109924316406, -0.07237625122070312, -0.06564140319824219, -0.05890655517578125, -0.05217170715332031, -0.045436859130859375, -0.03870201110839844, -0.0319671630859375, -0.025232315063476562, -0.018497467041015625, -0.011762619018554688, -0.00502777099609375, 0.0017070770263671875, 0.008441925048828125, 0.015176773071289062, 0.02191162109375, 0.028646469116210938, 0.035381317138671875, 0.04211616516113281, 0.04885101318359375, 0.05558586120605469, 0.062320709228515625, 0.06905555725097656, 0.0757904052734375, 0.08252525329589844, 0.08926010131835938, 0.09599494934082031, 0.10272979736328125, 0.10946464538574219, 0.11619949340820312, 0.12293434143066406, 0.129669189453125, 0.13640403747558594, 0.14313888549804688, 0.1498737335205078, 0.15660858154296875, 0.1633434295654297, 0.17007827758789062, 0.17681312561035156, 0.1835479736328125, 0.19028282165527344, 0.19701766967773438, 0.2037525177001953, 0.21048736572265625, 0.2172222137451172, 0.22395706176757812, 0.23069190979003906, 0.2374267578125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 15.0, 31.0, 87.0, 270.0, 358.0, 137.0, 57.0, 24.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008192062377929688, -0.0008028671145439148, -0.0007865279912948608, -0.0007701888680458069, -0.0007538497447967529, -0.000737510621547699, -0.000721171498298645, -0.0007048323750495911, -0.0006884932518005371, -0.0006721541285514832, -0.0006558150053024292, -0.0006394758820533752, -0.0006231367588043213, -0.0006067976355552673, -0.0005904585123062134, -0.0005741193890571594, -0.0005577802658081055, -0.0005414411425590515, -0.0005251020193099976, -0.0005087628960609436, -0.0004924237728118896, -0.0004760846495628357, -0.00045974552631378174, -0.0004434064030647278, -0.00042706727981567383, -0.0004107281565666199, -0.0003943890333175659, -0.00037804991006851196, -0.000361710786819458, -0.00034537166357040405, -0.0003290325403213501, -0.00031269341707229614, -0.0002963542938232422, -0.00028001517057418823, -0.0002636760473251343, -0.0002473369240760803, -0.00023099780082702637, -0.0002146586775779724, -0.00019831955432891846, -0.0001819804310798645, -0.00016564130783081055, -0.0001493021845817566, -0.00013296306133270264, -0.00011662393808364868, -0.00010028481483459473, -8.394569158554077e-05, -6.760656833648682e-05, -5.126744508743286e-05, -3.4928321838378906e-05, -1.858919858932495e-05, -2.250075340270996e-06, 1.4089047908782959e-05, 3.0428171157836914e-05, 4.676729440689087e-05, 6.310641765594482e-05, 7.944554090499878e-05, 9.578466415405273e-05, 0.00011212378740310669, 0.00012846291065216064, 0.0001448020339012146, 0.00016114115715026855, 0.0001774802803993225, 0.00019381940364837646, 0.00021015852689743042, 0.00022649765014648438]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 10.0, 12.0, 26.0, 25.0, 49.0, 83.0, 128.0, 265.0, 568.0, 1418.0, 4315.0, 26251.0, 392611.0, 572882.0, 41242.0, 5591.0, 1690.0, 652.0, 320.0, 159.0, 102.0, 52.0, 34.0, 20.0, 18.0, 7.0, 8.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.189208984375, -0.18270492553710938, -0.17620086669921875, -0.16969680786132812, -0.1631927490234375, -0.15668869018554688, -0.15018463134765625, -0.14368057250976562, -0.137176513671875, -0.13067245483398438, -0.12416839599609375, -0.11766433715820312, -0.1111602783203125, -0.10465621948242188, -0.09815216064453125, -0.09164810180664062, -0.08514404296875, -0.07863998413085938, -0.07213592529296875, -0.06563186645507812, -0.0591278076171875, -0.052623748779296875, -0.04611968994140625, -0.039615631103515625, -0.033111572265625, -0.026607513427734375, -0.02010345458984375, -0.013599395751953125, -0.0070953369140625, -0.000591278076171875, 0.00591278076171875, 0.012416839599609375, 0.0189208984375, 0.025424957275390625, 0.03192901611328125, 0.038433074951171875, 0.0449371337890625, 0.051441192626953125, 0.05794525146484375, 0.06444931030273438, 0.070953369140625, 0.07745742797851562, 0.08396148681640625, 0.09046554565429688, 0.0969696044921875, 0.10347366333007812, 0.10997772216796875, 0.11648178100585938, 0.12298583984375, 0.12948989868164062, 0.13599395751953125, 0.14249801635742188, 0.1490020751953125, 0.15550613403320312, 0.16201019287109375, 0.16851425170898438, 0.175018310546875, 0.18152236938476562, 0.18802642822265625, 0.19453048706054688, 0.2010345458984375, 0.20753860473632812, 0.21404266357421875, 0.22054672241210938, 0.22705078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 7.0, 19.0, 30.0, 53.0, 96.0, 149.0, 202.0, 175.0, 100.0, 71.0, 40.0, 25.0, 10.0, 11.0, 4.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2450103759765625, -0.234649658203125, -0.2242889404296875, -0.21392822265625, -0.2035675048828125, -0.193206787109375, -0.1828460693359375, -0.1724853515625, -0.1621246337890625, -0.151763916015625, -0.1414031982421875, -0.13104248046875, -0.1206817626953125, -0.110321044921875, -0.0999603271484375, -0.089599609375, -0.0792388916015625, -0.068878173828125, -0.0585174560546875, -0.04815673828125, -0.0377960205078125, -0.027435302734375, -0.0170745849609375, -0.0067138671875, 0.0036468505859375, 0.014007568359375, 0.0243682861328125, 0.03472900390625, 0.0450897216796875, 0.055450439453125, 0.0658111572265625, 0.076171875, 0.0865325927734375, 0.096893310546875, 0.1072540283203125, 0.11761474609375, 0.1279754638671875, 0.138336181640625, 0.1486968994140625, 0.1590576171875, 0.1694183349609375, 0.179779052734375, 0.1901397705078125, 0.20050048828125, 0.2108612060546875, 0.221221923828125, 0.2315826416015625, 0.241943359375, 0.2523040771484375, 0.262664794921875, 0.2730255126953125, 0.28338623046875, 0.2937469482421875, 0.304107666015625, 0.3144683837890625, 0.3248291015625, 0.3351898193359375, 0.345550537109375, 0.3559112548828125, 0.36627197265625, 0.3766326904296875, 0.386993408203125, 0.3973541259765625, 0.40771484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 19.0, 145.0, 495.0, 259.0, 62.0, 14.0, 9.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.169074058532715, -6.876773834228516, -6.584473133087158, -6.292172431945801, -5.999872207641602, -5.707571983337402, -5.415271282196045, -5.1229705810546875, -4.830670356750488, -4.538370132446289, -4.246069431304932, -3.9537689685821533, -3.661468505859375, -3.3691680431365967, -3.0768675804138184, -2.78456711769104, -2.4922666549682617, -2.1999661922454834, -1.907665729522705, -1.6153652667999268, -1.3230648040771484, -1.0307643413543701, -0.7384638786315918, -0.4461634159088135, -0.15386295318603516, 0.13843750953674316, 0.4307379722595215, 0.7230384349822998, 1.0153388977050781, 1.3076393604278564, 1.5999398231506348, 1.892240285873413, 2.184539794921875, 2.4768402576446533, 2.7691407203674316, 3.06144118309021, 3.3537416458129883, 3.6460421085357666, 3.938342571258545, 4.230643272399902, 4.522943496704102, 4.815243721008301, 5.107544422149658, 5.399845123291016, 5.692145347595215, 5.984445571899414, 6.2767462730407715, 6.569046974182129, 6.861347198486328, 7.153647422790527, 7.445948123931885, 7.738248825073242, 8.030549049377441, 8.32284927368164, 8.615150451660156, 8.907450675964355, 9.199750900268555, 9.492051124572754, 9.784351348876953, 10.076652526855469, 10.368952751159668, 10.661252975463867, 10.953554153442383, 11.245854377746582, 11.538154602050781]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 1.0, 2.0, 9.0, 7.0, 7.0, 7.0, 8.0, 10.0, 9.0, 13.0, 16.0, 21.0, 20.0, 16.0, 37.0, 26.0, 27.0, 34.0, 33.0, 34.0, 31.0, 43.0, 34.0, 43.0, 49.0, 40.0, 36.0, 45.0, 29.0, 30.0, 44.0, 25.0, 23.0, 21.0, 32.0, 22.0, 17.0, 20.0, 14.0, 16.0, 10.0, 11.0, 7.0, 3.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.585902214050293, -2.4994189739227295, -2.412935495376587, -2.3264522552490234, -2.239968776702881, -2.1534855365753174, -2.067002296447754, -1.9805189371109009, -1.8940355777740479, -1.8075522184371948, -1.7210688591003418, -1.6345856189727783, -1.5481022596359253, -1.4616189002990723, -1.3751356601715088, -1.2886523008346558, -1.2021689414978027, -1.1156855821609497, -1.0292022228240967, -0.9427189826965332, -0.8562356233596802, -0.7697522640228271, -0.6832689642906189, -0.5967856645584106, -0.5103023052215576, -0.423818975687027, -0.33733564615249634, -0.2508523166179657, -0.16436898708343506, -0.07788565754890442, 0.00859767198562622, 0.09508097171783447, 0.1815643310546875, 0.26804766058921814, 0.3545309901237488, 0.4410143196582794, 0.5274976491928101, 0.6139810085296631, 0.7004643082618713, 0.7869476079940796, 0.8734309673309326, 0.9599143266677856, 1.0463976860046387, 1.1328809261322021, 1.2193642854690552, 1.3058476448059082, 1.3923308849334717, 1.4788142442703247, 1.5652976036071777, 1.6517809629440308, 1.7382643222808838, 1.8247475624084473, 1.9112309217453003, 1.9977142810821533, 2.084197521209717, 2.1706809997558594, 2.257164239883423, 2.3436474800109863, 2.430130958557129, 2.5166141986846924, 2.603097438812256, 2.6895809173583984, 2.776064157485962, 2.8625473976135254, 2.949030876159668]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 9.0, 8.0, 10.0, 18.0, 39.0, 45.0, 70.0, 120.0, 230.0, 444.0, 1026.0, 2250.0, 6045.0, 20469.0, 285254.0, 3832270.0, 32991.0, 7907.0, 2721.0, 1178.0, 531.0, 254.0, 146.0, 85.0, 50.0, 32.0, 21.0, 21.0, 12.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1298828125, -1.0947265625, -1.0595703125, -1.0244140625, -0.9892578125, -0.9541015625, -0.9189453125, -0.8837890625, -0.8486328125, -0.8134765625, -0.7783203125, -0.7431640625, -0.7080078125, -0.6728515625, -0.6376953125, -0.6025390625, -0.5673828125, -0.5322265625, -0.4970703125, -0.4619140625, -0.4267578125, -0.3916015625, -0.3564453125, -0.3212890625, -0.2861328125, -0.2509765625, -0.2158203125, -0.1806640625, -0.1455078125, -0.1103515625, -0.0751953125, -0.0400390625, -0.0048828125, 0.0302734375, 0.0654296875, 0.1005859375, 0.1357421875, 0.1708984375, 0.2060546875, 0.2412109375, 0.2763671875, 0.3115234375, 0.3466796875, 0.3818359375, 0.4169921875, 0.4521484375, 0.4873046875, 0.5224609375, 0.5576171875, 0.5927734375, 0.6279296875, 0.6630859375, 0.6982421875, 0.7333984375, 0.7685546875, 0.8037109375, 0.8388671875, 0.8740234375, 0.9091796875, 0.9443359375, 0.9794921875, 1.0146484375, 1.0498046875, 1.0849609375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 12.0, 19.0, 12.0, 22.0, 40.0, 40.0, 56.0, 54.0, 64.0, 75.0, 80.0, 79.0, 82.0, 77.0, 59.0, 61.0, 49.0, 38.0, 31.0, 23.0, 12.0, 8.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358154296875, -0.3479766845703125, -0.337799072265625, -0.3276214599609375, -0.31744384765625, -0.3072662353515625, -0.297088623046875, -0.2869110107421875, -0.2767333984375, -0.2665557861328125, -0.256378173828125, -0.2462005615234375, -0.23602294921875, -0.2258453369140625, -0.215667724609375, -0.2054901123046875, -0.1953125, -0.1851348876953125, -0.174957275390625, -0.1647796630859375, -0.15460205078125, -0.1444244384765625, -0.134246826171875, -0.1240692138671875, -0.1138916015625, -0.1037139892578125, -0.093536376953125, -0.0833587646484375, -0.07318115234375, -0.0630035400390625, -0.052825927734375, -0.0426483154296875, -0.032470703125, -0.0222930908203125, -0.012115478515625, -0.0019378662109375, 0.00823974609375, 0.0184173583984375, 0.028594970703125, 0.0387725830078125, 0.0489501953125, 0.0591278076171875, 0.069305419921875, 0.0794830322265625, 0.08966064453125, 0.0998382568359375, 0.110015869140625, 0.1201934814453125, 0.13037109375, 0.1405487060546875, 0.150726318359375, 0.1609039306640625, 0.17108154296875, 0.1812591552734375, 0.191436767578125, 0.2016143798828125, 0.2117919921875, 0.2219696044921875, 0.232147216796875, 0.2423248291015625, 0.25250244140625, 0.2626800537109375, 0.272857666015625, 0.2830352783203125, 0.293212890625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 8.0, 11.0, 15.0, 24.0, 28.0, 36.0, 62.0, 94.0, 154.0, 354.0, 685.0, 1738.0, 6766.0, 61963.0, 4047341.0, 64561.0, 7075.0, 1782.0, 734.0, 370.0, 158.0, 110.0, 58.0, 39.0, 36.0, 19.0, 19.0, 16.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93798828125, -0.9061965942382812, -0.8744049072265625, -0.8426132202148438, -0.810821533203125, -0.7790298461914062, -0.7472381591796875, -0.7154464721679688, -0.68365478515625, -0.6518630981445312, -0.6200714111328125, -0.5882797241210938, -0.556488037109375, -0.5246963500976562, -0.4929046630859375, -0.46111297607421875, -0.4293212890625, -0.39752960205078125, -0.3657379150390625, -0.33394622802734375, -0.302154541015625, -0.27036285400390625, -0.2385711669921875, -0.20677947998046875, -0.17498779296875, -0.14319610595703125, -0.1114044189453125, -0.07961273193359375, -0.047821044921875, -0.01602935791015625, 0.0157623291015625, 0.04755401611328125, 0.079345703125, 0.11113739013671875, 0.1429290771484375, 0.17472076416015625, 0.206512451171875, 0.23830413818359375, 0.2700958251953125, 0.30188751220703125, 0.33367919921875, 0.36547088623046875, 0.3972625732421875, 0.42905426025390625, 0.460845947265625, 0.49263763427734375, 0.5244293212890625, 0.5562210083007812, 0.5880126953125, 0.6198043823242188, 0.6515960693359375, 0.6833877563476562, 0.715179443359375, 0.7469711303710938, 0.7787628173828125, 0.8105545043945312, 0.84234619140625, 0.8741378784179688, 0.9059295654296875, 0.9377212524414062, 0.969512939453125, 1.0013046264648438, 1.0330963134765625, 1.0648880004882812, 1.0966796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 9.0, 27.0, 21.0, 93.0, 447.0, 3199.0, 152.0, 56.0, 22.0, 23.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.374267578125, -0.3557853698730469, -0.33730316162109375, -0.3188209533691406, -0.3003387451171875, -0.2818565368652344, -0.26337432861328125, -0.24489212036132812, -0.226409912109375, -0.20792770385742188, -0.18944549560546875, -0.17096328735351562, -0.1524810791015625, -0.13399887084960938, -0.11551666259765625, -0.09703445434570312, -0.07855224609375, -0.060070037841796875, -0.04158782958984375, -0.023105621337890625, -0.0046234130859375, 0.013858795166015625, 0.03234100341796875, 0.050823211669921875, 0.069305419921875, 0.08778762817382812, 0.10626983642578125, 0.12475204467773438, 0.1432342529296875, 0.16171646118164062, 0.18019866943359375, 0.19868087768554688, 0.2171630859375, 0.23564529418945312, 0.25412750244140625, 0.2726097106933594, 0.2910919189453125, 0.3095741271972656, 0.32805633544921875, 0.3465385437011719, 0.365020751953125, 0.3835029602050781, 0.40198516845703125, 0.4204673767089844, 0.4389495849609375, 0.4574317932128906, 0.47591400146484375, 0.4943962097167969, 0.51287841796875, 0.5313606262207031, 0.5498428344726562, 0.5683250427246094, 0.5868072509765625, 0.6052894592285156, 0.6237716674804688, 0.6422538757324219, 0.660736083984375, 0.6792182922363281, 0.6977005004882812, 0.7161827087402344, 0.7346649169921875, 0.7531471252441406, 0.7716293334960938, 0.7901115417480469, 0.80859375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 14.0, 30.0, 147.0, 493.0, 225.0, 59.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8485846519470215, -1.7629787921905518, -1.6773728132247925, -1.5917669534683228, -1.506161093711853, -1.4205551147460938, -1.334949254989624, -1.2493433952331543, -1.1637375354766846, -1.0781316757202148, -0.9925257563591003, -0.9069198369979858, -0.8213139772415161, -0.7357080578804016, -0.6501021385192871, -0.5644962787628174, -0.4788902997970581, -0.393284410238266, -0.3076785206794739, -0.22207260131835938, -0.13646671175956726, -0.050860822200775146, 0.034745097160339355, 0.12035095691680908, 0.20595687627792358, 0.2915627658367157, 0.3771686553955078, 0.4627745747566223, 0.5483804941177368, 0.6339863538742065, 0.719592273235321, 0.8051981329917908, 0.8908040523529053, 0.9764099717140198, 1.0620158910751343, 1.147621750831604, 1.2332276105880737, 1.318833589553833, 1.4044394493103027, 1.4900453090667725, 1.5756511688232422, 1.661257028579712, 1.7468630075454712, 1.832468867301941, 1.9180747270584106, 2.00368070602417, 2.0892865657806396, 2.1748924255371094, 2.260498523712158, 2.346104383468628, 2.4317102432250977, 2.5173163414001465, 2.602922201156616, 2.688528060913086, 2.7741339206695557, 2.8597397804260254, 2.945345640182495, 3.030951499938965, 3.1165573596954346, 3.2021632194519043, 3.287769317626953, 3.373375177383423, 3.4589810371398926, 3.5445868968963623, 3.630192756652832]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 13.0, 5.0, 10.0, 16.0, 24.0, 42.0, 49.0, 54.0, 47.0, 68.0, 78.0, 64.0, 80.0, 61.0, 58.0, 65.0, 60.0, 35.0, 30.0, 38.0, 28.0, 20.0, 13.0, 8.0, 11.0, 12.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.15854811668396, -1.1239628791809082, -1.089377522468567, -1.0547922849655151, -1.0202069282531738, -0.9856216907501221, -0.9510364532470703, -0.9164511561393738, -0.8818658590316772, -0.8472805619239807, -0.8126952648162842, -0.7781100273132324, -0.7435247302055359, -0.7089394330978394, -0.6743541955947876, -0.6397688984870911, -0.6051836013793945, -0.570598304271698, -0.5360130071640015, -0.5014277696609497, -0.4668424725532532, -0.43225717544555664, -0.3976719081401825, -0.36308664083480835, -0.3285013437271118, -0.2939160466194153, -0.25933077931404114, -0.2247454971075058, -0.19016021490097046, -0.15557493269443512, -0.12098965048789978, -0.08640436828136444, -0.0518190860748291, -0.017233803868293762, 0.017351478338241577, 0.051936760544776917, 0.08652204275131226, 0.1211073249578476, 0.15569260716438293, 0.19027788937091827, 0.2248631715774536, 0.25944846868515015, 0.2940337359905243, 0.32861900329589844, 0.36320430040359497, 0.3977895975112915, 0.43237486481666565, 0.4669601321220398, 0.5015454292297363, 0.5361307263374329, 0.5707160234451294, 0.6053012609481812, 0.6398865580558777, 0.6744718551635742, 0.709057092666626, 0.7436423897743225, 0.778227686882019, 0.8128129839897156, 0.8473982810974121, 0.8819835186004639, 0.9165688157081604, 0.9511541128158569, 0.9857393503189087, 1.02032470703125, 1.0549099445343018]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 7.0, 11.0, 22.0, 29.0, 49.0, 66.0, 114.0, 191.0, 360.0, 684.0, 1570.0, 4413.0, 15428.0, 69977.0, 416285.0, 440600.0, 74658.0, 16097.0, 4644.0, 1748.0, 754.0, 330.0, 176.0, 119.0, 84.0, 43.0, 30.0, 20.0, 12.0, 11.0, 1.0, 3.0, 5.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.705078125, -0.6849441528320312, -0.6648101806640625, -0.6446762084960938, -0.624542236328125, -0.6044082641601562, -0.5842742919921875, -0.5641403198242188, -0.54400634765625, -0.5238723754882812, -0.5037384033203125, -0.48360443115234375, -0.463470458984375, -0.44333648681640625, -0.4232025146484375, -0.40306854248046875, -0.3829345703125, -0.36280059814453125, -0.3426666259765625, -0.32253265380859375, -0.302398681640625, -0.28226470947265625, -0.2621307373046875, -0.24199676513671875, -0.22186279296875, -0.20172882080078125, -0.1815948486328125, -0.16146087646484375, -0.141326904296875, -0.12119293212890625, -0.1010589599609375, -0.08092498779296875, -0.060791015625, -0.04065704345703125, -0.0205230712890625, -0.00038909912109375, 0.019744873046875, 0.03987884521484375, 0.0600128173828125, 0.08014678955078125, 0.10028076171875, 0.12041473388671875, 0.1405487060546875, 0.16068267822265625, 0.180816650390625, 0.20095062255859375, 0.2210845947265625, 0.24121856689453125, 0.2613525390625, 0.28148651123046875, 0.3016204833984375, 0.32175445556640625, 0.341888427734375, 0.36202239990234375, 0.3821563720703125, 0.40229034423828125, 0.42242431640625, 0.44255828857421875, 0.4626922607421875, 0.48282623291015625, 0.502960205078125, 0.5230941772460938, 0.5432281494140625, 0.5633621215820312, 0.58349609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 10.0, 10.0, 17.0, 21.0, 28.0, 40.0, 46.0, 50.0, 60.0, 63.0, 72.0, 76.0, 75.0, 82.0, 83.0, 52.0, 53.0, 33.0, 48.0, 32.0, 23.0, 12.0, 6.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.33028411865234375, -0.3202362060546875, -0.31018829345703125, -0.300140380859375, -0.29009246826171875, -0.2800445556640625, -0.26999664306640625, -0.25994873046875, -0.24990081787109375, -0.2398529052734375, -0.22980499267578125, -0.219757080078125, -0.20970916748046875, -0.1996612548828125, -0.18961334228515625, -0.1795654296875, -0.16951751708984375, -0.1594696044921875, -0.14942169189453125, -0.139373779296875, -0.12932586669921875, -0.1192779541015625, -0.10923004150390625, -0.09918212890625, -0.08913421630859375, -0.0790863037109375, -0.06903839111328125, -0.058990478515625, -0.04894256591796875, -0.0388946533203125, -0.02884674072265625, -0.018798828125, -0.00875091552734375, 0.0012969970703125, 0.01134490966796875, 0.021392822265625, 0.03144073486328125, 0.0414886474609375, 0.05153656005859375, 0.06158447265625, 0.07163238525390625, 0.0816802978515625, 0.09172821044921875, 0.101776123046875, 0.11182403564453125, 0.1218719482421875, 0.13191986083984375, 0.1419677734375, 0.15201568603515625, 0.1620635986328125, 0.17211151123046875, 0.182159423828125, 0.19220733642578125, 0.2022552490234375, 0.21230316162109375, 0.22235107421875, 0.23239898681640625, 0.2424468994140625, 0.25249481201171875, 0.262542724609375, 0.27259063720703125, 0.2826385498046875, 0.29268646240234375, 0.302734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 6.0, 10.0, 7.0, 9.0, 20.0, 17.0, 30.0, 49.0, 53.0, 112.0, 167.0, 264.0, 525.0, 893.0, 1907.0, 4621.0, 14690.0, 69489.0, 498534.0, 384432.0, 52984.0, 11962.0, 3970.0, 1698.0, 893.0, 443.0, 271.0, 145.0, 110.0, 59.0, 52.0, 27.0, 22.0, 16.0, 15.0, 7.0, 8.0, 6.0, 5.0, 3.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5576171875, -0.540679931640625, -0.52374267578125, -0.506805419921875, -0.4898681640625, -0.472930908203125, -0.45599365234375, -0.439056396484375, -0.422119140625, -0.405181884765625, -0.38824462890625, -0.371307373046875, -0.3543701171875, -0.337432861328125, -0.32049560546875, -0.303558349609375, -0.28662109375, -0.269683837890625, -0.25274658203125, -0.235809326171875, -0.2188720703125, -0.201934814453125, -0.18499755859375, -0.168060302734375, -0.151123046875, -0.134185791015625, -0.11724853515625, -0.100311279296875, -0.0833740234375, -0.066436767578125, -0.04949951171875, -0.032562255859375, -0.015625, 0.001312255859375, 0.01824951171875, 0.035186767578125, 0.0521240234375, 0.069061279296875, 0.08599853515625, 0.102935791015625, 0.119873046875, 0.136810302734375, 0.15374755859375, 0.170684814453125, 0.1876220703125, 0.204559326171875, 0.22149658203125, 0.238433837890625, 0.25537109375, 0.272308349609375, 0.28924560546875, 0.306182861328125, 0.3231201171875, 0.340057373046875, 0.35699462890625, 0.373931884765625, 0.390869140625, 0.407806396484375, 0.42474365234375, 0.441680908203125, 0.4586181640625, 0.475555419921875, 0.49249267578125, 0.509429931640625, 0.5263671875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 7.0, 6.0, 11.0, 16.0, 21.0, 30.0, 31.0, 39.0, 53.0, 58.0, 59.0, 61.0, 62.0, 55.0, 65.0, 61.0, 68.0, 49.0, 46.0, 40.0, 32.0, 28.0, 18.0, 22.0, 12.0, 9.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.03125, -0.9936676025390625, -0.956085205078125, -0.9185028076171875, -0.88092041015625, -0.8433380126953125, -0.805755615234375, -0.7681732177734375, -0.7305908203125, -0.6930084228515625, -0.655426025390625, -0.6178436279296875, -0.58026123046875, -0.5426788330078125, -0.505096435546875, -0.4675140380859375, -0.429931640625, -0.3923492431640625, -0.354766845703125, -0.3171844482421875, -0.27960205078125, -0.2420196533203125, -0.204437255859375, -0.1668548583984375, -0.1292724609375, -0.0916900634765625, -0.054107666015625, -0.0165252685546875, 0.02105712890625, 0.0586395263671875, 0.096221923828125, 0.1338043212890625, 0.17138671875, 0.2089691162109375, 0.246551513671875, 0.2841339111328125, 0.32171630859375, 0.3592987060546875, 0.396881103515625, 0.4344635009765625, 0.4720458984375, 0.5096282958984375, 0.547210693359375, 0.5847930908203125, 0.62237548828125, 0.6599578857421875, 0.697540283203125, 0.7351226806640625, 0.772705078125, 0.8102874755859375, 0.847869873046875, 0.8854522705078125, 0.92303466796875, 0.9606170654296875, 0.998199462890625, 1.0357818603515625, 1.0733642578125, 1.1109466552734375, 1.148529052734375, 1.1861114501953125, 1.22369384765625, 1.2612762451171875, 1.298858642578125, 1.3364410400390625, 1.3740234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 2.0, 10.0, 14.0, 12.0, 32.0, 28.0, 47.0, 76.0, 158.0, 360.0, 864.0, 2877.0, 20156.0, 597151.0, 408264.0, 14670.0, 2385.0, 755.0, 293.0, 157.0, 89.0, 51.0, 32.0, 10.0, 9.0, 16.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2917671203613281, -0.28202056884765625, -0.2722740173339844, -0.2625274658203125, -0.2527809143066406, -0.24303436279296875, -0.23328781127929688, -0.223541259765625, -0.21379470825195312, -0.20404815673828125, -0.19430160522460938, -0.1845550537109375, -0.17480850219726562, -0.16506195068359375, -0.15531539916992188, -0.14556884765625, -0.13582229614257812, -0.12607574462890625, -0.11632919311523438, -0.1065826416015625, -0.09683609008789062, -0.08708953857421875, -0.07734298706054688, -0.067596435546875, -0.057849884033203125, -0.04810333251953125, -0.038356781005859375, -0.0286102294921875, -0.018863677978515625, -0.00911712646484375, 0.000629425048828125, 0.0103759765625, 0.020122528076171875, 0.02986907958984375, 0.039615631103515625, 0.0493621826171875, 0.059108734130859375, 0.06885528564453125, 0.07860183715820312, 0.088348388671875, 0.09809494018554688, 0.10784149169921875, 0.11758804321289062, 0.1273345947265625, 0.13708114624023438, 0.14682769775390625, 0.15657424926757812, 0.16632080078125, 0.17606735229492188, 0.18581390380859375, 0.19556045532226562, 0.2053070068359375, 0.21505355834960938, 0.22480010986328125, 0.23454666137695312, 0.244293212890625, 0.2540397644042969, 0.26378631591796875, 0.2735328674316406, 0.2832794189453125, 0.2930259704589844, 0.30277252197265625, 0.3125190734863281, 0.322265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 5.0, 9.0, 14.0, 18.0, 36.0, 38.0, 54.0, 67.0, 112.0, 201.0, 156.0, 89.0, 62.0, 43.0, 35.0, 26.0, 14.0, 9.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030612945556640625, -0.0002986006438732147, -0.0002910718321800232, -0.00028354302048683167, -0.00027601420879364014, -0.0002684853971004486, -0.0002609565854072571, -0.00025342777371406555, -0.000245898962020874, -0.0002383701503276825, -0.00023084133863449097, -0.00022331252694129944, -0.0002157837152481079, -0.00020825490355491638, -0.00020072609186172485, -0.00019319728016853333, -0.0001856684684753418, -0.00017813965678215027, -0.00017061084508895874, -0.0001630820333957672, -0.00015555322170257568, -0.00014802441000938416, -0.00014049559831619263, -0.0001329667866230011, -0.00012543797492980957, -0.00011790916323661804, -0.00011038035154342651, -0.00010285153985023499, -9.532272815704346e-05, -8.779391646385193e-05, -8.02651047706604e-05, -7.273629307746887e-05, -6.520748138427734e-05, -5.7678669691085815e-05, -5.014985799789429e-05, -4.262104630470276e-05, -3.509223461151123e-05, -2.7563422918319702e-05, -2.0034611225128174e-05, -1.2505799531936646e-05, -4.976987838745117e-06, 2.551823854446411e-06, 1.008063554763794e-05, 1.7609447240829468e-05, 2.5138258934020996e-05, 3.2667070627212524e-05, 4.019588232040405e-05, 4.772469401359558e-05, 5.525350570678711e-05, 6.278231739997864e-05, 7.031112909317017e-05, 7.78399407863617e-05, 8.536875247955322e-05, 9.289756417274475e-05, 0.00010042637586593628, 0.00010795518755912781, 0.00011548399925231934, 0.00012301281094551086, 0.0001305416226387024, 0.00013807043433189392, 0.00014559924602508545, 0.00015312805771827698, 0.0001606568694114685, 0.00016818568110466003, 0.00017571449279785156]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 15.0, 31.0, 49.0, 64.0, 177.0, 353.0, 921.0, 2841.0, 14686.0, 167288.0, 752761.0, 95496.0, 10169.0, 2275.0, 751.0, 286.0, 151.0, 98.0, 58.0, 18.0, 17.0, 13.0, 6.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23465728759765625, -0.2263946533203125, -0.21813201904296875, -0.209869384765625, -0.20160675048828125, -0.1933441162109375, -0.18508148193359375, -0.17681884765625, -0.16855621337890625, -0.1602935791015625, -0.15203094482421875, -0.143768310546875, -0.13550567626953125, -0.1272430419921875, -0.11898040771484375, -0.1107177734375, -0.10245513916015625, -0.0941925048828125, -0.08592987060546875, -0.077667236328125, -0.06940460205078125, -0.0611419677734375, -0.05287933349609375, -0.04461669921875, -0.03635406494140625, -0.0280914306640625, -0.01982879638671875, -0.011566162109375, -0.00330352783203125, 0.0049591064453125, 0.01322174072265625, 0.021484375, 0.02974700927734375, 0.0380096435546875, 0.04627227783203125, 0.054534912109375, 0.06279754638671875, 0.0710601806640625, 0.07932281494140625, 0.08758544921875, 0.09584808349609375, 0.1041107177734375, 0.11237335205078125, 0.120635986328125, 0.12889862060546875, 0.1371612548828125, 0.14542388916015625, 0.1536865234375, 0.16194915771484375, 0.1702117919921875, 0.17847442626953125, 0.186737060546875, 0.19499969482421875, 0.2032623291015625, 0.21152496337890625, 0.21978759765625, 0.22805023193359375, 0.2363128662109375, 0.24457550048828125, 0.252838134765625, 0.26110076904296875, 0.2693634033203125, 0.27762603759765625, 0.285888671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 14.0, 14.0, 23.0, 33.0, 33.0, 46.0, 71.0, 111.0, 141.0, 163.0, 120.0, 63.0, 54.0, 30.0, 26.0, 13.0, 17.0, 8.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3231315612792969, -0.31154632568359375, -0.2999610900878906, -0.2883758544921875, -0.2767906188964844, -0.26520538330078125, -0.2536201477050781, -0.242034912109375, -0.23044967651367188, -0.21886444091796875, -0.20727920532226562, -0.1956939697265625, -0.18410873413085938, -0.17252349853515625, -0.16093826293945312, -0.14935302734375, -0.13776779174804688, -0.12618255615234375, -0.11459732055664062, -0.1030120849609375, -0.09142684936523438, -0.07984161376953125, -0.06825637817382812, -0.056671142578125, -0.045085906982421875, -0.03350067138671875, -0.021915435791015625, -0.0103302001953125, 0.001255035400390625, 0.01284027099609375, 0.024425506591796875, 0.0360107421875, 0.047595977783203125, 0.05918121337890625, 0.07076644897460938, 0.0823516845703125, 0.09393692016601562, 0.10552215576171875, 0.11710739135742188, 0.128692626953125, 0.14027786254882812, 0.15186309814453125, 0.16344833374023438, 0.1750335693359375, 0.18661880493164062, 0.19820404052734375, 0.20978927612304688, 0.22137451171875, 0.23295974731445312, 0.24454498291015625, 0.2561302185058594, 0.2677154541015625, 0.2793006896972656, 0.29088592529296875, 0.3024711608886719, 0.314056396484375, 0.3256416320800781, 0.33722686767578125, 0.3488121032714844, 0.3603973388671875, 0.3719825744628906, 0.38356781005859375, 0.3951530456542969, 0.40673828125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 7.0, 15.0, 30.0, 45.0, 104.0, 207.0, 253.0, 158.0, 81.0, 46.0, 28.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.850019931793213, -2.675107717514038, -2.500195264816284, -2.3252830505371094, -2.1503705978393555, -1.9754583835601807, -1.8005461692810059, -1.6256338357925415, -1.4507215023040771, -1.2758091688156128, -1.1008968353271484, -0.9259846210479736, -0.7510722875595093, -0.5761599540710449, -0.4012477397918701, -0.22633540630340576, -0.051423072814941406, 0.12348923087120056, 0.29840153455734253, 0.4733138084411621, 0.6482261419296265, 0.8231384754180908, 0.9980506896972656, 1.17296302318573, 1.3478753566741943, 1.5227876901626587, 1.697700023651123, 1.8726122379302979, 2.0475244522094727, 2.2224369049072266, 2.3973491191864014, 2.572261333465576, 2.7471742630004883, 2.922086477279663, 3.096998929977417, 3.271911144256592, 3.4468235969543457, 3.6217358112335205, 3.7966480255126953, 3.971560478210449, 4.146472930908203, 4.321385383605957, 4.496297359466553, 4.671209812164307, 4.8461222648620605, 5.021034240722656, 5.19594669342041, 5.370859146118164, 5.54577112197876, 5.720683574676514, 5.895595550537109, 6.070508003234863, 6.245420455932617, 6.420332908630371, 6.595244884490967, 6.770157337188721, 6.945069313049316, 7.11998176574707, 7.294893741607666, 7.46980619430542, 7.644718647003174, 7.8196306228637695, 7.994543075561523, 8.169455528259277, 8.344367980957031]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 6.0, 6.0, 7.0, 22.0, 15.0, 14.0, 18.0, 20.0, 33.0, 17.0, 39.0, 26.0, 35.0, 35.0, 35.0, 48.0, 35.0, 50.0, 52.0, 43.0, 42.0, 35.0, 42.0, 35.0, 35.0, 32.0, 27.0, 28.0, 30.0, 23.0, 15.0, 15.0, 11.0, 10.0, 8.0, 9.0, 10.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.188874244689941, -5.028903961181641, -4.868933200836182, -4.708962917327881, -4.54899263381958, -4.389021873474121, -4.22905158996582, -4.0690813064575195, -3.9091107845306396, -3.7491402626037598, -3.589169979095459, -3.429199457168579, -3.269228935241699, -3.1092586517333984, -2.9492881298065186, -2.7893176078796387, -2.629347324371338, -2.469376802444458, -2.3094065189361572, -2.1494359970092773, -1.989465594291687, -1.8294951915740967, -1.6695246696472168, -1.5095542669296265, -1.3495838642120361, -1.1896134614944458, -1.0296430587768555, -0.8696725368499756, -0.7097021341323853, -0.5497317314147949, -0.3897612690925598, -0.2297908067703247, -0.06982040405273438, 0.09015002846717834, 0.25012046098709106, 0.4100908935070038, 0.5700613260269165, 0.7300317287445068, 0.8900021910667419, 1.049972653388977, 1.2099430561065674, 1.3699134588241577, 1.529883861541748, 1.689854383468628, 1.8498247861862183, 2.0097951889038086, 2.1697657108306885, 2.3297362327575684, 2.489706516265869, 2.649677038192749, 2.80964732170105, 2.9696178436279297, 3.1295881271362305, 3.2895586490631104, 3.4495291709899902, 3.609499454498291, 3.769469976425171, 3.929440498352051, 4.089410781860352, 4.249381065368652, 4.409351825714111, 4.569322109222412, 4.729292392730713, 4.889263153076172, 5.049233436584473]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 11.0, 8.0, 30.0, 18.0, 36.0, 76.0, 79.0, 138.0, 224.0, 374.0, 635.0, 1038.0, 1754.0, 3468.0, 6708.0, 15074.0, 45428.0, 894545.0, 3139230.0, 53414.0, 16437.0, 6982.0, 3607.0, 1931.0, 1114.0, 696.0, 436.0, 263.0, 160.0, 112.0, 74.0, 64.0, 31.0, 26.0, 20.0, 9.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.76904296875, -0.747100830078125, -0.72515869140625, -0.703216552734375, -0.6812744140625, -0.659332275390625, -0.63739013671875, -0.615447998046875, -0.593505859375, -0.571563720703125, -0.54962158203125, -0.527679443359375, -0.5057373046875, -0.483795166015625, -0.46185302734375, -0.439910888671875, -0.41796875, -0.396026611328125, -0.37408447265625, -0.352142333984375, -0.3302001953125, -0.308258056640625, -0.28631591796875, -0.264373779296875, -0.242431640625, -0.220489501953125, -0.19854736328125, -0.176605224609375, -0.1546630859375, -0.132720947265625, -0.11077880859375, -0.088836669921875, -0.06689453125, -0.044952392578125, -0.02301025390625, -0.001068115234375, 0.0208740234375, 0.042816162109375, 0.06475830078125, 0.086700439453125, 0.108642578125, 0.130584716796875, 0.15252685546875, 0.174468994140625, 0.1964111328125, 0.218353271484375, 0.24029541015625, 0.262237548828125, 0.2841796875, 0.306121826171875, 0.32806396484375, 0.350006103515625, 0.3719482421875, 0.393890380859375, 0.41583251953125, 0.437774658203125, 0.459716796875, 0.481658935546875, 0.50360107421875, 0.525543212890625, 0.5474853515625, 0.569427490234375, 0.59136962890625, 0.613311767578125, 0.63525390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 7.0, 5.0, 8.0, 13.0, 13.0, 20.0, 33.0, 19.0, 26.0, 40.0, 40.0, 42.0, 43.0, 42.0, 56.0, 75.0, 50.0, 68.0, 50.0, 48.0, 50.0, 59.0, 39.0, 30.0, 27.0, 24.0, 24.0, 17.0, 7.0, 10.0, 8.0, 9.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3213844299316406, -0.31147003173828125, -0.3015556335449219, -0.2916412353515625, -0.2817268371582031, -0.27181243896484375, -0.2618980407714844, -0.251983642578125, -0.24206924438476562, -0.23215484619140625, -0.22224044799804688, -0.2123260498046875, -0.20241165161132812, -0.19249725341796875, -0.18258285522460938, -0.17266845703125, -0.16275405883789062, -0.15283966064453125, -0.14292526245117188, -0.1330108642578125, -0.12309646606445312, -0.11318206787109375, -0.10326766967773438, -0.093353271484375, -0.08343887329101562, -0.07352447509765625, -0.06361007690429688, -0.0536956787109375, -0.043781280517578125, -0.03386688232421875, -0.023952484130859375, -0.0140380859375, -0.004123687744140625, 0.00579071044921875, 0.015705108642578125, 0.0256195068359375, 0.035533905029296875, 0.04544830322265625, 0.055362701416015625, 0.065277099609375, 0.07519149780273438, 0.08510589599609375, 0.09502029418945312, 0.1049346923828125, 0.11484909057617188, 0.12476348876953125, 0.13467788696289062, 0.14459228515625, 0.15450668334960938, 0.16442108154296875, 0.17433547973632812, 0.1842498779296875, 0.19416427612304688, 0.20407867431640625, 0.21399307250976562, 0.223907470703125, 0.23382186889648438, 0.24373626708984375, 0.2536506652832031, 0.2635650634765625, 0.2734794616699219, 0.28339385986328125, 0.2933082580566406, 0.30322265625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 10.0, 13.0, 29.0, 21.0, 47.0, 73.0, 141.0, 199.0, 303.0, 577.0, 1076.0, 2265.0, 5720.0, 17917.0, 91421.0, 3893109.0, 146005.0, 22806.0, 7076.0, 2721.0, 1142.0, 573.0, 411.0, 202.0, 151.0, 103.0, 52.0, 45.0, 22.0, 17.0, 9.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.5988998413085938, -0.5771942138671875, -0.5554885864257812, -0.533782958984375, -0.5120773315429688, -0.4903717041015625, -0.46866607666015625, -0.44696044921875, -0.42525482177734375, -0.4035491943359375, -0.38184356689453125, -0.360137939453125, -0.33843231201171875, -0.3167266845703125, -0.29502105712890625, -0.2733154296875, -0.25160980224609375, -0.2299041748046875, -0.20819854736328125, -0.186492919921875, -0.16478729248046875, -0.1430816650390625, -0.12137603759765625, -0.09967041015625, -0.07796478271484375, -0.0562591552734375, -0.03455352783203125, -0.012847900390625, 0.00885772705078125, 0.0305633544921875, 0.05226898193359375, 0.073974609375, 0.09568023681640625, 0.1173858642578125, 0.13909149169921875, 0.160797119140625, 0.18250274658203125, 0.2042083740234375, 0.22591400146484375, 0.24761962890625, 0.26932525634765625, 0.2910308837890625, 0.31273651123046875, 0.334442138671875, 0.35614776611328125, 0.3778533935546875, 0.39955902099609375, 0.4212646484375, 0.44297027587890625, 0.4646759033203125, 0.48638153076171875, 0.508087158203125, 0.5297927856445312, 0.5514984130859375, 0.5732040405273438, 0.59490966796875, 0.6166152954101562, 0.6383209228515625, 0.6600265502929688, 0.681732177734375, 0.7034378051757812, 0.7251434326171875, 0.7468490600585938, 0.7685546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 3.0, 13.0, 16.0, 13.0, 23.0, 40.0, 89.0, 252.0, 3112.0, 279.0, 82.0, 51.0, 24.0, 21.0, 14.0, 3.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7666015625, -0.7461700439453125, -0.725738525390625, -0.7053070068359375, -0.68487548828125, -0.6644439697265625, -0.644012451171875, -0.6235809326171875, -0.6031494140625, -0.5827178955078125, -0.562286376953125, -0.5418548583984375, -0.52142333984375, -0.5009918212890625, -0.480560302734375, -0.4601287841796875, -0.439697265625, -0.4192657470703125, -0.398834228515625, -0.3784027099609375, -0.35797119140625, -0.3375396728515625, -0.317108154296875, -0.2966766357421875, -0.2762451171875, -0.2558135986328125, -0.235382080078125, -0.2149505615234375, -0.19451904296875, -0.1740875244140625, -0.153656005859375, -0.1332244873046875, -0.11279296875, -0.0923614501953125, -0.071929931640625, -0.0514984130859375, -0.03106689453125, -0.0106353759765625, 0.009796142578125, 0.0302276611328125, 0.0506591796875, 0.0710906982421875, 0.091522216796875, 0.1119537353515625, 0.13238525390625, 0.1528167724609375, 0.173248291015625, 0.1936798095703125, 0.214111328125, 0.2345428466796875, 0.254974365234375, 0.2754058837890625, 0.29583740234375, 0.3162689208984375, 0.336700439453125, 0.3571319580078125, 0.3775634765625, 0.3979949951171875, 0.418426513671875, 0.4388580322265625, 0.45928955078125, 0.4797210693359375, 0.500152587890625, 0.5205841064453125, 0.541015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 8.0, 28.0, 99.0, 326.0, 377.0, 99.0, 30.0, 13.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.024125099182129, -4.915098190307617, -4.806070804595947, -4.6970438957214355, -4.588016986846924, -4.478989601135254, -4.369962692260742, -4.2609357833862305, -4.1519083976745605, -4.042881488800049, -3.933854341506958, -3.824827194213867, -3.7158000469207764, -3.6067728996276855, -3.497745990753174, -3.388718843460083, -3.2796919345855713, -3.1706647872924805, -3.0616378784179688, -2.952610731124878, -2.843583583831787, -2.7345566749572754, -2.6255295276641846, -2.5165023803710938, -2.407475471496582, -2.298448324203491, -2.1894214153289795, -2.0803942680358887, -1.9713671207427979, -1.8623400926589966, -1.7533130645751953, -1.6442859172821045, -1.5352587699890137, -1.4262317419052124, -1.3172045946121216, -1.2081775665283203, -1.0991504192352295, -0.9901233911514282, -0.881096363067627, -0.7720692753791809, -0.6630421876907349, -0.5540151000022888, -0.44498804211616516, -0.3359609842300415, -0.22693389654159546, -0.11790680885314941, -0.008879780769348145, 0.1001473069190979, 0.20917439460754395, 0.31820148229599, 0.42722854018211365, 0.5362555980682373, 0.6452826857566833, 0.7543097734451294, 0.8633368015289307, 0.9723638892173767, 1.0813909769058228, 1.190418004989624, 1.2994451522827148, 1.4084721803665161, 1.5174992084503174, 1.6265263557434082, 1.7355533838272095, 1.8445804119110107, 1.9536075592041016]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 10.0, 14.0, 11.0, 14.0, 23.0, 34.0, 32.0, 30.0, 42.0, 37.0, 33.0, 41.0, 52.0, 51.0, 49.0, 62.0, 52.0, 64.0, 45.0, 42.0, 28.0, 51.0, 35.0, 30.0, 33.0, 24.0, 15.0, 9.0, 4.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.594771146774292, -1.5484250783920288, -1.5020790100097656, -1.4557329416275024, -1.4093868732452393, -1.3630409240722656, -1.3166948556900024, -1.2703487873077393, -1.224002718925476, -1.177656650543213, -1.1313105821609497, -1.0849645137786865, -1.038618564605713, -0.9922724366188049, -0.9459264278411865, -0.8995803594589233, -0.8532342910766602, -0.806888222694397, -0.7605421543121338, -0.7141961455345154, -0.6678500771522522, -0.621504008769989, -0.5751579999923706, -0.5288119316101074, -0.48246586322784424, -0.43611979484558105, -0.38977375626564026, -0.34342771768569946, -0.2970816493034363, -0.2507355809211731, -0.2043895423412323, -0.1580435037612915, -0.11169755458831787, -0.06535150110721588, -0.01900544762611389, 0.027340605854988098, 0.07368665933609009, 0.12003271281719208, 0.16637876629829407, 0.21272480487823486, 0.25907087326049805, 0.30541694164276123, 0.351762980222702, 0.3981090188026428, 0.444455087184906, 0.4908011555671692, 0.5371471643447876, 0.5834932327270508, 0.629839301109314, 0.6761853694915771, 0.7225314378738403, 0.7688774466514587, 0.8152235150337219, 0.8615695834159851, 0.9079155921936035, 0.9542616605758667, 1.0006077289581299, 1.046953797340393, 1.0932998657226562, 1.1396459341049194, 1.1859920024871826, 1.2323379516601562, 1.2786840200424194, 1.3250300884246826, 1.3713761568069458]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 10.0, 12.0, 13.0, 20.0, 37.0, 35.0, 76.0, 133.0, 253.0, 492.0, 1141.0, 3343.0, 12559.0, 63615.0, 489989.0, 408390.0, 52770.0, 10564.0, 2966.0, 1106.0, 506.0, 198.0, 130.0, 85.0, 38.0, 19.0, 19.0, 11.0, 10.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8828125, -0.8575515747070312, -0.8322906494140625, -0.8070297241210938, -0.781768798828125, -0.7565078735351562, -0.7312469482421875, -0.7059860229492188, -0.68072509765625, -0.6554641723632812, -0.6302032470703125, -0.6049423217773438, -0.579681396484375, -0.5544204711914062, -0.5291595458984375, -0.5038986206054688, -0.4786376953125, -0.45337677001953125, -0.4281158447265625, -0.40285491943359375, -0.377593994140625, -0.35233306884765625, -0.3270721435546875, -0.30181121826171875, -0.27655029296875, -0.25128936767578125, -0.2260284423828125, -0.20076751708984375, -0.175506591796875, -0.15024566650390625, -0.1249847412109375, -0.09972381591796875, -0.074462890625, -0.04920196533203125, -0.0239410400390625, 0.00131988525390625, 0.026580810546875, 0.05184173583984375, 0.0771026611328125, 0.10236358642578125, 0.12762451171875, 0.15288543701171875, 0.1781463623046875, 0.20340728759765625, 0.228668212890625, 0.25392913818359375, 0.2791900634765625, 0.30445098876953125, 0.3297119140625, 0.35497283935546875, 0.3802337646484375, 0.40549468994140625, 0.430755615234375, 0.45601654052734375, 0.4812774658203125, 0.5065383911132812, 0.53179931640625, 0.5570602416992188, 0.5823211669921875, 0.6075820922851562, 0.632843017578125, 0.6581039428710938, 0.6833648681640625, 0.7086257934570312, 0.73388671875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 9.0, 9.0, 13.0, 21.0, 25.0, 25.0, 28.0, 31.0, 32.0, 34.0, 38.0, 41.0, 48.0, 69.0, 57.0, 54.0, 65.0, 58.0, 45.0, 45.0, 46.0, 36.0, 38.0, 26.0, 24.0, 19.0, 13.0, 9.0, 13.0, 9.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3212890625, -0.31159210205078125, -0.3018951416015625, -0.29219818115234375, -0.282501220703125, -0.27280426025390625, -0.2631072998046875, -0.25341033935546875, -0.24371337890625, -0.23401641845703125, -0.2243194580078125, -0.21462249755859375, -0.204925537109375, -0.19522857666015625, -0.1855316162109375, -0.17583465576171875, -0.1661376953125, -0.15644073486328125, -0.1467437744140625, -0.13704681396484375, -0.127349853515625, -0.11765289306640625, -0.1079559326171875, -0.09825897216796875, -0.08856201171875, -0.07886505126953125, -0.0691680908203125, -0.05947113037109375, -0.049774169921875, -0.04007720947265625, -0.0303802490234375, -0.02068328857421875, -0.010986328125, -0.00128936767578125, 0.0084075927734375, 0.01810455322265625, 0.027801513671875, 0.03749847412109375, 0.0471954345703125, 0.05689239501953125, 0.06658935546875, 0.07628631591796875, 0.0859832763671875, 0.09568023681640625, 0.105377197265625, 0.11507415771484375, 0.1247711181640625, 0.13446807861328125, 0.1441650390625, 0.15386199951171875, 0.1635589599609375, 0.17325592041015625, 0.182952880859375, 0.19264984130859375, 0.2023468017578125, 0.21204376220703125, 0.22174072265625, 0.23143768310546875, 0.2411346435546875, 0.25083160400390625, 0.260528564453125, 0.27022552490234375, 0.2799224853515625, 0.28961944580078125, 0.29931640625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 13.0, 13.0, 20.0, 42.0, 55.0, 79.0, 156.0, 256.0, 583.0, 1846.0, 8116.0, 66339.0, 832481.0, 122555.0, 12040.0, 2520.0, 740.0, 296.0, 167.0, 83.0, 45.0, 30.0, 26.0, 10.0, 13.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95361328125, -0.9163742065429688, -0.8791351318359375, -0.8418960571289062, -0.804656982421875, -0.7674179077148438, -0.7301788330078125, -0.6929397583007812, -0.65570068359375, -0.6184616088867188, -0.5812225341796875, -0.5439834594726562, -0.506744384765625, -0.46950531005859375, -0.4322662353515625, -0.39502716064453125, -0.3577880859375, -0.32054901123046875, -0.2833099365234375, -0.24607086181640625, -0.208831787109375, -0.17159271240234375, -0.1343536376953125, -0.09711456298828125, -0.05987548828125, -0.02263641357421875, 0.0146026611328125, 0.05184173583984375, 0.089080810546875, 0.12631988525390625, 0.1635589599609375, 0.20079803466796875, 0.238037109375, 0.27527618408203125, 0.3125152587890625, 0.34975433349609375, 0.386993408203125, 0.42423248291015625, 0.4614715576171875, 0.49871063232421875, 0.53594970703125, 0.5731887817382812, 0.6104278564453125, 0.6476669311523438, 0.684906005859375, 0.7221450805664062, 0.7593841552734375, 0.7966232299804688, 0.8338623046875, 0.8711013793945312, 0.9083404541015625, 0.9455795288085938, 0.982818603515625, 1.0200576782226562, 1.0572967529296875, 1.0945358276367188, 1.13177490234375, 1.1690139770507812, 1.2062530517578125, 1.2434921264648438, 1.280731201171875, 1.3179702758789062, 1.3552093505859375, 1.3924484252929688, 1.4296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 14.0, 10.0, 6.0, 17.0, 19.0, 19.0, 28.0, 31.0, 31.0, 49.0, 48.0, 55.0, 65.0, 67.0, 61.0, 66.0, 64.0, 59.0, 45.0, 40.0, 32.0, 42.0, 33.0, 13.0, 21.0, 9.0, 9.0, 8.0, 2.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.701629638671875, -1.64739990234375, -1.593170166015625, -1.5389404296875, -1.484710693359375, -1.43048095703125, -1.376251220703125, -1.322021484375, -1.267791748046875, -1.21356201171875, -1.159332275390625, -1.1051025390625, -1.050872802734375, -0.99664306640625, -0.942413330078125, -0.88818359375, -0.833953857421875, -0.77972412109375, -0.725494384765625, -0.6712646484375, -0.617034912109375, -0.56280517578125, -0.508575439453125, -0.454345703125, -0.400115966796875, -0.34588623046875, -0.291656494140625, -0.2374267578125, -0.183197021484375, -0.12896728515625, -0.074737548828125, -0.0205078125, 0.033721923828125, 0.08795166015625, 0.142181396484375, 0.1964111328125, 0.250640869140625, 0.30487060546875, 0.359100341796875, 0.413330078125, 0.467559814453125, 0.52178955078125, 0.576019287109375, 0.6302490234375, 0.684478759765625, 0.73870849609375, 0.792938232421875, 0.84716796875, 0.901397705078125, 0.95562744140625, 1.009857177734375, 1.0640869140625, 1.118316650390625, 1.17254638671875, 1.226776123046875, 1.281005859375, 1.335235595703125, 1.38946533203125, 1.443695068359375, 1.4979248046875, 1.552154541015625, 1.60638427734375, 1.660614013671875, 1.71484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 5.0, 2.0, 13.0, 23.0, 31.0, 56.0, 110.0, 241.0, 648.0, 2434.0, 24535.0, 943782.0, 71033.0, 4093.0, 886.0, 352.0, 130.0, 67.0, 27.0, 29.0, 10.0, 9.0, 9.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.64794921875, -0.627471923828125, -0.60699462890625, -0.586517333984375, -0.5660400390625, -0.545562744140625, -0.52508544921875, -0.504608154296875, -0.484130859375, -0.463653564453125, -0.44317626953125, -0.422698974609375, -0.4022216796875, -0.381744384765625, -0.36126708984375, -0.340789794921875, -0.3203125, -0.299835205078125, -0.27935791015625, -0.258880615234375, -0.2384033203125, -0.217926025390625, -0.19744873046875, -0.176971435546875, -0.156494140625, -0.136016845703125, -0.11553955078125, -0.095062255859375, -0.0745849609375, -0.054107666015625, -0.03363037109375, -0.013153076171875, 0.00732421875, 0.027801513671875, 0.04827880859375, 0.068756103515625, 0.0892333984375, 0.109710693359375, 0.13018798828125, 0.150665283203125, 0.171142578125, 0.191619873046875, 0.21209716796875, 0.232574462890625, 0.2530517578125, 0.273529052734375, 0.29400634765625, 0.314483642578125, 0.3349609375, 0.355438232421875, 0.37591552734375, 0.396392822265625, 0.4168701171875, 0.437347412109375, 0.45782470703125, 0.478302001953125, 0.498779296875, 0.519256591796875, 0.53973388671875, 0.560211181640625, 0.5806884765625, 0.601165771484375, 0.62164306640625, 0.642120361328125, 0.66259765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 15.0, 16.0, 35.0, 35.0, 52.0, 95.0, 155.0, 210.0, 147.0, 61.0, 49.0, 29.0, 21.0, 22.0, 10.0, 14.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023508071899414062, -0.00022409111261367798, -0.00021310150623321533, -0.00020211189985275269, -0.00019112229347229004, -0.0001801326870918274, -0.00016914308071136475, -0.0001581534743309021, -0.00014716386795043945, -0.0001361742615699768, -0.00012518465518951416, -0.00011419504880905151, -0.00010320544242858887, -9.221583604812622e-05, -8.122622966766357e-05, -7.023662328720093e-05, -5.924701690673828e-05, -4.8257410526275635e-05, -3.726780414581299e-05, -2.6278197765350342e-05, -1.5288591384887695e-05, -4.298985004425049e-06, 6.690621376037598e-06, 1.7680227756500244e-05, 2.866983413696289e-05, 3.965944051742554e-05, 5.0649046897888184e-05, 6.163865327835083e-05, 7.262825965881348e-05, 8.361786603927612e-05, 9.460747241973877e-05, 0.00010559707880020142, 0.00011658668518066406, 0.0001275762915611267, 0.00013856589794158936, 0.000149555504322052, 0.00016054511070251465, 0.0001715347170829773, 0.00018252432346343994, 0.0001935139298439026, 0.00020450353622436523, 0.00021549314260482788, 0.00022648274898529053, 0.00023747235536575317, 0.0002484619617462158, 0.00025945156812667847, 0.0002704411745071411, 0.00028143078088760376, 0.0002924203872680664, 0.00030340999364852905, 0.0003143996000289917, 0.00032538920640945435, 0.000336378812789917, 0.00034736841917037964, 0.0003583580255508423, 0.00036934763193130493, 0.0003803372383117676, 0.0003913268446922302, 0.00040231645107269287, 0.0004133060574531555, 0.00042429566383361816, 0.0004352852702140808, 0.00044627487659454346, 0.0004572644829750061, 0.00046825408935546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 15.0, 22.0, 27.0, 62.0, 137.0, 242.0, 588.0, 2662.0, 44016.0, 963124.0, 34224.0, 2360.0, 606.0, 222.0, 103.0, 54.0, 39.0, 22.0, 7.0, 8.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6884765625, -0.6685028076171875, -0.648529052734375, -0.6285552978515625, -0.60858154296875, -0.5886077880859375, -0.568634033203125, -0.5486602783203125, -0.5286865234375, -0.5087127685546875, -0.488739013671875, -0.4687652587890625, -0.44879150390625, -0.4288177490234375, -0.408843994140625, -0.3888702392578125, -0.368896484375, -0.3489227294921875, -0.328948974609375, -0.3089752197265625, -0.28900146484375, -0.2690277099609375, -0.249053955078125, -0.2290802001953125, -0.2091064453125, -0.1891326904296875, -0.169158935546875, -0.1491851806640625, -0.12921142578125, -0.1092376708984375, -0.089263916015625, -0.0692901611328125, -0.04931640625, -0.0293426513671875, -0.009368896484375, 0.0106048583984375, 0.03057861328125, 0.0505523681640625, 0.070526123046875, 0.0904998779296875, 0.1104736328125, 0.1304473876953125, 0.150421142578125, 0.1703948974609375, 0.19036865234375, 0.2103424072265625, 0.230316162109375, 0.2502899169921875, 0.270263671875, 0.2902374267578125, 0.310211181640625, 0.3301849365234375, 0.35015869140625, 0.3701324462890625, 0.390106201171875, 0.4100799560546875, 0.4300537109375, 0.4500274658203125, 0.470001220703125, 0.4899749755859375, 0.50994873046875, 0.5299224853515625, 0.549896240234375, 0.5698699951171875, 0.58984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 30.0, 33.0, 83.0, 173.0, 285.0, 190.0, 84.0, 47.0, 28.0, 11.0, 12.0, 9.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.119140625, -1.0877151489257812, -1.0562896728515625, -1.0248641967773438, -0.993438720703125, -0.9620132446289062, -0.9305877685546875, -0.8991622924804688, -0.86773681640625, -0.8363113403320312, -0.8048858642578125, -0.7734603881835938, -0.742034912109375, -0.7106094360351562, -0.6791839599609375, -0.6477584838867188, -0.6163330078125, -0.5849075317382812, -0.5534820556640625, -0.5220565795898438, -0.490631103515625, -0.45920562744140625, -0.4277801513671875, -0.39635467529296875, -0.36492919921875, -0.33350372314453125, -0.3020782470703125, -0.27065277099609375, -0.239227294921875, -0.20780181884765625, -0.1763763427734375, -0.14495086669921875, -0.113525390625, -0.08209991455078125, -0.0506744384765625, -0.01924896240234375, 0.012176513671875, 0.04360198974609375, 0.0750274658203125, 0.10645294189453125, 0.13787841796875, 0.16930389404296875, 0.2007293701171875, 0.23215484619140625, 0.263580322265625, 0.29500579833984375, 0.3264312744140625, 0.35785675048828125, 0.3892822265625, 0.42070770263671875, 0.4521331787109375, 0.48355865478515625, 0.514984130859375, 0.5464096069335938, 0.5778350830078125, 0.6092605590820312, 0.64068603515625, 0.6721115112304688, 0.7035369873046875, 0.7349624633789062, 0.766387939453125, 0.7978134155273438, 0.8292388916015625, 0.8606643676757812, 0.89208984375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 0.0, 4.0, 3.0, 10.0, 16.0, 24.0, 49.0, 129.0, 235.0, 280.0, 139.0, 74.0, 24.0, 12.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0], "bins": [-15.32483959197998, -15.036296844482422, -14.747754096984863, -14.459211349487305, -14.170668601989746, -13.882125854492188, -13.593583106994629, -13.30504035949707, -13.016497611999512, -12.727954864501953, -12.439412117004395, -12.150869369506836, -11.862326622009277, -11.573783874511719, -11.28524112701416, -10.996698379516602, -10.708154678344727, -10.419611930847168, -10.13106918334961, -9.84252643585205, -9.553983688354492, -9.265440940856934, -8.976898193359375, -8.688355445861816, -8.399812698364258, -8.1112699508667, -7.822727203369141, -7.534184455871582, -7.245641708374023, -6.957098960876465, -6.668556213378906, -6.380013465881348, -6.091469764709473, -5.802927017211914, -5.5143842697143555, -5.225841522216797, -4.937298774719238, -4.64875602722168, -4.360213279724121, -4.0716705322265625, -3.783127784729004, -3.4945850372314453, -3.2060422897338867, -2.917499542236328, -2.6289567947387695, -2.340414047241211, -2.0518710613250732, -1.7633283138275146, -1.474785566329956, -1.1862428188323975, -0.8977000117301941, -0.6091572046279907, -0.32061445713043213, -0.032071709632873535, 0.2564711570739746, 0.5450139045715332, 0.8335566520690918, 1.1220993995666504, 1.410642147064209, 1.6991850137710571, 1.9877277612686157, 2.2762703895568848, 2.5648133754730225, 2.853356122970581, 3.1418988704681396]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 6.0, 10.0, 14.0, 15.0, 18.0, 29.0, 24.0, 36.0, 37.0, 44.0, 56.0, 47.0, 71.0, 55.0, 51.0, 56.0, 53.0, 54.0, 31.0, 40.0, 32.0, 33.0, 28.0, 27.0, 27.0, 22.0, 8.0, 10.0, 15.0, 9.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.401443481445312, -8.115632057189941, -7.829820156097412, -7.544008731842041, -7.258196830749512, -6.972385406494141, -6.6865739822387695, -6.400762557983398, -6.114950656890869, -5.829139232635498, -5.543327331542969, -5.257515907287598, -4.971704483032227, -4.685892581939697, -4.400081157684326, -4.114269256591797, -3.828457832336426, -3.5426461696624756, -3.2568345069885254, -2.9710230827331543, -2.685211420059204, -2.399399757385254, -2.113588333129883, -1.8277766704559326, -1.5419650077819824, -1.2561533451080322, -0.9703418016433716, -0.6845301985740662, -0.39871859550476074, -0.11290693283081055, 0.1729046106338501, 0.45871615409851074, 0.7445278167724609, 1.0303394794464111, 1.3161510229110718, 1.6019625663757324, 1.8877742290496826, 2.173585891723633, 2.459397315979004, 2.745208978652954, 3.0310206413269043, 3.3168323040008545, 3.6026439666748047, 3.888455390930176, 4.174266815185547, 4.460078716278076, 4.745890140533447, 5.031702041625977, 5.317513465881348, 5.603324890136719, 5.889136791229248, 6.174948215484619, 6.460760116577148, 6.7465715408325195, 7.032382965087891, 7.318194389343262, 7.604006290435791, 7.889817714691162, 8.175629615783691, 8.461441040039062, 8.747252464294434, 9.033063888549805, 9.318876266479492, 9.604687690734863, 9.890499114990234]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 5.0, 5.0, 10.0, 10.0, 19.0, 38.0, 71.0, 171.0, 308.0, 719.0, 2057.0, 10999.0, 4026860.0, 144246.0, 6190.0, 1494.0, 614.0, 217.0, 107.0, 67.0, 23.0, 19.0, 13.0, 5.0, 2.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.330078125, -1.2975234985351562, -1.2649688720703125, -1.2324142456054688, -1.199859619140625, -1.1673049926757812, -1.1347503662109375, -1.1021957397460938, -1.06964111328125, -1.0370864868164062, -1.0045318603515625, -0.9719772338867188, -0.939422607421875, -0.9068679809570312, -0.8743133544921875, -0.8417587280273438, -0.8092041015625, -0.7766494750976562, -0.7440948486328125, -0.7115402221679688, -0.678985595703125, -0.6464309692382812, -0.6138763427734375, -0.5813217163085938, -0.54876708984375, -0.5162124633789062, -0.4836578369140625, -0.45110321044921875, -0.418548583984375, -0.38599395751953125, -0.3534393310546875, -0.32088470458984375, -0.288330078125, -0.25577545166015625, -0.2232208251953125, -0.19066619873046875, -0.158111572265625, -0.12555694580078125, -0.0930023193359375, -0.06044769287109375, -0.02789306640625, 0.00466156005859375, 0.0372161865234375, 0.06977081298828125, 0.102325439453125, 0.13488006591796875, 0.1674346923828125, 0.19998931884765625, 0.2325439453125, 0.26509857177734375, 0.2976531982421875, 0.33020782470703125, 0.362762451171875, 0.39531707763671875, 0.4278717041015625, 0.46042633056640625, 0.49298095703125, 0.5255355834960938, 0.5580902099609375, 0.5906448364257812, 0.623199462890625, 0.6557540893554688, 0.6883087158203125, 0.7208633422851562, 0.75341796875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 12.0, 13.0, 14.0, 16.0, 30.0, 23.0, 16.0, 30.0, 37.0, 44.0, 43.0, 32.0, 47.0, 43.0, 53.0, 50.0, 50.0, 51.0, 44.0, 35.0, 50.0, 47.0, 32.0, 32.0, 24.0, 16.0, 14.0, 17.0, 21.0, 13.0, 10.0, 9.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.4169921875, -0.40517425537109375, -0.3933563232421875, -0.38153839111328125, -0.369720458984375, -0.35790252685546875, -0.3460845947265625, -0.33426666259765625, -0.32244873046875, -0.31063079833984375, -0.2988128662109375, -0.28699493408203125, -0.275177001953125, -0.26335906982421875, -0.2515411376953125, -0.23972320556640625, -0.2279052734375, -0.21608734130859375, -0.2042694091796875, -0.19245147705078125, -0.180633544921875, -0.16881561279296875, -0.1569976806640625, -0.14517974853515625, -0.13336181640625, -0.12154388427734375, -0.1097259521484375, -0.09790802001953125, -0.086090087890625, -0.07427215576171875, -0.0624542236328125, -0.05063629150390625, -0.038818359375, -0.02700042724609375, -0.0151824951171875, -0.00336456298828125, 0.008453369140625, 0.02027130126953125, 0.0320892333984375, 0.04390716552734375, 0.05572509765625, 0.06754302978515625, 0.0793609619140625, 0.09117889404296875, 0.102996826171875, 0.11481475830078125, 0.1266326904296875, 0.13845062255859375, 0.1502685546875, 0.16208648681640625, 0.1739044189453125, 0.18572235107421875, 0.197540283203125, 0.20935821533203125, 0.2211761474609375, 0.23299407958984375, 0.24481201171875, 0.25662994384765625, 0.2684478759765625, 0.28026580810546875, 0.292083740234375, 0.30390167236328125, 0.3157196044921875, 0.32753753662109375, 0.33935546875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 6.0, 13.0, 27.0, 43.0, 58.0, 80.0, 162.0, 296.0, 605.0, 1245.0, 3239.0, 14035.0, 3992501.0, 169087.0, 8320.0, 2417.0, 1005.0, 500.0, 267.0, 166.0, 69.0, 37.0, 50.0, 19.0, 11.0, 9.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.181640625, -1.1540756225585938, -1.1265106201171875, -1.0989456176757812, -1.071380615234375, -1.0438156127929688, -1.0162506103515625, -0.9886856079101562, -0.96112060546875, -0.9335556030273438, -0.9059906005859375, -0.8784255981445312, -0.850860595703125, -0.8232955932617188, -0.7957305908203125, -0.7681655883789062, -0.7406005859375, -0.7130355834960938, -0.6854705810546875, -0.6579055786132812, -0.630340576171875, -0.6027755737304688, -0.5752105712890625, -0.5476455688476562, -0.52008056640625, -0.49251556396484375, -0.4649505615234375, -0.43738555908203125, -0.409820556640625, -0.38225555419921875, -0.3546905517578125, -0.32712554931640625, -0.299560546875, -0.27199554443359375, -0.2444305419921875, -0.21686553955078125, -0.189300537109375, -0.16173553466796875, -0.1341705322265625, -0.10660552978515625, -0.07904052734375, -0.05147552490234375, -0.0239105224609375, 0.00365447998046875, 0.031219482421875, 0.05878448486328125, 0.0863494873046875, 0.11391448974609375, 0.1414794921875, 0.16904449462890625, 0.1966094970703125, 0.22417449951171875, 0.251739501953125, 0.27930450439453125, 0.3068695068359375, 0.33443450927734375, 0.36199951171875, 0.38956451416015625, 0.4171295166015625, 0.44469451904296875, 0.472259521484375, 0.49982452392578125, 0.5273895263671875, 0.5549545288085938, 0.58251953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 6.0, 8.0, 8.0, 35.0, 56.0, 393.0, 3461.0, 60.0, 24.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331787109375, -0.3235187530517578, -0.3152503967285156, -0.30698204040527344, -0.29871368408203125, -0.29044532775878906, -0.2821769714355469, -0.2739086151123047, -0.2656402587890625, -0.2573719024658203, -0.24910354614257812, -0.24083518981933594, -0.23256683349609375, -0.22429847717285156, -0.21603012084960938, -0.2077617645263672, -0.199493408203125, -0.1912250518798828, -0.18295669555664062, -0.17468833923339844, -0.16641998291015625, -0.15815162658691406, -0.14988327026367188, -0.1416149139404297, -0.1333465576171875, -0.1250782012939453, -0.11680984497070312, -0.10854148864746094, -0.10027313232421875, -0.09200477600097656, -0.08373641967773438, -0.07546806335449219, -0.06719970703125, -0.05893135070800781, -0.050662994384765625, -0.04239463806152344, -0.03412628173828125, -0.025857925415039062, -0.017589569091796875, -0.009321212768554688, -0.0010528564453125, 0.0072154998779296875, 0.015483856201171875, 0.023752212524414062, 0.03202056884765625, 0.04028892517089844, 0.048557281494140625, 0.05682563781738281, 0.065093994140625, 0.07336235046386719, 0.08163070678710938, 0.08989906311035156, 0.09816741943359375, 0.10643577575683594, 0.11470413208007812, 0.12297248840332031, 0.1312408447265625, 0.1395092010498047, 0.14777755737304688, 0.15604591369628906, 0.16431427001953125, 0.17258262634277344, 0.18085098266601562, 0.1891193389892578, 0.1973876953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 12.0, 34.0, 109.0, 496.0, 320.0, 34.0, 6.0, 2.0, 1.0, 2.0], "bins": [-3.0160655975341797, -2.964134931564331, -2.9122045040130615, -2.860273838043213, -2.8083434104919434, -2.7564127445220947, -2.704482316970825, -2.6525516510009766, -2.600621223449707, -2.5486905574798584, -2.496760129928589, -2.4448294639587402, -2.3928990364074707, -2.340968370437622, -2.2890379428863525, -2.237107276916504, -2.1851768493652344, -2.1332461833953857, -2.081315755844116, -2.0293850898742676, -1.977454662322998, -1.925524115562439, -1.8735935688018799, -1.8216630220413208, -1.7697323560714722, -1.717801809310913, -1.665871262550354, -1.613940715789795, -1.5620101690292358, -1.5100796222686768, -1.4581490755081177, -1.4062185287475586, -1.3542879819869995, -1.3023574352264404, -1.2504268884658813, -1.1984963417053223, -1.1465657949447632, -1.094635248184204, -1.042704701423645, -0.9907741546630859, -0.9388436079025269, -0.8869130611419678, -0.8349825143814087, -0.7830519676208496, -0.7311214208602905, -0.6791908740997314, -0.6272603273391724, -0.5753297805786133, -0.5233991742134094, -0.47146862745285034, -0.41953808069229126, -0.3676075339317322, -0.3156769871711731, -0.2637464106082916, -0.21181586384773254, -0.15988531708717346, -0.10795477032661438, -0.056024219840765, -0.004093669354915619, 0.04783688485622406, 0.09976743161678314, 0.15169799327850342, 0.2036285400390625, 0.2555590867996216, 0.30748963356018066]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 8.0, 9.0, 9.0, 8.0, 19.0, 13.0, 14.0, 27.0, 24.0, 29.0, 26.0, 20.0, 38.0, 45.0, 47.0, 34.0, 39.0, 46.0, 45.0, 48.0, 38.0, 33.0, 43.0, 18.0, 42.0, 34.0, 28.0, 25.0, 22.0, 19.0, 26.0, 28.0, 18.0, 16.0, 12.0, 9.0, 13.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32217538356781006, -0.30978909134864807, -0.2974027991294861, -0.2850165367126465, -0.2726302444934845, -0.2602439522743225, -0.24785766005516052, -0.23547138273715973, -0.22308510541915894, -0.21069881319999695, -0.19831253588199615, -0.18592624366283417, -0.17353996634483337, -0.1611536741256714, -0.1487673819065094, -0.1363811045885086, -0.12399481236934662, -0.11160852760076523, -0.09922224283218384, -0.08683595061302185, -0.07444967329502106, -0.06206338480114937, -0.04967709630727768, -0.03729081153869629, -0.0249045267701149, -0.012518241070210934, -0.0001319553703069687, 0.012254331260919571, 0.02464061602950096, 0.03702690079808235, 0.04941318929195404, 0.06179947406053543, 0.07418575882911682, 0.08657204359769821, 0.0989583283662796, 0.11134462058544159, 0.12373089790344238, 0.13611719012260437, 0.14850348234176636, 0.16088975965976715, 0.17327603697776794, 0.18566232919692993, 0.19804860651493073, 0.2104348987340927, 0.2228211760520935, 0.2352074682712555, 0.24759376049041748, 0.2599800229072571, 0.27236634492874146, 0.28475263714790344, 0.29713892936706543, 0.30952519178390503, 0.321911484003067, 0.334297776222229, 0.346684068441391, 0.359070360660553, 0.3714566230773926, 0.38384291529655457, 0.39622920751571655, 0.40861546993255615, 0.42100176215171814, 0.4333880543708801, 0.4457743465900421, 0.4581606388092041, 0.4705469012260437]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 11.0, 6.0, 11.0, 12.0, 15.0, 17.0, 38.0, 40.0, 71.0, 111.0, 161.0, 313.0, 609.0, 1465.0, 3693.0, 10713.0, 36885.0, 175171.0, 558455.0, 201001.0, 41219.0, 11582.0, 3904.0, 1589.0, 634.0, 310.0, 165.0, 111.0, 58.0, 53.0, 36.0, 21.0, 16.0, 14.0, 9.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66748046875, -0.6463165283203125, -0.625152587890625, -0.6039886474609375, -0.58282470703125, -0.5616607666015625, -0.540496826171875, -0.5193328857421875, -0.4981689453125, -0.4770050048828125, -0.455841064453125, -0.4346771240234375, -0.41351318359375, -0.3923492431640625, -0.371185302734375, -0.3500213623046875, -0.328857421875, -0.3076934814453125, -0.286529541015625, -0.2653656005859375, -0.24420166015625, -0.2230377197265625, -0.201873779296875, -0.1807098388671875, -0.1595458984375, -0.1383819580078125, -0.117218017578125, -0.0960540771484375, -0.07489013671875, -0.0537261962890625, -0.032562255859375, -0.0113983154296875, 0.009765625, 0.0309295654296875, 0.052093505859375, 0.0732574462890625, 0.09442138671875, 0.1155853271484375, 0.136749267578125, 0.1579132080078125, 0.1790771484375, 0.2002410888671875, 0.221405029296875, 0.2425689697265625, 0.26373291015625, 0.2848968505859375, 0.306060791015625, 0.3272247314453125, 0.348388671875, 0.3695526123046875, 0.390716552734375, 0.4118804931640625, 0.43304443359375, 0.4542083740234375, 0.475372314453125, 0.4965362548828125, 0.5177001953125, 0.5388641357421875, 0.560028076171875, 0.5811920166015625, 0.60235595703125, 0.6235198974609375, 0.644683837890625, 0.6658477783203125, 0.68701171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 8.0, 9.0, 13.0, 7.0, 11.0, 11.0, 23.0, 26.0, 31.0, 20.0, 32.0, 33.0, 33.0, 45.0, 39.0, 45.0, 48.0, 48.0, 49.0, 37.0, 57.0, 47.0, 38.0, 48.0, 31.0, 39.0, 29.0, 22.0, 17.0, 16.0, 14.0, 14.0, 18.0, 12.0, 7.0, 7.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.365234375, -0.35382080078125, -0.3424072265625, -0.33099365234375, -0.319580078125, -0.30816650390625, -0.2967529296875, -0.28533935546875, -0.27392578125, -0.26251220703125, -0.2510986328125, -0.23968505859375, -0.228271484375, -0.21685791015625, -0.2054443359375, -0.19403076171875, -0.1826171875, -0.17120361328125, -0.1597900390625, -0.14837646484375, -0.136962890625, -0.12554931640625, -0.1141357421875, -0.10272216796875, -0.09130859375, -0.07989501953125, -0.0684814453125, -0.05706787109375, -0.045654296875, -0.03424072265625, -0.0228271484375, -0.01141357421875, 0.0, 0.01141357421875, 0.0228271484375, 0.03424072265625, 0.045654296875, 0.05706787109375, 0.0684814453125, 0.07989501953125, 0.09130859375, 0.10272216796875, 0.1141357421875, 0.12554931640625, 0.136962890625, 0.14837646484375, 0.1597900390625, 0.17120361328125, 0.1826171875, 0.19403076171875, 0.2054443359375, 0.21685791015625, 0.228271484375, 0.23968505859375, 0.2510986328125, 0.26251220703125, 0.27392578125, 0.28533935546875, 0.2967529296875, 0.30816650390625, 0.319580078125, 0.33099365234375, 0.3424072265625, 0.35382080078125, 0.365234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 8.0, 10.0, 15.0, 17.0, 32.0, 54.0, 69.0, 124.0, 240.0, 505.0, 1194.0, 3694.0, 14903.0, 106730.0, 781236.0, 117639.0, 15885.0, 3828.0, 1263.0, 475.0, 238.0, 148.0, 82.0, 47.0, 32.0, 24.0, 18.0, 9.0, 7.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.20703125, -1.1710205078125, -1.135009765625, -1.0989990234375, -1.06298828125, -1.0269775390625, -0.990966796875, -0.9549560546875, -0.9189453125, -0.8829345703125, -0.846923828125, -0.8109130859375, -0.77490234375, -0.7388916015625, -0.702880859375, -0.6668701171875, -0.630859375, -0.5948486328125, -0.558837890625, -0.5228271484375, -0.48681640625, -0.4508056640625, -0.414794921875, -0.3787841796875, -0.3427734375, -0.3067626953125, -0.270751953125, -0.2347412109375, -0.19873046875, -0.1627197265625, -0.126708984375, -0.0906982421875, -0.0546875, -0.0186767578125, 0.017333984375, 0.0533447265625, 0.08935546875, 0.1253662109375, 0.161376953125, 0.1973876953125, 0.2333984375, 0.2694091796875, 0.305419921875, 0.3414306640625, 0.37744140625, 0.4134521484375, 0.449462890625, 0.4854736328125, 0.521484375, 0.5574951171875, 0.593505859375, 0.6295166015625, 0.66552734375, 0.7015380859375, 0.737548828125, 0.7735595703125, 0.8095703125, 0.8455810546875, 0.881591796875, 0.9176025390625, 0.95361328125, 0.9896240234375, 1.025634765625, 1.0616455078125, 1.09765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 7.0, 13.0, 26.0, 18.0, 31.0, 29.0, 38.0, 48.0, 54.0, 58.0, 49.0, 71.0, 73.0, 76.0, 60.0, 65.0, 56.0, 31.0, 40.0, 30.0, 22.0, 22.0, 20.0, 12.0, 7.0, 10.0, 6.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.872589111328125, -1.79010009765625, -1.707611083984375, -1.6251220703125, -1.542633056640625, -1.46014404296875, -1.377655029296875, -1.295166015625, -1.212677001953125, -1.13018798828125, -1.047698974609375, -0.9652099609375, -0.882720947265625, -0.80023193359375, -0.717742919921875, -0.63525390625, -0.552764892578125, -0.47027587890625, -0.387786865234375, -0.3052978515625, -0.222808837890625, -0.14031982421875, -0.057830810546875, 0.024658203125, 0.107147216796875, 0.18963623046875, 0.272125244140625, 0.3546142578125, 0.437103271484375, 0.51959228515625, 0.602081298828125, 0.6845703125, 0.767059326171875, 0.84954833984375, 0.932037353515625, 1.0145263671875, 1.097015380859375, 1.17950439453125, 1.261993408203125, 1.344482421875, 1.426971435546875, 1.50946044921875, 1.591949462890625, 1.6744384765625, 1.756927490234375, 1.83941650390625, 1.921905517578125, 2.00439453125, 2.086883544921875, 2.16937255859375, 2.251861572265625, 2.3343505859375, 2.416839599609375, 2.49932861328125, 2.581817626953125, 2.664306640625, 2.746795654296875, 2.82928466796875, 2.911773681640625, 2.9942626953125, 3.076751708984375, 3.15924072265625, 3.241729736328125, 3.32421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 10.0, 21.0, 55.0, 190.0, 866.0, 184153.0, 861774.0, 1115.0, 215.0, 77.0, 36.0, 7.0, 4.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7978515625, -1.7230987548828125, -1.648345947265625, -1.5735931396484375, -1.49884033203125, -1.4240875244140625, -1.349334716796875, -1.2745819091796875, -1.1998291015625, -1.1250762939453125, -1.050323486328125, -0.9755706787109375, -0.90081787109375, -0.8260650634765625, -0.751312255859375, -0.6765594482421875, -0.601806640625, -0.5270538330078125, -0.452301025390625, -0.3775482177734375, -0.30279541015625, -0.2280426025390625, -0.153289794921875, -0.0785369873046875, -0.0037841796875, 0.0709686279296875, 0.145721435546875, 0.2204742431640625, 0.29522705078125, 0.3699798583984375, 0.444732666015625, 0.5194854736328125, 0.59423828125, 0.6689910888671875, 0.743743896484375, 0.8184967041015625, 0.89324951171875, 0.9680023193359375, 1.042755126953125, 1.1175079345703125, 1.1922607421875, 1.2670135498046875, 1.341766357421875, 1.4165191650390625, 1.49127197265625, 1.5660247802734375, 1.640777587890625, 1.7155303955078125, 1.790283203125, 1.8650360107421875, 1.939788818359375, 2.0145416259765625, 2.08929443359375, 2.1640472412109375, 2.238800048828125, 2.3135528564453125, 2.3883056640625, 2.4630584716796875, 2.537811279296875, 2.6125640869140625, 2.68731689453125, 2.7620697021484375, 2.836822509765625, 2.9115753173828125, 2.986328125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 12.0, 7.0, 8.0, 18.0, 26.0, 36.0, 50.0, 80.0, 76.0, 102.0, 131.0, 103.0, 87.0, 85.0, 48.0, 38.0, 29.0, 17.0, 5.0, 15.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.733438491821289e-05, -9.35560092329979e-05, -8.97776335477829e-05, -8.59992578625679e-05, -8.22208821773529e-05, -7.844250649213791e-05, -7.466413080692291e-05, -7.088575512170792e-05, -6.710737943649292e-05, -6.332900375127792e-05, -5.955062806606293e-05, -5.577225238084793e-05, -5.1993876695632935e-05, -4.821550101041794e-05, -4.443712532520294e-05, -4.0658749639987946e-05, -3.688037395477295e-05, -3.310199826955795e-05, -2.9323622584342957e-05, -2.554524689912796e-05, -2.1766871213912964e-05, -1.7988495528697968e-05, -1.4210119843482971e-05, -1.0431744158267975e-05, -6.6533684730529785e-06, -2.874992787837982e-06, 9.033828973770142e-07, 4.6817585825920105e-06, 8.460134267807007e-06, 1.2238509953022003e-05, 1.6016885638237e-05, 1.9795261323451996e-05, 2.3573637008666992e-05, 2.735201269388199e-05, 3.1130388379096985e-05, 3.490876406431198e-05, 3.868713974952698e-05, 4.2465515434741974e-05, 4.624389111995697e-05, 5.0022266805171967e-05, 5.380064249038696e-05, 5.757901817560196e-05, 6.135739386081696e-05, 6.513576954603195e-05, 6.891414523124695e-05, 7.269252091646194e-05, 7.647089660167694e-05, 8.024927228689194e-05, 8.402764797210693e-05, 8.780602365732193e-05, 9.158439934253693e-05, 9.536277502775192e-05, 9.914115071296692e-05, 0.00010291952639818192, 0.00010669790208339691, 0.00011047627776861191, 0.0001142546534538269, 0.0001180330291390419, 0.0001218114048242569, 0.0001255897805094719, 0.0001293681561946869, 0.00013314653187990189, 0.00013692490756511688, 0.00014070328325033188, 0.00014448165893554688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 7.0, 13.0, 17.0, 22.0, 53.0, 73.0, 221.0, 933.0, 23965.0, 1015745.0, 6629.0, 566.0, 160.0, 58.0, 44.0, 22.0, 15.0, 9.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.979339599609375, -0.94598388671875, -0.912628173828125, -0.8792724609375, -0.845916748046875, -0.81256103515625, -0.779205322265625, -0.745849609375, -0.712493896484375, -0.67913818359375, -0.645782470703125, -0.6124267578125, -0.579071044921875, -0.54571533203125, -0.512359619140625, -0.47900390625, -0.445648193359375, -0.41229248046875, -0.378936767578125, -0.3455810546875, -0.312225341796875, -0.27886962890625, -0.245513916015625, -0.212158203125, -0.178802490234375, -0.14544677734375, -0.112091064453125, -0.0787353515625, -0.045379638671875, -0.01202392578125, 0.021331787109375, 0.0546875, 0.088043212890625, 0.12139892578125, 0.154754638671875, 0.1881103515625, 0.221466064453125, 0.25482177734375, 0.288177490234375, 0.321533203125, 0.354888916015625, 0.38824462890625, 0.421600341796875, 0.4549560546875, 0.488311767578125, 0.52166748046875, 0.555023193359375, 0.58837890625, 0.621734619140625, 0.65509033203125, 0.688446044921875, 0.7218017578125, 0.755157470703125, 0.78851318359375, 0.821868896484375, 0.855224609375, 0.888580322265625, 0.92193603515625, 0.955291748046875, 0.9886474609375, 1.022003173828125, 1.05535888671875, 1.088714599609375, 1.1220703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 18.0, 49.0, 224.0, 382.0, 206.0, 70.0, 22.0, 7.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.0650177001953125, -2.020660400390625, -1.9763031005859375, -1.93194580078125, -1.8875885009765625, -1.843231201171875, -1.7988739013671875, -1.7545166015625, -1.7101593017578125, -1.665802001953125, -1.6214447021484375, -1.57708740234375, -1.5327301025390625, -1.488372802734375, -1.4440155029296875, -1.399658203125, -1.3553009033203125, -1.310943603515625, -1.2665863037109375, -1.22222900390625, -1.1778717041015625, -1.133514404296875, -1.0891571044921875, -1.0447998046875, -1.0004425048828125, -0.956085205078125, -0.9117279052734375, -0.86737060546875, -0.8230133056640625, -0.778656005859375, -0.7342987060546875, -0.68994140625, -0.6455841064453125, -0.601226806640625, -0.5568695068359375, -0.51251220703125, -0.4681549072265625, -0.423797607421875, -0.3794403076171875, -0.3350830078125, -0.2907257080078125, -0.246368408203125, -0.2020111083984375, -0.15765380859375, -0.1132965087890625, -0.068939208984375, -0.0245819091796875, 0.019775390625, 0.0641326904296875, 0.108489990234375, 0.1528472900390625, 0.19720458984375, 0.2415618896484375, 0.285919189453125, 0.3302764892578125, 0.3746337890625, 0.4189910888671875, 0.463348388671875, 0.5077056884765625, 0.55206298828125, 0.5964202880859375, 0.640777587890625, 0.6851348876953125, 0.7294921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 12.0, 12.0, 32.0, 33.0, 65.0, 102.0, 180.0, 166.0, 157.0, 87.0, 65.0, 35.0, 27.0, 17.0, 7.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4891886711120605, -5.271323204040527, -5.053457736968994, -4.835592269897461, -4.617727279663086, -4.3998613357543945, -4.1819963455200195, -3.9641308784484863, -3.746265411376953, -3.52839994430542, -3.3105344772338867, -3.0926692485809326, -2.8748037815093994, -2.656938314437866, -2.439073085784912, -2.221207618713379, -2.0033421516418457, -1.7854766845703125, -1.5676113367080688, -1.3497459888458252, -1.131880521774292, -0.9140150547027588, -0.6961497068405151, -0.4782843589782715, -0.2604188919067383, -0.042553484439849854, 0.17531192302703857, 0.393177330493927, 0.6110427379608154, 0.8289082050323486, 1.0467735528945923, 1.264638900756836, 1.482503890991211, 1.7003693580627441, 1.9182347059249878, 2.1361000537872314, 2.3539655208587646, 2.571830987930298, 2.789696216583252, 3.007561683654785, 3.2254271507263184, 3.4432926177978516, 3.6611580848693848, 3.879023313522339, 4.096888542175293, 4.314754486083984, 4.532619476318359, 4.750484943389893, 4.968350410461426, 5.186215877532959, 5.404081344604492, 5.621946811676025, 5.839812278747559, 6.057677268981934, 6.275542736053467, 6.493408203125, 6.711273670196533, 6.929139137268066, 7.1470046043396, 7.364870071411133, 7.582735061645508, 7.800601005554199, 8.018465995788574, 8.236331939697266, 8.45419692993164]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 3.0, 7.0, 9.0, 12.0, 11.0, 23.0, 10.0, 21.0, 10.0, 23.0, 26.0, 25.0, 35.0, 35.0, 47.0, 54.0, 46.0, 56.0, 51.0, 49.0, 58.0, 45.0, 36.0, 47.0, 42.0, 40.0, 37.0, 23.0, 22.0, 18.0, 14.0, 13.0, 10.0, 8.0, 4.0, 4.0, 5.0, 7.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.621416091918945, -9.329771995544434, -9.038126945495605, -8.746482849121094, -8.454837799072266, -8.163193702697754, -7.871549129486084, -7.579904556274414, -7.288260459899902, -6.996615886688232, -6.7049713134765625, -6.413327217102051, -6.121682643890381, -5.830038070678711, -5.538393497467041, -5.246748924255371, -4.955104351043701, -4.663459777832031, -4.371815204620361, -4.080170631408691, -3.7885265350341797, -3.4968819618225098, -3.20523738861084, -2.913593053817749, -2.621948480606079, -2.330303907394409, -2.0386595726013184, -1.7470149993896484, -1.455370545387268, -1.1637260913848877, -0.8720815181732178, -0.580437183380127, -0.28879261016845703, 0.0028518736362457275, 0.2944963574409485, 0.5861408710479736, 0.877785325050354, 1.1694297790527344, 1.4610743522644043, 1.7527186870574951, 2.044363260269165, 2.336007833480835, 2.627652168273926, 2.9192967414855957, 3.2109413146972656, 3.5025856494903564, 3.7942302227020264, 4.085874557495117, 4.377519130706787, 4.669163703918457, 4.960808277130127, 5.252452850341797, 5.544096946716309, 5.8357415199279785, 6.127386093139648, 6.41903018951416, 6.710675239562988, 7.002319812774658, 7.293964385986328, 7.58560848236084, 7.87725305557251, 8.16889762878418, 8.460542678833008, 8.75218677520752, 9.043830871582031]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 3.0, 2.0, 6.0, 9.0, 9.0, 8.0, 22.0, 34.0, 42.0, 58.0, 87.0, 139.0, 246.0, 473.0, 1070.0, 2844.0, 12698.0, 847141.0, 3311650.0, 12887.0, 2848.0, 986.0, 431.0, 241.0, 133.0, 80.0, 51.0, 29.0, 15.0, 10.0, 13.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8955078125, -0.8699264526367188, -0.8443450927734375, -0.8187637329101562, -0.793182373046875, -0.7676010131835938, -0.7420196533203125, -0.7164382934570312, -0.69085693359375, -0.6652755737304688, -0.6396942138671875, -0.6141128540039062, -0.588531494140625, -0.5629501342773438, -0.5373687744140625, -0.5117874145507812, -0.4862060546875, -0.46062469482421875, -0.4350433349609375, -0.40946197509765625, -0.383880615234375, -0.35829925537109375, -0.3327178955078125, -0.30713653564453125, -0.28155517578125, -0.25597381591796875, -0.2303924560546875, -0.20481109619140625, -0.179229736328125, -0.15364837646484375, -0.1280670166015625, -0.10248565673828125, -0.076904296875, -0.05132293701171875, -0.0257415771484375, -0.00016021728515625, 0.025421142578125, 0.05100250244140625, 0.0765838623046875, 0.10216522216796875, 0.12774658203125, 0.15332794189453125, 0.1789093017578125, 0.20449066162109375, 0.230072021484375, 0.25565338134765625, 0.2812347412109375, 0.30681610107421875, 0.3323974609375, 0.35797882080078125, 0.3835601806640625, 0.40914154052734375, 0.434722900390625, 0.46030426025390625, 0.4858856201171875, 0.5114669799804688, 0.53704833984375, 0.5626296997070312, 0.5882110595703125, 0.6137924194335938, 0.639373779296875, 0.6649551391601562, 0.6905364990234375, 0.7161178588867188, 0.74169921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 7.0, 7.0, 12.0, 20.0, 22.0, 25.0, 31.0, 23.0, 39.0, 44.0, 52.0, 54.0, 46.0, 60.0, 60.0, 62.0, 56.0, 45.0, 55.0, 44.0, 39.0, 30.0, 29.0, 22.0, 18.0, 29.0, 13.0, 8.0, 11.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.513671875, -0.4992103576660156, -0.48474884033203125, -0.4702873229980469, -0.4558258056640625, -0.4413642883300781, -0.42690277099609375, -0.4124412536621094, -0.397979736328125, -0.3835182189941406, -0.36905670166015625, -0.3545951843261719, -0.3401336669921875, -0.3256721496582031, -0.31121063232421875, -0.2967491149902344, -0.28228759765625, -0.2678260803222656, -0.25336456298828125, -0.23890304565429688, -0.2244415283203125, -0.20998001098632812, -0.19551849365234375, -0.18105697631835938, -0.166595458984375, -0.15213394165039062, -0.13767242431640625, -0.12321090698242188, -0.1087493896484375, -0.09428787231445312, -0.07982635498046875, -0.06536483764648438, -0.0509033203125, -0.036441802978515625, -0.02198028564453125, -0.007518768310546875, 0.0069427490234375, 0.021404266357421875, 0.03586578369140625, 0.050327301025390625, 0.064788818359375, 0.07925033569335938, 0.09371185302734375, 0.10817337036132812, 0.1226348876953125, 0.13709640502929688, 0.15155792236328125, 0.16601943969726562, 0.18048095703125, 0.19494247436523438, 0.20940399169921875, 0.22386550903320312, 0.2383270263671875, 0.2527885437011719, 0.26725006103515625, 0.2817115783691406, 0.296173095703125, 0.3106346130371094, 0.32509613037109375, 0.3395576477050781, 0.3540191650390625, 0.3684806823730469, 0.38294219970703125, 0.3974037170410156, 0.411865234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 2.0, 5.0, 4.0, 10.0, 13.0, 11.0, 21.0, 28.0, 38.0, 46.0, 66.0, 107.0, 111.0, 156.0, 237.0, 486.0, 725.0, 1377.0, 2818.0, 6711.0, 23421.0, 219023.0, 3854448.0, 63048.0, 12408.0, 4341.0, 1966.0, 1023.0, 578.0, 324.0, 214.0, 119.0, 94.0, 68.0, 57.0, 50.0, 27.0, 31.0, 18.0, 16.0, 9.0, 11.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.417724609375, -0.4034538269042969, -0.38918304443359375, -0.3749122619628906, -0.3606414794921875, -0.3463706970214844, -0.33209991455078125, -0.3178291320800781, -0.303558349609375, -0.2892875671386719, -0.27501678466796875, -0.2607460021972656, -0.2464752197265625, -0.23220443725585938, -0.21793365478515625, -0.20366287231445312, -0.18939208984375, -0.17512130737304688, -0.16085052490234375, -0.14657974243164062, -0.1323089599609375, -0.11803817749023438, -0.10376739501953125, -0.08949661254882812, -0.075225830078125, -0.060955047607421875, -0.04668426513671875, -0.032413482666015625, -0.0181427001953125, -0.003871917724609375, 0.01039886474609375, 0.024669647216796875, 0.0389404296875, 0.053211212158203125, 0.06748199462890625, 0.08175277709960938, 0.0960235595703125, 0.11029434204101562, 0.12456512451171875, 0.13883590698242188, 0.153106689453125, 0.16737747192382812, 0.18164825439453125, 0.19591903686523438, 0.2101898193359375, 0.22446060180664062, 0.23873138427734375, 0.2530021667480469, 0.26727294921875, 0.2815437316894531, 0.29581451416015625, 0.3100852966308594, 0.3243560791015625, 0.3386268615722656, 0.35289764404296875, 0.3671684265136719, 0.381439208984375, 0.3957099914550781, 0.40998077392578125, 0.4242515563964844, 0.4385223388671875, 0.4527931213378906, 0.46706390380859375, 0.4813346862792969, 0.49560546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 10.0, 15.0, 18.0, 50.0, 198.0, 3442.0, 240.0, 55.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290771484375, -0.2818450927734375, -0.272918701171875, -0.2639923095703125, -0.25506591796875, -0.2461395263671875, -0.237213134765625, -0.2282867431640625, -0.2193603515625, -0.2104339599609375, -0.201507568359375, -0.1925811767578125, -0.18365478515625, -0.1747283935546875, -0.165802001953125, -0.1568756103515625, -0.14794921875, -0.1390228271484375, -0.130096435546875, -0.1211700439453125, -0.11224365234375, -0.1033172607421875, -0.094390869140625, -0.0854644775390625, -0.0765380859375, -0.0676116943359375, -0.058685302734375, -0.0497589111328125, -0.04083251953125, -0.0319061279296875, -0.022979736328125, -0.0140533447265625, -0.005126953125, 0.0037994384765625, 0.012725830078125, 0.0216522216796875, 0.03057861328125, 0.0395050048828125, 0.048431396484375, 0.0573577880859375, 0.0662841796875, 0.0752105712890625, 0.084136962890625, 0.0930633544921875, 0.10198974609375, 0.1109161376953125, 0.119842529296875, 0.1287689208984375, 0.1376953125, 0.1466217041015625, 0.155548095703125, 0.1644744873046875, 0.17340087890625, 0.1823272705078125, 0.191253662109375, 0.2001800537109375, 0.2091064453125, 0.2180328369140625, 0.226959228515625, 0.2358856201171875, 0.24481201171875, 0.2537384033203125, 0.262664794921875, 0.2715911865234375, 0.280517578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 19.0, 61.0, 186.0, 296.0, 256.0, 137.0, 33.0, 12.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8239659070968628, -0.791095495223999, -0.75822514295578, -0.7253547310829163, -0.6924843788146973, -0.6596139669418335, -0.6267435550689697, -0.593873143196106, -0.561002790927887, -0.5281323790550232, -0.4952620267868042, -0.46239161491394043, -0.42952123284339905, -0.39665085077285767, -0.3637804388999939, -0.3309100568294525, -0.29803967475891113, -0.26516929268836975, -0.23229889571666718, -0.1994284987449646, -0.16655811667442322, -0.13368773460388184, -0.10081733763217926, -0.06794694066047668, -0.0350765585899353, -0.002206169068813324, 0.030664220452308655, 0.06353460997343063, 0.09640499949455261, 0.129275381565094, 0.16214577853679657, 0.19501617550849915, 0.22788643836975098, 0.26075682044029236, 0.29362720251083374, 0.3264976143836975, 0.3593679964542389, 0.3922383785247803, 0.42510879039764404, 0.4579791724681854, 0.4908495545387268, 0.5237199664115906, 0.5565903186798096, 0.5894607305526733, 0.6223311424255371, 0.6552014946937561, 0.6880719065666199, 0.7209422588348389, 0.7538126707077026, 0.7866830825805664, 0.8195534348487854, 0.8524238467216492, 0.8852941989898682, 0.9181646108627319, 0.9510350227355957, 0.9839054346084595, 1.0167758464813232, 1.049646258354187, 1.0825166702270508, 1.115386962890625, 1.1482573747634888, 1.1811277866363525, 1.2139981985092163, 1.24686861038208, 1.2797389030456543]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 14.0, 16.0, 13.0, 23.0, 24.0, 29.0, 32.0, 38.0, 37.0, 40.0, 42.0, 43.0, 52.0, 54.0, 55.0, 58.0, 50.0, 55.0, 32.0, 48.0, 34.0, 29.0, 35.0, 20.0, 28.0, 18.0, 16.0, 18.0, 10.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3616759181022644, -0.34910592436790466, -0.3365359306335449, -0.32396596670150757, -0.3113959729671478, -0.2988259792327881, -0.28625598549842834, -0.2736859917640686, -0.26111602783203125, -0.2485460340976715, -0.23597605526447296, -0.22340606153011322, -0.21083608269691467, -0.19826608896255493, -0.1856960952281952, -0.17312610149383545, -0.1605561077594757, -0.14798611402511597, -0.13541613519191742, -0.12284614145755768, -0.11027615517377853, -0.09770616888999939, -0.08513617515563965, -0.0725661888718605, -0.05999620258808136, -0.047426216304302216, -0.03485622629523277, -0.02228623628616333, -0.009716250002384186, 0.0028537362813949585, 0.0154237300157547, 0.027993716299533844, 0.04056370258331299, 0.05313368886709213, 0.06570367515087128, 0.07827366888523102, 0.09084365516901016, 0.1034136414527893, 0.11598363518714905, 0.1285536289215088, 0.14112360775470734, 0.15369360148906708, 0.16626358032226562, 0.17883357405662537, 0.1914035677909851, 0.20397354662418365, 0.2165435403585434, 0.22911351919174194, 0.24168351292610168, 0.2542535066604614, 0.26682350039482117, 0.2793934941291809, 0.29196345806121826, 0.304533451795578, 0.31710344552993774, 0.3296734392642975, 0.3422434329986572, 0.35481342673301697, 0.3673834204673767, 0.37995338439941406, 0.3925233781337738, 0.40509337186813354, 0.4176633656024933, 0.430233359336853, 0.4428033232688904]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 11.0, 17.0, 25.0, 37.0, 78.0, 123.0, 266.0, 535.0, 1285.0, 3519.0, 11558.0, 50822.0, 305097.0, 543072.0, 102342.0, 20661.0, 5647.0, 1876.0, 788.0, 367.0, 188.0, 85.0, 56.0, 35.0, 19.0, 14.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5537109375, -0.5308380126953125, -0.507965087890625, -0.4850921630859375, -0.46221923828125, -0.4393463134765625, -0.416473388671875, -0.3936004638671875, -0.3707275390625, -0.3478546142578125, -0.324981689453125, -0.3021087646484375, -0.27923583984375, -0.2563629150390625, -0.233489990234375, -0.2106170654296875, -0.187744140625, -0.1648712158203125, -0.141998291015625, -0.1191253662109375, -0.09625244140625, -0.0733795166015625, -0.050506591796875, -0.0276336669921875, -0.0047607421875, 0.0181121826171875, 0.040985107421875, 0.0638580322265625, 0.08673095703125, 0.1096038818359375, 0.132476806640625, 0.1553497314453125, 0.17822265625, 0.2010955810546875, 0.223968505859375, 0.2468414306640625, 0.26971435546875, 0.2925872802734375, 0.315460205078125, 0.3383331298828125, 0.3612060546875, 0.3840789794921875, 0.406951904296875, 0.4298248291015625, 0.45269775390625, 0.4755706787109375, 0.498443603515625, 0.5213165283203125, 0.544189453125, 0.5670623779296875, 0.589935302734375, 0.6128082275390625, 0.63568115234375, 0.6585540771484375, 0.681427001953125, 0.7042999267578125, 0.7271728515625, 0.7500457763671875, 0.772918701171875, 0.7957916259765625, 0.81866455078125, 0.8415374755859375, 0.864410400390625, 0.8872833251953125, 0.91015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 13.0, 8.0, 18.0, 21.0, 15.0, 23.0, 32.0, 19.0, 40.0, 48.0, 37.0, 49.0, 58.0, 54.0, 58.0, 52.0, 63.0, 53.0, 41.0, 37.0, 43.0, 42.0, 23.0, 29.0, 26.0, 17.0, 20.0, 11.0, 16.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.48974609375, -0.4760704040527344, -0.46239471435546875, -0.4487190246582031, -0.4350433349609375, -0.4213676452636719, -0.40769195556640625, -0.3940162658691406, -0.380340576171875, -0.3666648864746094, -0.35298919677734375, -0.3393135070800781, -0.3256378173828125, -0.3119621276855469, -0.29828643798828125, -0.2846107482910156, -0.27093505859375, -0.2572593688964844, -0.24358367919921875, -0.22990798950195312, -0.2162322998046875, -0.20255661010742188, -0.18888092041015625, -0.17520523071289062, -0.161529541015625, -0.14785385131835938, -0.13417816162109375, -0.12050247192382812, -0.1068267822265625, -0.09315109252929688, -0.07947540283203125, -0.06579971313476562, -0.0521240234375, -0.038448333740234375, -0.02477264404296875, -0.011096954345703125, 0.0025787353515625, 0.016254425048828125, 0.02993011474609375, 0.043605804443359375, 0.057281494140625, 0.07095718383789062, 0.08463287353515625, 0.09830856323242188, 0.1119842529296875, 0.12565994262695312, 0.13933563232421875, 0.15301132202148438, 0.16668701171875, 0.18036270141601562, 0.19403839111328125, 0.20771408081054688, 0.2213897705078125, 0.23506546020507812, 0.24874114990234375, 0.2624168395996094, 0.276092529296875, 0.2897682189941406, 0.30344390869140625, 0.3171195983886719, 0.3307952880859375, 0.3444709777832031, 0.35814666748046875, 0.3718223571777344, 0.385498046875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 5.0, 7.0, 9.0, 24.0, 39.0, 67.0, 119.0, 289.0, 712.0, 2946.0, 29303.0, 841453.0, 163411.0, 7936.0, 1386.0, 436.0, 151.0, 96.0, 61.0, 32.0, 13.0, 15.0, 13.0, 3.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.9326171875, -1.8827362060546875, -1.832855224609375, -1.7829742431640625, -1.73309326171875, -1.6832122802734375, -1.633331298828125, -1.5834503173828125, -1.5335693359375, -1.4836883544921875, -1.433807373046875, -1.3839263916015625, -1.33404541015625, -1.2841644287109375, -1.234283447265625, -1.1844024658203125, -1.134521484375, -1.0846405029296875, -1.034759521484375, -0.9848785400390625, -0.93499755859375, -0.8851165771484375, -0.835235595703125, -0.7853546142578125, -0.7354736328125, -0.6855926513671875, -0.635711669921875, -0.5858306884765625, -0.53594970703125, -0.4860687255859375, -0.436187744140625, -0.3863067626953125, -0.33642578125, -0.2865447998046875, -0.236663818359375, -0.1867828369140625, -0.13690185546875, -0.0870208740234375, -0.037139892578125, 0.0127410888671875, 0.0626220703125, 0.1125030517578125, 0.162384033203125, 0.2122650146484375, 0.26214599609375, 0.3120269775390625, 0.361907958984375, 0.4117889404296875, 0.461669921875, 0.5115509033203125, 0.561431884765625, 0.6113128662109375, 0.66119384765625, 0.7110748291015625, 0.760955810546875, 0.8108367919921875, 0.8607177734375, 0.9105987548828125, 0.960479736328125, 1.0103607177734375, 1.06024169921875, 1.1101226806640625, 1.160003662109375, 1.2098846435546875, 1.259765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 14.0, 16.0, 19.0, 28.0, 33.0, 53.0, 37.0, 58.0, 57.0, 53.0, 67.0, 58.0, 83.0, 63.0, 67.0, 56.0, 46.0, 37.0, 32.0, 39.0, 15.0, 19.0, 8.0, 10.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.443359375, -2.36749267578125, -2.2916259765625, -2.21575927734375, -2.139892578125, -2.06402587890625, -1.9881591796875, -1.91229248046875, -1.83642578125, -1.76055908203125, -1.6846923828125, -1.60882568359375, -1.532958984375, -1.45709228515625, -1.3812255859375, -1.30535888671875, -1.2294921875, -1.15362548828125, -1.0777587890625, -1.00189208984375, -0.926025390625, -0.85015869140625, -0.7742919921875, -0.69842529296875, -0.62255859375, -0.54669189453125, -0.4708251953125, -0.39495849609375, -0.319091796875, -0.24322509765625, -0.1673583984375, -0.09149169921875, -0.015625, 0.06024169921875, 0.1361083984375, 0.21197509765625, 0.287841796875, 0.36370849609375, 0.4395751953125, 0.51544189453125, 0.59130859375, 0.66717529296875, 0.7430419921875, 0.81890869140625, 0.894775390625, 0.97064208984375, 1.0465087890625, 1.12237548828125, 1.1982421875, 1.27410888671875, 1.3499755859375, 1.42584228515625, 1.501708984375, 1.57757568359375, 1.6534423828125, 1.72930908203125, 1.80517578125, 1.88104248046875, 1.9569091796875, 2.03277587890625, 2.108642578125, 2.18450927734375, 2.2603759765625, 2.33624267578125, 2.412109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 26.0, 68.0, 193.0, 1625.0, 1039715.0, 6486.0, 316.0, 77.0, 27.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.857421875, -3.771026611328125, -3.68463134765625, -3.598236083984375, -3.5118408203125, -3.425445556640625, -3.33905029296875, -3.252655029296875, -3.166259765625, -3.079864501953125, -2.99346923828125, -2.907073974609375, -2.8206787109375, -2.734283447265625, -2.64788818359375, -2.561492919921875, -2.47509765625, -2.388702392578125, -2.30230712890625, -2.215911865234375, -2.1295166015625, -2.043121337890625, -1.95672607421875, -1.870330810546875, -1.783935546875, -1.697540283203125, -1.61114501953125, -1.524749755859375, -1.4383544921875, -1.351959228515625, -1.26556396484375, -1.179168701171875, -1.0927734375, -1.006378173828125, -0.91998291015625, -0.833587646484375, -0.7471923828125, -0.660797119140625, -0.57440185546875, -0.488006591796875, -0.401611328125, -0.315216064453125, -0.22882080078125, -0.142425537109375, -0.0560302734375, 0.030364990234375, 0.11676025390625, 0.203155517578125, 0.28955078125, 0.375946044921875, 0.46234130859375, 0.548736572265625, 0.6351318359375, 0.721527099609375, 0.80792236328125, 0.894317626953125, 0.980712890625, 1.067108154296875, 1.15350341796875, 1.239898681640625, 1.3262939453125, 1.412689208984375, 1.49908447265625, 1.585479736328125, 1.671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 4.0, 8.0, 6.0, 15.0, 25.0, 28.0, 32.0, 38.0, 58.0, 66.0, 81.0, 118.0, 97.0, 102.0, 79.0, 48.0, 39.0, 32.0, 21.0, 21.0, 15.0, 23.0, 7.0, 6.0, 7.0, 9.0, 2.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5789947509765625e-05, -5.357526242733002e-05, -5.136057734489441e-05, -4.91458922624588e-05, -4.693120718002319e-05, -4.4716522097587585e-05, -4.250183701515198e-05, -4.028715193271637e-05, -3.807246685028076e-05, -3.5857781767845154e-05, -3.3643096685409546e-05, -3.142841160297394e-05, -2.921372652053833e-05, -2.6999041438102722e-05, -2.4784356355667114e-05, -2.2569671273231506e-05, -2.03549861907959e-05, -1.814030110836029e-05, -1.5925616025924683e-05, -1.3710930943489075e-05, -1.1496245861053467e-05, -9.281560778617859e-06, -7.066875696182251e-06, -4.852190613746643e-06, -2.637505531311035e-06, -4.2282044887542725e-07, 1.7918646335601807e-06, 4.0065497159957886e-06, 6.2212347984313965e-06, 8.435919880867004e-06, 1.0650604963302612e-05, 1.286529004573822e-05, 1.5079975128173828e-05, 1.7294660210609436e-05, 1.9509345293045044e-05, 2.1724030375480652e-05, 2.393871545791626e-05, 2.6153400540351868e-05, 2.8368085622787476e-05, 3.0582770705223083e-05, 3.279745578765869e-05, 3.50121408700943e-05, 3.722682595252991e-05, 3.9441511034965515e-05, 4.165619611740112e-05, 4.387088119983673e-05, 4.608556628227234e-05, 4.830025136470795e-05, 5.0514936447143555e-05, 5.272962152957916e-05, 5.494430661201477e-05, 5.715899169445038e-05, 5.9373676776885986e-05, 6.15883618593216e-05, 6.38030469417572e-05, 6.601773202419281e-05, 6.823241710662842e-05, 7.044710218906403e-05, 7.266178727149963e-05, 7.487647235393524e-05, 7.709115743637085e-05, 7.930584251880646e-05, 8.152052760124207e-05, 8.373521268367767e-05, 8.594989776611328e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 15.0, 31.0, 57.0, 139.0, 521.0, 28629.0, 1017289.0, 1477.0, 225.0, 88.0, 38.0, 19.0, 11.0, 4.0, 8.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.439453125, -2.3720703125, -2.3046875, -2.2373046875, -2.169921875, -2.1025390625, -2.03515625, -1.9677734375, -1.900390625, -1.8330078125, -1.765625, -1.6982421875, -1.630859375, -1.5634765625, -1.49609375, -1.4287109375, -1.361328125, -1.2939453125, -1.2265625, -1.1591796875, -1.091796875, -1.0244140625, -0.95703125, -0.8896484375, -0.822265625, -0.7548828125, -0.6875, -0.6201171875, -0.552734375, -0.4853515625, -0.41796875, -0.3505859375, -0.283203125, -0.2158203125, -0.1484375, -0.0810546875, -0.013671875, 0.0537109375, 0.12109375, 0.1884765625, 0.255859375, 0.3232421875, 0.390625, 0.4580078125, 0.525390625, 0.5927734375, 0.66015625, 0.7275390625, 0.794921875, 0.8623046875, 0.9296875, 0.9970703125, 1.064453125, 1.1318359375, 1.19921875, 1.2666015625, 1.333984375, 1.4013671875, 1.46875, 1.5361328125, 1.603515625, 1.6708984375, 1.73828125, 1.8056640625, 1.873046875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 6.0, 11.0, 15.0, 95.0, 349.0, 383.0, 115.0, 22.0, 10.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.46521759033203125, -0.4074859619140625, -0.34975433349609375, -0.292022705078125, -0.23429107666015625, -0.1765594482421875, -0.11882781982421875, -0.06109619140625, -0.00336456298828125, 0.0543670654296875, 0.11209869384765625, 0.169830322265625, 0.22756195068359375, 0.2852935791015625, 0.34302520751953125, 0.4007568359375, 0.45848846435546875, 0.5162200927734375, 0.5739517211914062, 0.631683349609375, 0.6894149780273438, 0.7471466064453125, 0.8048782348632812, 0.86260986328125, 0.9203414916992188, 0.9780731201171875, 1.0358047485351562, 1.093536376953125, 1.1512680053710938, 1.2089996337890625, 1.2667312622070312, 1.324462890625, 1.3821945190429688, 1.4399261474609375, 1.4976577758789062, 1.555389404296875, 1.6131210327148438, 1.6708526611328125, 1.7285842895507812, 1.78631591796875, 1.8440475463867188, 1.9017791748046875, 1.9595108032226562, 2.017242431640625, 2.0749740600585938, 2.1327056884765625, 2.1904373168945312, 2.2481689453125, 2.3059005737304688, 2.3636322021484375, 2.4213638305664062, 2.479095458984375, 2.5368270874023438, 2.5945587158203125, 2.6522903442382812, 2.71002197265625, 2.7677536010742188, 2.8254852294921875, 2.8832168579101562, 2.940948486328125, 2.9986801147460938, 3.0564117431640625, 3.1141433715820312, 3.171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 9.0, 16.0, 57.0, 196.0, 328.0, 246.0, 78.0, 31.0, 13.0, 11.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8080573081970215, -7.326276779174805, -6.844496250152588, -6.362715721130371, -5.880935192108154, -5.3991546630859375, -4.9173736572265625, -4.435593605041504, -3.953812837600708, -3.472032308578491, -2.9902517795562744, -2.5084710121154785, -2.0266904830932617, -1.544909954071045, -1.0631294250488281, -0.5813488960266113, -0.09956836700439453, 0.38221219182014465, 0.8639927506446838, 1.3457733392715454, 1.8275538682937622, 2.3093345165252686, 2.7911150455474854, 3.272895574569702, 3.754676103591919, 4.236456871032715, 4.718237400054932, 5.200017929077148, 5.681798458099365, 6.163578987121582, 6.645359516143799, 7.127140045166016, 7.608920097351074, 8.09070110321045, 8.572481155395508, 9.054262161254883, 9.536042213439941, 10.017823219299316, 10.499603271484375, 10.98138427734375, 11.463164329528809, 11.944945335388184, 12.426725387573242, 12.908506393432617, 13.390286445617676, 13.87206745147705, 14.35384750366211, 14.835628509521484, 15.31740951538086, 15.799190521240234, 16.28097152709961, 16.76275062561035, 17.244531631469727, 17.7263126373291, 18.208093643188477, 18.68987274169922, 19.171653747558594, 19.65343475341797, 20.135215759277344, 20.616994857788086, 21.09877586364746, 21.580556869506836, 22.06233787536621, 22.544116973876953, 23.025897979736328]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 3.0, 9.0, 6.0, 6.0, 16.0, 7.0, 25.0, 19.0, 32.0, 26.0, 21.0, 38.0, 27.0, 40.0, 46.0, 66.0, 43.0, 43.0, 65.0, 43.0, 44.0, 45.0, 39.0, 33.0, 37.0, 36.0, 26.0, 24.0, 17.0, 14.0, 22.0, 14.0, 15.0, 7.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.860803604125977, -7.61000394821167, -7.3592047691345215, -7.108405113220215, -6.857605934143066, -6.60680627822876, -6.356006622314453, -6.105207443237305, -5.854407787322998, -5.603608131408691, -5.352808952331543, -5.102009296417236, -4.85120964050293, -4.600410461425781, -4.349610805511475, -4.098811149597168, -3.8480119705200195, -3.597212553024292, -3.3464131355285645, -3.095613479614258, -2.8448140621185303, -2.5940146446228027, -2.343214988708496, -2.0924155712127686, -1.841616153717041, -1.5908167362213135, -1.3400171995162964, -1.0892176628112793, -0.8384182453155518, -0.5876188278198242, -0.33681929111480713, -0.08601975440979004, 0.1647796630859375, 0.4155791401863098, 0.6663786172866821, 0.9171780943870544, 1.1679775714874268, 1.4187769889831543, 1.6695765256881714, 1.9203760623931885, 2.171175479888916, 2.4219748973846436, 2.672774314880371, 2.9235739707946777, 3.1743733882904053, 3.425172805786133, 3.6759724617004395, 3.926771879196167, 4.1775712966918945, 4.428370952606201, 4.67917013168335, 4.929969787597656, 5.180768966674805, 5.431568622589111, 5.682368278503418, 5.933167457580566, 6.183967113494873, 6.43476676940918, 6.685565948486328, 6.936365604400635, 7.187165260314941, 7.43796443939209, 7.6887640953063965, 7.939563751220703, 8.190362930297852]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 11.0, 6.0, 9.0, 15.0, 16.0, 27.0, 32.0, 45.0, 78.0, 138.0, 221.0, 464.0, 1312.0, 5341.0, 78339.0, 4087748.0, 16682.0, 2332.0, 721.0, 310.0, 150.0, 87.0, 67.0, 33.0, 25.0, 15.0, 9.0, 8.0, 2.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 3.0], "bins": [-1.3779296875, -1.3460845947265625, -1.314239501953125, -1.2823944091796875, -1.25054931640625, -1.2187042236328125, -1.186859130859375, -1.1550140380859375, -1.1231689453125, -1.0913238525390625, -1.059478759765625, -1.0276336669921875, -0.99578857421875, -0.9639434814453125, -0.932098388671875, -0.9002532958984375, -0.868408203125, -0.8365631103515625, -0.804718017578125, -0.7728729248046875, -0.74102783203125, -0.7091827392578125, -0.677337646484375, -0.6454925537109375, -0.6136474609375, -0.5818023681640625, -0.549957275390625, -0.5181121826171875, -0.48626708984375, -0.4544219970703125, -0.422576904296875, -0.3907318115234375, -0.35888671875, -0.3270416259765625, -0.295196533203125, -0.2633514404296875, -0.23150634765625, -0.1996612548828125, -0.167816162109375, -0.1359710693359375, -0.1041259765625, -0.0722808837890625, -0.040435791015625, -0.0085906982421875, 0.02325439453125, 0.0550994873046875, 0.086944580078125, 0.1187896728515625, 0.150634765625, 0.1824798583984375, 0.214324951171875, 0.2461700439453125, 0.27801513671875, 0.3098602294921875, 0.341705322265625, 0.3735504150390625, 0.4053955078125, 0.4372406005859375, 0.469085693359375, 0.5009307861328125, 0.53277587890625, 0.5646209716796875, 0.596466064453125, 0.6283111572265625, 0.66015625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 9.0, 6.0, 10.0, 16.0, 8.0, 22.0, 26.0, 37.0, 28.0, 20.0, 31.0, 37.0, 50.0, 53.0, 60.0, 57.0, 65.0, 58.0, 54.0, 54.0, 43.0, 43.0, 35.0, 25.0, 29.0, 26.0, 17.0, 19.0, 12.0, 7.0, 7.0, 12.0, 3.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355712890625, -0.3415565490722656, -0.32740020751953125, -0.3132438659667969, -0.2990875244140625, -0.2849311828613281, -0.27077484130859375, -0.2566184997558594, -0.242462158203125, -0.22830581665039062, -0.21414947509765625, -0.19999313354492188, -0.1858367919921875, -0.17168045043945312, -0.15752410888671875, -0.14336776733398438, -0.12921142578125, -0.11505508422851562, -0.10089874267578125, -0.08674240112304688, -0.0725860595703125, -0.058429718017578125, -0.04427337646484375, -0.030117034912109375, -0.015960693359375, -0.001804351806640625, 0.01235198974609375, 0.026508331298828125, 0.0406646728515625, 0.054821014404296875, 0.06897735595703125, 0.08313369750976562, 0.0972900390625, 0.11144638061523438, 0.12560272216796875, 0.13975906372070312, 0.1539154052734375, 0.16807174682617188, 0.18222808837890625, 0.19638442993164062, 0.210540771484375, 0.22469711303710938, 0.23885345458984375, 0.2530097961425781, 0.2671661376953125, 0.2813224792480469, 0.29547882080078125, 0.3096351623535156, 0.32379150390625, 0.3379478454589844, 0.35210418701171875, 0.3662605285644531, 0.3804168701171875, 0.3945732116699219, 0.40872955322265625, 0.4228858947753906, 0.437042236328125, 0.4511985778808594, 0.46535491943359375, 0.4795112609863281, 0.4936676025390625, 0.5078239440917969, 0.5219802856445312, 0.5361366271972656, 0.55029296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 10.0, 21.0, 30.0, 55.0, 75.0, 127.0, 185.0, 314.0, 568.0, 1080.0, 2372.0, 7883.0, 79961.0, 4051127.0, 40383.0, 5805.0, 2113.0, 941.0, 505.0, 274.0, 165.0, 90.0, 69.0, 44.0, 15.0, 16.0, 11.0, 5.0, 6.0, 2.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6845703125, -0.6634368896484375, -0.642303466796875, -0.6211700439453125, -0.60003662109375, -0.5789031982421875, -0.557769775390625, -0.5366363525390625, -0.5155029296875, -0.4943695068359375, -0.473236083984375, -0.4521026611328125, -0.43096923828125, -0.4098358154296875, -0.388702392578125, -0.3675689697265625, -0.346435546875, -0.3253021240234375, -0.304168701171875, -0.2830352783203125, -0.26190185546875, -0.2407684326171875, -0.219635009765625, -0.1985015869140625, -0.1773681640625, -0.1562347412109375, -0.135101318359375, -0.1139678955078125, -0.09283447265625, -0.0717010498046875, -0.050567626953125, -0.0294342041015625, -0.00830078125, 0.0128326416015625, 0.033966064453125, 0.0550994873046875, 0.07623291015625, 0.0973663330078125, 0.118499755859375, 0.1396331787109375, 0.1607666015625, 0.1819000244140625, 0.203033447265625, 0.2241668701171875, 0.24530029296875, 0.2664337158203125, 0.287567138671875, 0.3087005615234375, 0.329833984375, 0.3509674072265625, 0.372100830078125, 0.3932342529296875, 0.41436767578125, 0.4355010986328125, 0.456634521484375, 0.4777679443359375, 0.4989013671875, 0.5200347900390625, 0.541168212890625, 0.5623016357421875, 0.58343505859375, 0.6045684814453125, 0.625701904296875, 0.6468353271484375, 0.66796875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 12.0, 34.0, 81.0, 284.0, 3422.0, 139.0, 47.0, 20.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2587890625, -0.25237464904785156, -0.24596023559570312, -0.2395458221435547, -0.23313140869140625, -0.2267169952392578, -0.22030258178710938, -0.21388816833496094, -0.2074737548828125, -0.20105934143066406, -0.19464492797851562, -0.1882305145263672, -0.18181610107421875, -0.1754016876220703, -0.16898727416992188, -0.16257286071777344, -0.156158447265625, -0.14974403381347656, -0.14332962036132812, -0.1369152069091797, -0.13050079345703125, -0.12408638000488281, -0.11767196655273438, -0.11125755310058594, -0.1048431396484375, -0.09842872619628906, -0.09201431274414062, -0.08559989929199219, -0.07918548583984375, -0.07277107238769531, -0.06635665893554688, -0.05994224548339844, -0.05352783203125, -0.04711341857910156, -0.040699005126953125, -0.03428459167480469, -0.02787017822265625, -0.021455764770507812, -0.015041351318359375, -0.008626937866210938, -0.0022125244140625, 0.0042018890380859375, 0.010616302490234375, 0.017030715942382812, 0.02344512939453125, 0.029859542846679688, 0.036273956298828125, 0.04268836975097656, 0.049102783203125, 0.05551719665527344, 0.061931610107421875, 0.06834602355957031, 0.07476043701171875, 0.08117485046386719, 0.08758926391601562, 0.09400367736816406, 0.1004180908203125, 0.10683250427246094, 0.11324691772460938, 0.11966133117675781, 0.12607574462890625, 0.1324901580810547, 0.13890457153320312, 0.14531898498535156, 0.1517333984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 15.0, 35.0, 163.0, 437.0, 289.0, 56.0, 11.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1942410469055176, -2.1520349979400635, -2.1098289489746094, -2.0676229000091553, -2.025416851043701, -1.9832109212875366, -1.9410048723220825, -1.8987988233566284, -1.8565927743911743, -1.8143867254257202, -1.7721806764602661, -1.7299747467041016, -1.6877686977386475, -1.6455626487731934, -1.6033565998077393, -1.5611505508422852, -1.518944501876831, -1.476738452911377, -1.4345324039459229, -1.3923263549804688, -1.3501204252243042, -1.30791437625885, -1.265708327293396, -1.223502278327942, -1.1812963485717773, -1.1390902996063232, -1.0968842506408691, -1.054678201675415, -1.0124722719192505, -0.9702662229537964, -0.9280601739883423, -0.8858541250228882, -0.8436480760574341, -0.80144202709198, -0.7592360377311707, -0.7170299887657166, -0.6748239398002625, -0.6326179504394531, -0.590411901473999, -0.5482058525085449, -0.5059998035430908, -0.4637937843799591, -0.421587735414505, -0.3793817162513733, -0.3371756672859192, -0.2949696481227875, -0.25276362895965576, -0.21055757999420166, -0.16835159063339233, -0.12614555656909943, -0.08393952995538712, -0.041733503341674805, 0.00047253072261810303, 0.04267856478691101, 0.08488458395004272, 0.12709063291549683, 0.16929665207862854, 0.21150268614292145, 0.25370872020721436, 0.29591473937034607, 0.3381207585334778, 0.3803268074989319, 0.4225328266620636, 0.4647388756275177, 0.5069448947906494]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 6.0, 8.0, 3.0, 12.0, 10.0, 14.0, 17.0, 28.0, 35.0, 33.0, 36.0, 33.0, 56.0, 58.0, 75.0, 66.0, 64.0, 55.0, 45.0, 45.0, 57.0, 58.0, 38.0, 30.0, 28.0, 26.0, 16.0, 10.0, 14.0, 10.0, 6.0, 1.0, 8.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33589857816696167, -0.32257235050201416, -0.30924612283706665, -0.29591989517211914, -0.28259366750717163, -0.2692674398422241, -0.2559412121772766, -0.2426149696111679, -0.2292887419462204, -0.2159625142812729, -0.20263628661632538, -0.18931004405021667, -0.17598381638526917, -0.16265758872032166, -0.14933136105537415, -0.13600513339042664, -0.12267890572547913, -0.10935267806053162, -0.0960264503955841, -0.082700215280056, -0.06937398761510849, -0.05604775995016098, -0.042721524834632874, -0.029395297169685364, -0.016069069504737854, -0.002742839977145195, 0.010583389550447464, 0.023909620940685272, 0.03723584860563278, 0.05056207627058029, 0.0638883113861084, 0.07721453905105591, 0.09054076671600342, 0.10386699438095093, 0.11719322204589844, 0.13051944971084595, 0.14384567737579346, 0.15717190504074097, 0.17049814760684967, 0.18382437527179718, 0.1971506029367447, 0.2104768306016922, 0.2238030582666397, 0.2371293008327484, 0.2504555284976959, 0.26378175616264343, 0.27710798382759094, 0.29043421149253845, 0.30376043915748596, 0.31708666682243347, 0.330412894487381, 0.3437391221523285, 0.357065349817276, 0.3703915774822235, 0.3837178349494934, 0.3970440626144409, 0.4103702902793884, 0.42369651794433594, 0.43702274560928345, 0.45034897327423096, 0.46367520093917847, 0.477001428604126, 0.4903276562690735, 0.503653883934021, 0.5169801115989685]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 10.0, 10.0, 19.0, 22.0, 38.0, 42.0, 73.0, 104.0, 139.0, 279.0, 519.0, 1145.0, 2766.0, 7994.0, 26172.0, 107056.0, 505767.0, 309272.0, 61509.0, 16368.0, 5345.0, 2026.0, 866.0, 414.0, 226.0, 146.0, 66.0, 59.0, 36.0, 17.0, 20.0, 9.0, 4.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6064453125, -0.5861053466796875, -0.565765380859375, -0.5454254150390625, -0.52508544921875, -0.5047454833984375, -0.484405517578125, -0.4640655517578125, -0.4437255859375, -0.4233856201171875, -0.403045654296875, -0.3827056884765625, -0.36236572265625, -0.3420257568359375, -0.321685791015625, -0.3013458251953125, -0.281005859375, -0.2606658935546875, -0.240325927734375, -0.2199859619140625, -0.19964599609375, -0.1793060302734375, -0.158966064453125, -0.1386260986328125, -0.1182861328125, -0.0979461669921875, -0.077606201171875, -0.0572662353515625, -0.03692626953125, -0.0165863037109375, 0.003753662109375, 0.0240936279296875, 0.04443359375, 0.0647735595703125, 0.085113525390625, 0.1054534912109375, 0.12579345703125, 0.1461334228515625, 0.166473388671875, 0.1868133544921875, 0.2071533203125, 0.2274932861328125, 0.247833251953125, 0.2681732177734375, 0.28851318359375, 0.3088531494140625, 0.329193115234375, 0.3495330810546875, 0.369873046875, 0.3902130126953125, 0.410552978515625, 0.4308929443359375, 0.45123291015625, 0.4715728759765625, 0.491912841796875, 0.5122528076171875, 0.5325927734375, 0.5529327392578125, 0.573272705078125, 0.5936126708984375, 0.61395263671875, 0.6342926025390625, 0.654632568359375, 0.6749725341796875, 0.6953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 10.0, 10.0, 10.0, 11.0, 15.0, 17.0, 23.0, 35.0, 28.0, 20.0, 47.0, 43.0, 49.0, 62.0, 62.0, 73.0, 66.0, 60.0, 53.0, 47.0, 47.0, 40.0, 32.0, 22.0, 35.0, 19.0, 16.0, 14.0, 9.0, 8.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.3638343811035156, -0.34851837158203125, -0.3332023620605469, -0.3178863525390625, -0.3025703430175781, -0.28725433349609375, -0.2719383239746094, -0.256622314453125, -0.24130630493164062, -0.22599029541015625, -0.21067428588867188, -0.1953582763671875, -0.18004226684570312, -0.16472625732421875, -0.14941024780273438, -0.13409423828125, -0.11877822875976562, -0.10346221923828125, -0.08814620971679688, -0.0728302001953125, -0.057514190673828125, -0.04219818115234375, -0.026882171630859375, -0.011566162109375, 0.003749847412109375, 0.01906585693359375, 0.034381866455078125, 0.0496978759765625, 0.06501388549804688, 0.08032989501953125, 0.09564590454101562, 0.1109619140625, 0.12627792358398438, 0.14159393310546875, 0.15690994262695312, 0.1722259521484375, 0.18754196166992188, 0.20285797119140625, 0.21817398071289062, 0.233489990234375, 0.24880599975585938, 0.26412200927734375, 0.2794380187988281, 0.2947540283203125, 0.3100700378417969, 0.32538604736328125, 0.3407020568847656, 0.35601806640625, 0.3713340759277344, 0.38665008544921875, 0.4019660949707031, 0.4172821044921875, 0.4325981140136719, 0.44791412353515625, 0.4632301330566406, 0.478546142578125, 0.4938621520996094, 0.5091781616210938, 0.5244941711425781, 0.5398101806640625, 0.5551261901855469, 0.5704421997070312, 0.5857582092285156, 0.60107421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 10.0, 11.0, 9.0, 7.0, 26.0, 27.0, 36.0, 30.0, 57.0, 85.0, 135.0, 208.0, 458.0, 993.0, 3176.0, 15080.0, 154572.0, 791858.0, 69076.0, 8858.0, 2215.0, 729.0, 337.0, 181.0, 97.0, 72.0, 47.0, 31.0, 29.0, 23.0, 15.0, 12.0, 11.0, 15.0, 7.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2177734375, -1.1823272705078125, -1.146881103515625, -1.1114349365234375, -1.07598876953125, -1.0405426025390625, -1.005096435546875, -0.9696502685546875, -0.9342041015625, -0.8987579345703125, -0.863311767578125, -0.8278656005859375, -0.79241943359375, -0.7569732666015625, -0.721527099609375, -0.6860809326171875, -0.650634765625, -0.6151885986328125, -0.579742431640625, -0.5442962646484375, -0.50885009765625, -0.4734039306640625, -0.437957763671875, -0.4025115966796875, -0.3670654296875, -0.3316192626953125, -0.296173095703125, -0.2607269287109375, -0.22528076171875, -0.1898345947265625, -0.154388427734375, -0.1189422607421875, -0.08349609375, -0.0480499267578125, -0.012603759765625, 0.0228424072265625, 0.05828857421875, 0.0937347412109375, 0.129180908203125, 0.1646270751953125, 0.2000732421875, 0.2355194091796875, 0.270965576171875, 0.3064117431640625, 0.34185791015625, 0.3773040771484375, 0.412750244140625, 0.4481964111328125, 0.483642578125, 0.5190887451171875, 0.554534912109375, 0.5899810791015625, 0.62542724609375, 0.6608734130859375, 0.696319580078125, 0.7317657470703125, 0.7672119140625, 0.8026580810546875, 0.838104248046875, 0.8735504150390625, 0.90899658203125, 0.9444427490234375, 0.979888916015625, 1.0153350830078125, 1.05078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 10.0, 15.0, 26.0, 28.0, 46.0, 45.0, 58.0, 46.0, 65.0, 66.0, 57.0, 73.0, 57.0, 61.0, 69.0, 52.0, 40.0, 30.0, 34.0, 23.0, 14.0, 12.0, 12.0, 12.0, 6.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.169921875, -3.0893707275390625, -3.008819580078125, -2.9282684326171875, -2.84771728515625, -2.7671661376953125, -2.686614990234375, -2.6060638427734375, -2.5255126953125, -2.4449615478515625, -2.364410400390625, -2.2838592529296875, -2.20330810546875, -2.1227569580078125, -2.042205810546875, -1.9616546630859375, -1.881103515625, -1.8005523681640625, -1.720001220703125, -1.6394500732421875, -1.55889892578125, -1.4783477783203125, -1.397796630859375, -1.3172454833984375, -1.2366943359375, -1.1561431884765625, -1.075592041015625, -0.9950408935546875, -0.91448974609375, -0.8339385986328125, -0.753387451171875, -0.6728363037109375, -0.59228515625, -0.5117340087890625, -0.431182861328125, -0.3506317138671875, -0.27008056640625, -0.1895294189453125, -0.108978271484375, -0.0284271240234375, 0.0521240234375, 0.1326751708984375, 0.213226318359375, 0.2937774658203125, 0.37432861328125, 0.4548797607421875, 0.535430908203125, 0.6159820556640625, 0.696533203125, 0.7770843505859375, 0.857635498046875, 0.9381866455078125, 1.01873779296875, 1.0992889404296875, 1.179840087890625, 1.2603912353515625, 1.3409423828125, 1.4214935302734375, 1.502044677734375, 1.5825958251953125, 1.66314697265625, 1.7436981201171875, 1.824249267578125, 1.9048004150390625, 1.9853515625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 9.0, 14.0, 30.0, 106.0, 1023.0, 1033082.0, 13816.0, 330.0, 71.0, 32.0, 10.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.26580810546875, -2.1663818359375, -2.06695556640625, -1.967529296875, -1.86810302734375, -1.7686767578125, -1.66925048828125, -1.56982421875, -1.47039794921875, -1.3709716796875, -1.27154541015625, -1.172119140625, -1.07269287109375, -0.9732666015625, -0.87384033203125, -0.7744140625, -0.67498779296875, -0.5755615234375, -0.47613525390625, -0.376708984375, -0.27728271484375, -0.1778564453125, -0.07843017578125, 0.02099609375, 0.12042236328125, 0.2198486328125, 0.31927490234375, 0.418701171875, 0.51812744140625, 0.6175537109375, 0.71697998046875, 0.81640625, 0.91583251953125, 1.0152587890625, 1.11468505859375, 1.214111328125, 1.31353759765625, 1.4129638671875, 1.51239013671875, 1.61181640625, 1.71124267578125, 1.8106689453125, 1.91009521484375, 2.009521484375, 2.10894775390625, 2.2083740234375, 2.30780029296875, 2.4072265625, 2.50665283203125, 2.6060791015625, 2.70550537109375, 2.804931640625, 2.90435791015625, 3.0037841796875, 3.10321044921875, 3.20263671875, 3.30206298828125, 3.4014892578125, 3.50091552734375, 3.600341796875, 3.69976806640625, 3.7991943359375, 3.89862060546875, 3.998046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 12.0, 12.0, 15.0, 18.0, 26.0, 24.0, 30.0, 47.0, 52.0, 93.0, 117.0, 112.0, 110.0, 77.0, 59.0, 50.0, 41.0, 30.0, 20.0, 18.0, 6.0, 9.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.955862045288086e-05, -6.752181798219681e-05, -6.548501551151276e-05, -6.34482130408287e-05, -6.141141057014465e-05, -5.93746080994606e-05, -5.733780562877655e-05, -5.53010031580925e-05, -5.326420068740845e-05, -5.1227398216724396e-05, -4.9190595746040344e-05, -4.715379327535629e-05, -4.511699080467224e-05, -4.308018833398819e-05, -4.104338586330414e-05, -3.900658339262009e-05, -3.6969780921936035e-05, -3.4932978451251984e-05, -3.289617598056793e-05, -3.085937350988388e-05, -2.882257103919983e-05, -2.6785768568515778e-05, -2.4748966097831726e-05, -2.2712163627147675e-05, -2.0675361156463623e-05, -1.863855868577957e-05, -1.660175621509552e-05, -1.4564953744411469e-05, -1.2528151273727417e-05, -1.0491348803043365e-05, -8.454546332359314e-06, -6.4177438616752625e-06, -4.380941390991211e-06, -2.3441389203071594e-06, -3.073364496231079e-07, 1.7294660210609436e-06, 3.766268491744995e-06, 5.803070962429047e-06, 7.839873433113098e-06, 9.87667590379715e-06, 1.1913478374481201e-05, 1.3950280845165253e-05, 1.5987083315849304e-05, 1.8023885786533356e-05, 2.0060688257217407e-05, 2.209749072790146e-05, 2.413429319858551e-05, 2.6171095669269562e-05, 2.8207898139953613e-05, 3.0244700610637665e-05, 3.2281503081321716e-05, 3.431830555200577e-05, 3.635510802268982e-05, 3.839191049337387e-05, 4.042871296405792e-05, 4.2465515434741974e-05, 4.4502317905426025e-05, 4.653912037611008e-05, 4.857592284679413e-05, 5.061272531747818e-05, 5.264952778816223e-05, 5.468633025884628e-05, 5.6723132729530334e-05, 5.8759935200214386e-05, 6.079673767089844e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 1.0, 4.0, 4.0, 10.0, 9.0, 18.0, 29.0, 64.0, 114.0, 291.0, 945.0, 4909.0, 269784.0, 762898.0, 7606.0, 1173.0, 376.0, 156.0, 81.0, 32.0, 19.0, 12.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5400390625, -0.515594482421875, -0.49114990234375, -0.466705322265625, -0.4422607421875, -0.417816162109375, -0.39337158203125, -0.368927001953125, -0.344482421875, -0.320037841796875, -0.29559326171875, -0.271148681640625, -0.2467041015625, -0.222259521484375, -0.19781494140625, -0.173370361328125, -0.14892578125, -0.124481201171875, -0.10003662109375, -0.075592041015625, -0.0511474609375, -0.026702880859375, -0.00225830078125, 0.022186279296875, 0.046630859375, 0.071075439453125, 0.09552001953125, 0.119964599609375, 0.1444091796875, 0.168853759765625, 0.19329833984375, 0.217742919921875, 0.2421875, 0.266632080078125, 0.29107666015625, 0.315521240234375, 0.3399658203125, 0.364410400390625, 0.38885498046875, 0.413299560546875, 0.437744140625, 0.462188720703125, 0.48663330078125, 0.511077880859375, 0.5355224609375, 0.559967041015625, 0.58441162109375, 0.608856201171875, 0.63330078125, 0.657745361328125, 0.68218994140625, 0.706634521484375, 0.7310791015625, 0.755523681640625, 0.77996826171875, 0.804412841796875, 0.828857421875, 0.853302001953125, 0.87774658203125, 0.902191162109375, 0.9266357421875, 0.951080322265625, 0.97552490234375, 0.999969482421875, 1.0244140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 13.0, 25.0, 72.0, 147.0, 226.0, 248.0, 140.0, 47.0, 29.0, 15.0, 6.0, 3.0, 2.0, 2.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.60791015625, -0.5740737915039062, -0.5402374267578125, -0.5064010620117188, -0.472564697265625, -0.43872833251953125, -0.4048919677734375, -0.37105560302734375, -0.33721923828125, -0.30338287353515625, -0.2695465087890625, -0.23571014404296875, -0.201873779296875, -0.16803741455078125, -0.1342010498046875, -0.10036468505859375, -0.0665283203125, -0.03269195556640625, 0.0011444091796875, 0.03498077392578125, 0.068817138671875, 0.10265350341796875, 0.1364898681640625, 0.17032623291015625, 0.20416259765625, 0.23799896240234375, 0.2718353271484375, 0.30567169189453125, 0.339508056640625, 0.37334442138671875, 0.4071807861328125, 0.44101715087890625, 0.474853515625, 0.5086898803710938, 0.5425262451171875, 0.5763626098632812, 0.610198974609375, 0.6440353393554688, 0.6778717041015625, 0.7117080688476562, 0.74554443359375, 0.7793807983398438, 0.8132171630859375, 0.8470535278320312, 0.880889892578125, 0.9147262573242188, 0.9485626220703125, 0.9823989868164062, 1.0162353515625, 1.0500717163085938, 1.0839080810546875, 1.1177444458007812, 1.151580810546875, 1.1854171752929688, 1.2192535400390625, 1.2530899047851562, 1.28692626953125, 1.3207626342773438, 1.3545989990234375, 1.3884353637695312, 1.422271728515625, 1.4561080932617188, 1.4899444580078125, 1.5237808227539062, 1.5576171875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 29.0, 77.0, 347.0, 405.0, 111.0, 20.0, 13.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.353656768798828, -9.783933639526367, -9.214211463928223, -8.644489288330078, -8.074766159057617, -7.5050435066223145, -6.935320854187012, -6.365598201751709, -5.795875549316406, -5.2261528968811035, -4.656430244445801, -4.086707592010498, -3.5169849395751953, -2.9472622871398926, -2.37753963470459, -1.807816982269287, -1.2380943298339844, -0.6683716773986816, -0.0986490249633789, 0.47107362747192383, 1.0407962799072266, 1.6105189323425293, 2.180241584777832, 2.7499642372131348, 3.3196868896484375, 3.8894095420837402, 4.459132194519043, 5.028854846954346, 5.598577499389648, 6.168300151824951, 6.738022804260254, 7.307745456695557, 7.877468109130859, 8.44719123840332, 9.016913414001465, 9.58663558959961, 10.15635871887207, 10.726081848144531, 11.295804023742676, 11.86552619934082, 12.435249328613281, 13.004972457885742, 13.574694633483887, 14.144416809082031, 14.714139938354492, 15.283863067626953, 15.853585243225098, 16.423307418823242, 16.993030548095703, 17.562753677368164, 18.132476806640625, 18.702198028564453, 19.271921157836914, 19.841644287109375, 20.411365509033203, 20.981088638305664, 21.550811767578125, 22.120534896850586, 22.690258026123047, 23.259979248046875, 23.829702377319336, 24.399425506591797, 24.969146728515625, 25.538869857788086, 26.108592987060547]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 7.0, 2.0, 6.0, 8.0, 11.0, 8.0, 13.0, 11.0, 15.0, 17.0, 21.0, 25.0, 25.0, 30.0, 25.0, 34.0, 26.0, 38.0, 29.0, 42.0, 46.0, 49.0, 44.0, 53.0, 48.0, 37.0, 35.0, 32.0, 30.0, 23.0, 16.0, 21.0, 21.0, 25.0, 18.0, 13.0, 10.0, 19.0, 13.0, 7.0, 6.0, 6.0, 4.0, 7.0, 9.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-8.002874374389648, -7.768739223480225, -7.534604072570801, -7.300469398498535, -7.066334247589111, -6.8321990966796875, -6.598063945770264, -6.36392879486084, -6.129794120788574, -5.89565896987915, -5.661523818969727, -5.427389144897461, -5.193253993988037, -4.959118843078613, -4.7249836921691895, -4.490848541259766, -4.2567138671875, -4.022578716278076, -3.7884438037872314, -3.5543086528778076, -3.320173740386963, -3.086038589477539, -2.8519034385681152, -2.6177685260772705, -2.3836331367492676, -2.1494979858398438, -1.915363073348999, -1.6812279224395752, -1.4470930099487305, -1.2129578590393066, -0.9788228273391724, -0.7446877956390381, -0.5105528831481934, -0.2764178514480591, -0.04228278994560242, 0.19185227155685425, 0.4259873032569885, 0.6601223945617676, 0.8942574262619019, 1.1283924579620361, 1.3625274896621704, 1.5966625213623047, 1.830797553062439, 2.0649325847625732, 2.299067735671997, 2.533202648162842, 2.7673377990722656, 3.0014729499816895, 3.235607862472534, 3.469743013381958, 3.7038779258728027, 3.9380130767822266, 4.17214822769165, 4.406283378601074, 4.64041805267334, 4.874553203582764, 5.1086883544921875, 5.342823505401611, 5.576958656311035, 5.811093330383301, 6.045228481292725, 6.279363632202148, 6.513498783111572, 6.747633934020996, 6.981768608093262]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 14.0, 13.0, 34.0, 42.0, 82.0, 221.0, 580.0, 2117.0, 29103.0, 4139465.0, 20231.0, 1658.0, 406.0, 135.0, 65.0, 44.0, 17.0, 11.0, 9.0, 8.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.4652862548828125, -1.422760009765625, -1.3802337646484375, -1.33770751953125, -1.2951812744140625, -1.252655029296875, -1.2101287841796875, -1.1676025390625, -1.1250762939453125, -1.082550048828125, -1.0400238037109375, -0.99749755859375, -0.9549713134765625, -0.912445068359375, -0.8699188232421875, -0.827392578125, -0.7848663330078125, -0.742340087890625, -0.6998138427734375, -0.65728759765625, -0.6147613525390625, -0.572235107421875, -0.5297088623046875, -0.4871826171875, -0.4446563720703125, -0.402130126953125, -0.3596038818359375, -0.31707763671875, -0.2745513916015625, -0.232025146484375, -0.1894989013671875, -0.14697265625, -0.1044464111328125, -0.061920166015625, -0.0193939208984375, 0.02313232421875, 0.0656585693359375, 0.108184814453125, 0.1507110595703125, 0.1932373046875, 0.2357635498046875, 0.278289794921875, 0.3208160400390625, 0.36334228515625, 0.4058685302734375, 0.448394775390625, 0.4909210205078125, 0.533447265625, 0.5759735107421875, 0.618499755859375, 0.6610260009765625, 0.70355224609375, 0.7460784912109375, 0.788604736328125, 0.8311309814453125, 0.8736572265625, 0.9161834716796875, 0.958709716796875, 1.0012359619140625, 1.04376220703125, 1.0862884521484375, 1.128814697265625, 1.1713409423828125, 1.2138671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 13.0, 12.0, 10.0, 25.0, 27.0, 30.0, 49.0, 36.0, 48.0, 57.0, 55.0, 67.0, 90.0, 69.0, 80.0, 65.0, 42.0, 49.0, 44.0, 24.0, 34.0, 17.0, 13.0, 11.0, 3.0, 4.0, 6.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54296875, -0.5261688232421875, -0.509368896484375, -0.4925689697265625, -0.47576904296875, -0.4589691162109375, -0.442169189453125, -0.4253692626953125, -0.4085693359375, -0.3917694091796875, -0.374969482421875, -0.3581695556640625, -0.34136962890625, -0.3245697021484375, -0.307769775390625, -0.2909698486328125, -0.274169921875, -0.2573699951171875, -0.240570068359375, -0.2237701416015625, -0.20697021484375, -0.1901702880859375, -0.173370361328125, -0.1565704345703125, -0.1397705078125, -0.1229705810546875, -0.106170654296875, -0.0893707275390625, -0.07257080078125, -0.0557708740234375, -0.038970947265625, -0.0221710205078125, -0.00537109375, 0.0114288330078125, 0.028228759765625, 0.0450286865234375, 0.06182861328125, 0.0786285400390625, 0.095428466796875, 0.1122283935546875, 0.1290283203125, 0.1458282470703125, 0.162628173828125, 0.1794281005859375, 0.19622802734375, 0.2130279541015625, 0.229827880859375, 0.2466278076171875, 0.263427734375, 0.2802276611328125, 0.297027587890625, 0.3138275146484375, 0.33062744140625, 0.3474273681640625, 0.364227294921875, 0.3810272216796875, 0.3978271484375, 0.4146270751953125, 0.431427001953125, 0.4482269287109375, 0.46502685546875, 0.4818267822265625, 0.498626708984375, 0.5154266357421875, 0.5322265625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 11.0, 18.0, 17.0, 27.0, 20.0, 35.0, 37.0, 35.0, 39.0, 40.0, 42.0, 93.0, 741.0, 4181473.0, 11009.0, 227.0, 67.0, 48.0, 41.0, 51.0, 37.0, 36.0, 22.0, 24.0, 25.0, 17.0, 16.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.56640625, -3.43310546875, -3.2998046875, -3.16650390625, -3.033203125, -2.89990234375, -2.7666015625, -2.63330078125, -2.5, -2.36669921875, -2.2333984375, -2.10009765625, -1.966796875, -1.83349609375, -1.7001953125, -1.56689453125, -1.43359375, -1.30029296875, -1.1669921875, -1.03369140625, -0.900390625, -0.76708984375, -0.6337890625, -0.50048828125, -0.3671875, -0.23388671875, -0.1005859375, 0.03271484375, 0.166015625, 0.29931640625, 0.4326171875, 0.56591796875, 0.69921875, 0.83251953125, 0.9658203125, 1.09912109375, 1.232421875, 1.36572265625, 1.4990234375, 1.63232421875, 1.765625, 1.89892578125, 2.0322265625, 2.16552734375, 2.298828125, 2.43212890625, 2.5654296875, 2.69873046875, 2.83203125, 2.96533203125, 3.0986328125, 3.23193359375, 3.365234375, 3.49853515625, 3.6318359375, 3.76513671875, 3.8984375, 4.03173828125, 4.1650390625, 4.29833984375, 4.431640625, 4.56494140625, 4.6982421875, 4.83154296875, 4.96484375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 42.0, 3918.0, 112.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35205078125, -0.29000091552734375, -0.2279510498046875, -0.16590118408203125, -0.103851318359375, -0.04180145263671875, 0.0202484130859375, 0.08229827880859375, 0.14434814453125, 0.20639801025390625, 0.2684478759765625, 0.33049774169921875, 0.392547607421875, 0.45459747314453125, 0.5166473388671875, 0.5786972045898438, 0.6407470703125, 0.7027969360351562, 0.7648468017578125, 0.8268966674804688, 0.888946533203125, 0.9509963989257812, 1.0130462646484375, 1.0750961303710938, 1.13714599609375, 1.1991958618164062, 1.2612457275390625, 1.3232955932617188, 1.385345458984375, 1.4473953247070312, 1.5094451904296875, 1.5714950561523438, 1.633544921875, 1.6955947875976562, 1.7576446533203125, 1.8196945190429688, 1.881744384765625, 1.9437942504882812, 2.0058441162109375, 2.0678939819335938, 2.12994384765625, 2.1919937133789062, 2.2540435791015625, 2.3160934448242188, 2.378143310546875, 2.4401931762695312, 2.5022430419921875, 2.5642929077148438, 2.6263427734375, 2.6883926391601562, 2.7504425048828125, 2.8124923706054688, 2.874542236328125, 2.9365921020507812, 2.9986419677734375, 3.0606918334960938, 3.12274169921875, 3.1847915649414062, 3.2468414306640625, 3.3088912963867188, 3.370941162109375, 3.4329910278320312, 3.4950408935546875, 3.5570907592773438, 3.619140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 4.0, 4.0, 26.0, 150.0, 689.0, 116.0, 15.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1708192825317383, -1.8895900249481201, -1.608360767364502, -1.3271315097808838, -1.0459022521972656, -0.7646729946136475, -0.4834437370300293, -0.20221447944641113, 0.07901477813720703, 0.3602440357208252, 0.6414732933044434, 0.9227025508880615, 1.2039318084716797, 1.4851610660552979, 1.766390323638916, 2.047619581222534, 2.3288488388061523, 2.6100780963897705, 2.8913073539733887, 3.172536611557007, 3.453765869140625, 3.734995126724243, 4.016224384307861, 4.297453880310059, 4.578682899475098, 4.859911918640137, 5.141141414642334, 5.422370910644531, 5.70359992980957, 5.984828948974609, 6.266058444976807, 6.547287940979004, 6.828516960144043, 7.109745979309082, 7.390975475311279, 7.672204971313477, 7.953433990478516, 8.234663009643555, 8.515892028808594, 8.79712200164795, 9.078351020812988, 9.359580039978027, 9.640810012817383, 9.922039031982422, 10.203268051147461, 10.4844970703125, 10.765726089477539, 11.046956062316895, 11.328185081481934, 11.609414100646973, 11.890644073486328, 12.171873092651367, 12.453102111816406, 12.734331130981445, 13.015560150146484, 13.29679012298584, 13.578019142150879, 13.859248161315918, 14.140478134155273, 14.421707153320312, 14.702936172485352, 14.98416519165039, 15.26539421081543, 15.546624183654785, 15.827853202819824]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 16.0, 20.0, 42.0, 62.0, 103.0, 142.0, 158.0, 165.0, 102.0, 86.0, 36.0, 29.0, 19.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3709845542907715, -7.169337749481201, -6.967691421508789, -6.766044616699219, -6.564397811889648, -6.362751007080078, -6.161104202270508, -5.959457874298096, -5.757811069488525, -5.556164264678955, -5.354517936706543, -5.152871131896973, -4.951224327087402, -4.749577522277832, -4.547930717468262, -4.34628438949585, -4.144637584686279, -3.942990779876709, -3.7413442134857178, -3.5396976470947266, -3.3380508422851562, -3.136404037475586, -2.9347574710845947, -2.7331109046936035, -2.531464099884033, -2.329817295074463, -2.1281707286834717, -1.926524043083191, -1.7248773574829102, -1.5232306718826294, -1.3215839862823486, -1.1199373006820679, -0.9182901382446289, -0.7166434526443481, -0.5149967670440674, -0.3133500814437866, -0.11170339584350586, 0.0899432897567749, 0.29158997535705566, 0.4932366609573364, 0.6948833465576172, 0.896530032157898, 1.0981767177581787, 1.2998234033584595, 1.5014700889587402, 1.703116774559021, 1.9047634601593018, 2.106410026550293, 2.3080568313598633, 2.5097036361694336, 2.711350202560425, 2.912996768951416, 3.1146435737609863, 3.3162903785705566, 3.517936944961548, 3.719583511352539, 3.9212303161621094, 4.12287712097168, 4.32452392578125, 4.526170253753662, 4.727817058563232, 4.929463863372803, 5.131110191345215, 5.332756996154785, 5.5344038009643555]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 11.0, 8.0, 13.0, 32.0, 36.0, 70.0, 141.0, 249.0, 597.0, 1755.0, 6593.0, 42995.0, 639703.0, 325389.0, 24160.0, 4491.0, 1346.0, 493.0, 212.0, 109.0, 55.0, 37.0, 20.0, 11.0, 13.0, 7.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95703125, -0.91693115234375, -0.8768310546875, -0.83673095703125, -0.796630859375, -0.75653076171875, -0.7164306640625, -0.67633056640625, -0.63623046875, -0.59613037109375, -0.5560302734375, -0.51593017578125, -0.475830078125, -0.43572998046875, -0.3956298828125, -0.35552978515625, -0.3154296875, -0.27532958984375, -0.2352294921875, -0.19512939453125, -0.155029296875, -0.11492919921875, -0.0748291015625, -0.03472900390625, 0.00537109375, 0.04547119140625, 0.0855712890625, 0.12567138671875, 0.165771484375, 0.20587158203125, 0.2459716796875, 0.28607177734375, 0.326171875, 0.36627197265625, 0.4063720703125, 0.44647216796875, 0.486572265625, 0.52667236328125, 0.5667724609375, 0.60687255859375, 0.64697265625, 0.68707275390625, 0.7271728515625, 0.76727294921875, 0.807373046875, 0.84747314453125, 0.8875732421875, 0.92767333984375, 0.9677734375, 1.00787353515625, 1.0479736328125, 1.08807373046875, 1.128173828125, 1.16827392578125, 1.2083740234375, 1.24847412109375, 1.28857421875, 1.32867431640625, 1.3687744140625, 1.40887451171875, 1.448974609375, 1.48907470703125, 1.5291748046875, 1.56927490234375, 1.609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 6.0, 7.0, 10.0, 20.0, 17.0, 17.0, 25.0, 43.0, 43.0, 45.0, 59.0, 47.0, 53.0, 61.0, 72.0, 70.0, 65.0, 53.0, 56.0, 53.0, 29.0, 32.0, 22.0, 14.0, 16.0, 19.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5878105163574219, -0.5711288452148438, -0.5544471740722656, -0.5377655029296875, -0.5210838317871094, -0.5044021606445312, -0.4877204895019531, -0.471038818359375, -0.4543571472167969, -0.43767547607421875, -0.4209938049316406, -0.4043121337890625, -0.3876304626464844, -0.37094879150390625, -0.3542671203613281, -0.33758544921875, -0.3209037780761719, -0.30422210693359375, -0.2875404357910156, -0.2708587646484375, -0.2541770935058594, -0.23749542236328125, -0.22081375122070312, -0.204132080078125, -0.18745040893554688, -0.17076873779296875, -0.15408706665039062, -0.1374053955078125, -0.12072372436523438, -0.10404205322265625, -0.08736038208007812, -0.0706787109375, -0.053997039794921875, -0.03731536865234375, -0.020633697509765625, -0.0039520263671875, 0.012729644775390625, 0.02941131591796875, 0.046092987060546875, 0.062774658203125, 0.07945632934570312, 0.09613800048828125, 0.11281967163085938, 0.1295013427734375, 0.14618301391601562, 0.16286468505859375, 0.17954635620117188, 0.19622802734375, 0.21290969848632812, 0.22959136962890625, 0.24627304077148438, 0.2629547119140625, 0.2796363830566406, 0.29631805419921875, 0.3129997253417969, 0.329681396484375, 0.3463630676269531, 0.36304473876953125, 0.3797264099121094, 0.3964080810546875, 0.4130897521972656, 0.42977142333984375, 0.4464530944824219, 0.463134765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 6.0, 14.0, 33.0, 61.0, 157.0, 565.0, 4193.0, 1016323.0, 25627.0, 1139.0, 258.0, 90.0, 30.0, 21.0, 10.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6328125, -3.49676513671875, -3.3607177734375, -3.22467041015625, -3.088623046875, -2.95257568359375, -2.8165283203125, -2.68048095703125, -2.54443359375, -2.40838623046875, -2.2723388671875, -2.13629150390625, -2.000244140625, -1.86419677734375, -1.7281494140625, -1.59210205078125, -1.4560546875, -1.32000732421875, -1.1839599609375, -1.04791259765625, -0.911865234375, -0.77581787109375, -0.6397705078125, -0.50372314453125, -0.36767578125, -0.23162841796875, -0.0955810546875, 0.04046630859375, 0.176513671875, 0.31256103515625, 0.4486083984375, 0.58465576171875, 0.720703125, 0.85675048828125, 0.9927978515625, 1.12884521484375, 1.264892578125, 1.40093994140625, 1.5369873046875, 1.67303466796875, 1.80908203125, 1.94512939453125, 2.0811767578125, 2.21722412109375, 2.353271484375, 2.48931884765625, 2.6253662109375, 2.76141357421875, 2.8974609375, 3.03350830078125, 3.1695556640625, 3.30560302734375, 3.441650390625, 3.57769775390625, 3.7137451171875, 3.84979248046875, 3.98583984375, 4.12188720703125, 4.2579345703125, 4.39398193359375, 4.530029296875, 4.66607666015625, 4.8021240234375, 4.93817138671875, 5.07421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 11.0, 24.0, 39.0, 63.0, 92.0, 130.0, 168.0, 151.0, 131.0, 81.0, 52.0, 32.0, 21.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.58154296875, -3.4248046875, -3.26806640625, -3.111328125, -2.95458984375, -2.7978515625, -2.64111328125, -2.484375, -2.32763671875, -2.1708984375, -2.01416015625, -1.857421875, -1.70068359375, -1.5439453125, -1.38720703125, -1.23046875, -1.07373046875, -0.9169921875, -0.76025390625, -0.603515625, -0.44677734375, -0.2900390625, -0.13330078125, 0.0234375, 0.18017578125, 0.3369140625, 0.49365234375, 0.650390625, 0.80712890625, 0.9638671875, 1.12060546875, 1.27734375, 1.43408203125, 1.5908203125, 1.74755859375, 1.904296875, 2.06103515625, 2.2177734375, 2.37451171875, 2.53125, 2.68798828125, 2.8447265625, 3.00146484375, 3.158203125, 3.31494140625, 3.4716796875, 3.62841796875, 3.78515625, 3.94189453125, 4.0986328125, 4.25537109375, 4.412109375, 4.56884765625, 4.7255859375, 4.88232421875, 5.0390625, 5.19580078125, 5.3525390625, 5.50927734375, 5.666015625, 5.82275390625, 5.9794921875, 6.13623046875, 6.29296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 13.0, 37.0, 83.0, 290.0, 1235.0, 54041.0, 987664.0, 4387.0, 522.0, 165.0, 61.0, 14.0, 12.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5322265625, -0.5045623779296875, -0.476898193359375, -0.4492340087890625, -0.42156982421875, -0.3939056396484375, -0.366241455078125, -0.3385772705078125, -0.3109130859375, -0.2832489013671875, -0.255584716796875, -0.2279205322265625, -0.20025634765625, -0.1725921630859375, -0.144927978515625, -0.1172637939453125, -0.089599609375, -0.0619354248046875, -0.034271240234375, -0.0066070556640625, 0.02105712890625, 0.0487213134765625, 0.076385498046875, 0.1040496826171875, 0.1317138671875, 0.1593780517578125, 0.187042236328125, 0.2147064208984375, 0.24237060546875, 0.2700347900390625, 0.297698974609375, 0.3253631591796875, 0.35302734375, 0.3806915283203125, 0.408355712890625, 0.4360198974609375, 0.46368408203125, 0.4913482666015625, 0.519012451171875, 0.5466766357421875, 0.5743408203125, 0.6020050048828125, 0.629669189453125, 0.6573333740234375, 0.68499755859375, 0.7126617431640625, 0.740325927734375, 0.7679901123046875, 0.795654296875, 0.8233184814453125, 0.850982666015625, 0.8786468505859375, 0.90631103515625, 0.9339752197265625, 0.961639404296875, 0.9893035888671875, 1.0169677734375, 1.0446319580078125, 1.072296142578125, 1.0999603271484375, 1.12762451171875, 1.1552886962890625, 1.182952880859375, 1.2106170654296875, 1.23828125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 2.0, 4.0, 11.0, 8.0, 6.0, 8.0, 11.0, 12.0, 16.0, 23.0, 24.0, 29.0, 49.0, 64.0, 68.0, 85.0, 93.0, 102.0, 81.0, 59.0, 43.0, 37.0, 30.0, 38.0, 22.0, 18.0, 12.0, 7.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.118680953979492e-05, -3.959052264690399e-05, -3.799423575401306e-05, -3.639794886112213e-05, -3.48016619682312e-05, -3.320537507534027e-05, -3.160908818244934e-05, -3.001280128955841e-05, -2.841651439666748e-05, -2.682022750377655e-05, -2.522394061088562e-05, -2.362765371799469e-05, -2.203136682510376e-05, -2.043507993221283e-05, -1.88387930393219e-05, -1.724250614643097e-05, -1.564621925354004e-05, -1.4049932360649109e-05, -1.2453645467758179e-05, -1.0857358574867249e-05, -9.261071681976318e-06, -7.664784789085388e-06, -6.068497896194458e-06, -4.472211003303528e-06, -2.8759241104125977e-06, -1.2796372175216675e-06, 3.166496753692627e-07, 1.912936568260193e-06, 3.509223461151123e-06, 5.105510354042053e-06, 6.701797246932983e-06, 8.298084139823914e-06, 9.894371032714844e-06, 1.1490657925605774e-05, 1.3086944818496704e-05, 1.4683231711387634e-05, 1.6279518604278564e-05, 1.7875805497169495e-05, 1.9472092390060425e-05, 2.1068379282951355e-05, 2.2664666175842285e-05, 2.4260953068733215e-05, 2.5857239961624146e-05, 2.7453526854515076e-05, 2.9049813747406006e-05, 3.0646100640296936e-05, 3.2242387533187866e-05, 3.3838674426078796e-05, 3.5434961318969727e-05, 3.703124821186066e-05, 3.862753510475159e-05, 4.022382199764252e-05, 4.182010889053345e-05, 4.341639578342438e-05, 4.501268267631531e-05, 4.660896956920624e-05, 4.820525646209717e-05, 4.98015433549881e-05, 5.139783024787903e-05, 5.299411714076996e-05, 5.459040403366089e-05, 5.618669092655182e-05, 5.778297781944275e-05, 5.937926471233368e-05, 6.097555160522461e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 9.0, 19.0, 71.0, 360.0, 41090.0, 1006260.0, 613.0, 90.0, 22.0, 13.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.521484375, -2.458648681640625, -2.39581298828125, -2.332977294921875, -2.2701416015625, -2.207305908203125, -2.14447021484375, -2.081634521484375, -2.018798828125, -1.955963134765625, -1.89312744140625, -1.830291748046875, -1.7674560546875, -1.704620361328125, -1.64178466796875, -1.578948974609375, -1.51611328125, -1.453277587890625, -1.39044189453125, -1.327606201171875, -1.2647705078125, -1.201934814453125, -1.13909912109375, -1.076263427734375, -1.013427734375, -0.950592041015625, -0.88775634765625, -0.824920654296875, -0.7620849609375, -0.699249267578125, -0.63641357421875, -0.573577880859375, -0.5107421875, -0.447906494140625, -0.38507080078125, -0.322235107421875, -0.2593994140625, -0.196563720703125, -0.13372802734375, -0.070892333984375, -0.008056640625, 0.054779052734375, 0.11761474609375, 0.180450439453125, 0.2432861328125, 0.306121826171875, 0.36895751953125, 0.431793212890625, 0.49462890625, 0.557464599609375, 0.62030029296875, 0.683135986328125, 0.7459716796875, 0.808807373046875, 0.87164306640625, 0.934478759765625, 0.997314453125, 1.060150146484375, 1.12298583984375, 1.185821533203125, 1.2486572265625, 1.311492919921875, 1.37432861328125, 1.437164306640625, 1.5]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 7.0, 10.0, 20.0, 22.0, 40.0, 55.0, 93.0, 95.0, 111.0, 153.0, 125.0, 96.0, 52.0, 32.0, 25.0, 18.0, 14.0, 12.0, 3.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.348388671875, -0.33597564697265625, -0.3235626220703125, -0.31114959716796875, -0.298736572265625, -0.28632354736328125, -0.2739105224609375, -0.26149749755859375, -0.24908447265625, -0.23667144775390625, -0.2242584228515625, -0.21184539794921875, -0.199432373046875, -0.18701934814453125, -0.1746063232421875, -0.16219329833984375, -0.1497802734375, -0.13736724853515625, -0.1249542236328125, -0.11254119873046875, -0.100128173828125, -0.08771514892578125, -0.0753021240234375, -0.06288909912109375, -0.05047607421875, -0.03806304931640625, -0.0256500244140625, -0.01323699951171875, -0.000823974609375, 0.01158905029296875, 0.0240020751953125, 0.03641510009765625, 0.048828125, 0.06124114990234375, 0.0736541748046875, 0.08606719970703125, 0.098480224609375, 0.11089324951171875, 0.1233062744140625, 0.13571929931640625, 0.14813232421875, 0.16054534912109375, 0.1729583740234375, 0.18537139892578125, 0.197784423828125, 0.21019744873046875, 0.2226104736328125, 0.23502349853515625, 0.2474365234375, 0.25984954833984375, 0.2722625732421875, 0.28467559814453125, 0.297088623046875, 0.30950164794921875, 0.3219146728515625, 0.33432769775390625, 0.34674072265625, 0.35915374755859375, 0.3715667724609375, 0.38397979736328125, 0.396392822265625, 0.40880584716796875, 0.4212188720703125, 0.43363189697265625, 0.446044921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 43.0, 255.0, 540.0, 119.0, 25.0, 11.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.860916137695312, -29.035783767700195, -28.210649490356445, -27.385517120361328, -26.560382843017578, -25.73525047302246, -24.91011619567871, -24.084983825683594, -23.259849548339844, -22.434717178344727, -21.609582901000977, -20.78445053100586, -19.95931625366211, -19.134183883666992, -18.309049606323242, -17.483917236328125, -16.658782958984375, -15.833649635314941, -15.008516311645508, -14.183382987976074, -13.35824966430664, -12.533117294311523, -11.707983016967773, -10.882850646972656, -10.057718276977539, -9.232584953308105, -8.407451629638672, -7.582318305969238, -6.757184982299805, -5.932052135467529, -5.106918811798096, -4.281785488128662, -3.4566516876220703, -2.6315183639526367, -1.8063851594924927, -0.9812519550323486, -0.15611863136291504, 0.6690144538879395, 1.494147777557373, 2.3192811012268066, 3.1444144248962402, 3.969547748565674, 4.794681072235107, 5.619813919067383, 6.444947242736816, 7.27008056640625, 8.095213890075684, 8.920347213745117, 9.74548053741455, 10.570613861083984, 11.395747184753418, 12.220880508422852, 13.046013832092285, 13.871147155761719, 14.696279525756836, 15.521413803100586, 16.346546173095703, 17.17167854309082, 17.99681282043457, 18.821945190429688, 19.647079467773438, 20.472211837768555, 21.297346115112305, 22.122478485107422, 22.947612762451172]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 11.0, 13.0, 13.0, 17.0, 20.0, 15.0, 18.0, 20.0, 27.0, 27.0, 41.0, 42.0, 42.0, 56.0, 73.0, 64.0, 57.0, 51.0, 35.0, 41.0, 48.0, 41.0, 34.0, 33.0, 33.0, 15.0, 10.0, 21.0, 13.0, 12.0, 7.0, 10.0, 12.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.649940490722656, -8.339446067810059, -8.028952598571777, -7.71845817565918, -7.40796422958374, -7.097470283508301, -6.786975860595703, -6.476481914520264, -6.165987968444824, -5.855494022369385, -5.545000076293945, -5.234505653381348, -4.924011707305908, -4.613517761230469, -4.303023338317871, -3.9925293922424316, -3.682035446166992, -3.3715415000915527, -3.061047315597534, -2.7505531311035156, -2.440059185028076, -2.1295652389526367, -1.8190710544586182, -1.5085768699645996, -1.1980829238891602, -0.8875888586044312, -0.5770947933197021, -0.26660072803497314, 0.04389333724975586, 0.35438740253448486, 0.6648814678192139, 0.9753756523132324, 1.2858695983886719, 1.5963636636734009, 1.9068577289581299, 2.2173519134521484, 2.527845859527588, 2.8383398056030273, 3.148833990097046, 3.4593281745910645, 3.769822120666504, 4.080316066741943, 4.390810012817383, 4.7013044357299805, 5.01179838180542, 5.322292327880859, 5.632786750793457, 5.9432806968688965, 6.253774642944336, 6.564268589019775, 6.874762535095215, 7.1852569580078125, 7.495750904083252, 7.806244850158691, 8.116739273071289, 8.42723274230957, 8.737727165222168, 9.048221588134766, 9.358715057373047, 9.669209480285645, 9.979703903198242, 10.290197372436523, 10.600691795349121, 10.911186218261719, 11.2216796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 2.0, 5.0, 8.0, 15.0, 23.0, 28.0, 59.0, 104.0, 221.0, 585.0, 1697.0, 6730.0, 52782.0, 4001312.0, 117295.0, 9492.0, 2386.0, 845.0, 333.0, 170.0, 76.0, 49.0, 26.0, 13.0, 7.0, 8.0, 5.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.645782470703125, -0.61285400390625, -0.579925537109375, -0.5469970703125, -0.514068603515625, -0.48114013671875, -0.448211669921875, -0.415283203125, -0.382354736328125, -0.34942626953125, -0.316497802734375, -0.2835693359375, -0.250640869140625, -0.21771240234375, -0.184783935546875, -0.15185546875, -0.118927001953125, -0.08599853515625, -0.053070068359375, -0.0201416015625, 0.012786865234375, 0.04571533203125, 0.078643798828125, 0.111572265625, 0.144500732421875, 0.17742919921875, 0.210357666015625, 0.2432861328125, 0.276214599609375, 0.30914306640625, 0.342071533203125, 0.375, 0.407928466796875, 0.44085693359375, 0.473785400390625, 0.5067138671875, 0.539642333984375, 0.57257080078125, 0.605499267578125, 0.638427734375, 0.671356201171875, 0.70428466796875, 0.737213134765625, 0.7701416015625, 0.803070068359375, 0.83599853515625, 0.868927001953125, 0.90185546875, 0.934783935546875, 0.96771240234375, 1.000640869140625, 1.0335693359375, 1.066497802734375, 1.09942626953125, 1.132354736328125, 1.165283203125, 1.198211669921875, 1.23114013671875, 1.264068603515625, 1.2969970703125, 1.329925537109375, 1.36285400390625, 1.395782470703125, 1.4287109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 12.0, 11.0, 13.0, 24.0, 35.0, 29.0, 38.0, 52.0, 37.0, 51.0, 57.0, 78.0, 77.0, 55.0, 59.0, 61.0, 48.0, 49.0, 48.0, 36.0, 23.0, 29.0, 18.0, 14.0, 8.0, 6.0, 1.0, 7.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3994140625, -0.385040283203125, -0.37066650390625, -0.356292724609375, -0.3419189453125, -0.327545166015625, -0.31317138671875, -0.298797607421875, -0.284423828125, -0.270050048828125, -0.25567626953125, -0.241302490234375, -0.2269287109375, -0.212554931640625, -0.19818115234375, -0.183807373046875, -0.16943359375, -0.155059814453125, -0.14068603515625, -0.126312255859375, -0.1119384765625, -0.097564697265625, -0.08319091796875, -0.068817138671875, -0.054443359375, -0.040069580078125, -0.02569580078125, -0.011322021484375, 0.0030517578125, 0.017425537109375, 0.03179931640625, 0.046173095703125, 0.060546875, 0.074920654296875, 0.08929443359375, 0.103668212890625, 0.1180419921875, 0.132415771484375, 0.14678955078125, 0.161163330078125, 0.175537109375, 0.189910888671875, 0.20428466796875, 0.218658447265625, 0.2330322265625, 0.247406005859375, 0.26177978515625, 0.276153564453125, 0.29052734375, 0.304901123046875, 0.31927490234375, 0.333648681640625, 0.3480224609375, 0.362396240234375, 0.37677001953125, 0.391143798828125, 0.405517578125, 0.419891357421875, 0.43426513671875, 0.448638916015625, 0.4630126953125, 0.477386474609375, 0.49176025390625, 0.506134033203125, 0.5205078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 8.0, 13.0, 13.0, 18.0, 17.0, 58.0, 148.0, 519.0, 2803.0, 45298.0, 4116796.0, 26073.0, 1976.0, 352.0, 87.0, 37.0, 30.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3857421875, -1.3312530517578125, -1.276763916015625, -1.2222747802734375, -1.16778564453125, -1.1132965087890625, -1.058807373046875, -1.0043182373046875, -0.9498291015625, -0.8953399658203125, -0.840850830078125, -0.7863616943359375, -0.73187255859375, -0.6773834228515625, -0.622894287109375, -0.5684051513671875, -0.513916015625, -0.4594268798828125, -0.404937744140625, -0.3504486083984375, -0.29595947265625, -0.2414703369140625, -0.186981201171875, -0.1324920654296875, -0.0780029296875, -0.0235137939453125, 0.030975341796875, 0.0854644775390625, 0.13995361328125, 0.1944427490234375, 0.248931884765625, 0.3034210205078125, 0.35791015625, 0.4123992919921875, 0.466888427734375, 0.5213775634765625, 0.57586669921875, 0.6303558349609375, 0.684844970703125, 0.7393341064453125, 0.7938232421875, 0.8483123779296875, 0.902801513671875, 0.9572906494140625, 1.01177978515625, 1.0662689208984375, 1.120758056640625, 1.1752471923828125, 1.229736328125, 1.2842254638671875, 1.338714599609375, 1.3932037353515625, 1.44769287109375, 1.5021820068359375, 1.556671142578125, 1.6111602783203125, 1.6656494140625, 1.7201385498046875, 1.774627685546875, 1.8291168212890625, 1.88360595703125, 1.9380950927734375, 1.992584228515625, 2.0470733642578125, 2.1015625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 8.0, 11.0, 10.0, 11.0, 14.0, 23.0, 32.0, 45.0, 98.0, 301.0, 1295.0, 1599.0, 376.0, 93.0, 55.0, 24.0, 18.0, 10.0, 11.0, 7.0, 1.0, 5.0, 5.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1826171875, -1.1523971557617188, -1.1221771240234375, -1.0919570922851562, -1.061737060546875, -1.0315170288085938, -1.0012969970703125, -0.9710769653320312, -0.94085693359375, -0.9106369018554688, -0.8804168701171875, -0.8501968383789062, -0.819976806640625, -0.7897567749023438, -0.7595367431640625, -0.7293167114257812, -0.6990966796875, -0.6688766479492188, -0.6386566162109375, -0.6084365844726562, -0.578216552734375, -0.5479965209960938, -0.5177764892578125, -0.48755645751953125, -0.45733642578125, -0.42711639404296875, -0.3968963623046875, -0.36667633056640625, -0.336456298828125, -0.30623626708984375, -0.2760162353515625, -0.24579620361328125, -0.215576171875, -0.18535614013671875, -0.1551361083984375, -0.12491607666015625, -0.094696044921875, -0.06447601318359375, -0.0342559814453125, -0.00403594970703125, 0.02618408203125, 0.05640411376953125, 0.0866241455078125, 0.11684417724609375, 0.147064208984375, 0.17728424072265625, 0.2075042724609375, 0.23772430419921875, 0.2679443359375, 0.29816436767578125, 0.3283843994140625, 0.35860443115234375, 0.388824462890625, 0.41904449462890625, 0.4492645263671875, 0.47948455810546875, 0.50970458984375, 0.5399246215820312, 0.5701446533203125, 0.6003646850585938, 0.630584716796875, 0.6608047485351562, 0.6910247802734375, 0.7212448120117188, 0.75146484375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 3.0, 7.0, 11.0, 18.0, 45.0, 152.0, 269.0, 288.0, 134.0, 39.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.934274673461914, -8.717409133911133, -8.500543594360352, -8.28367805480957, -8.066812515258789, -7.849946975708008, -7.633081912994385, -7.4162163734436035, -7.199350833892822, -6.982485294342041, -6.76561975479126, -6.5487542152404785, -6.3318891525268555, -6.115023612976074, -5.898158073425293, -5.681292533874512, -5.4644269943237305, -5.247561454772949, -5.030695915222168, -4.813830375671387, -4.5969648361206055, -4.380099296569824, -4.163234233856201, -3.94636869430542, -3.7295031547546387, -3.5126376152038574, -3.295772075653076, -3.078906774520874, -2.8620412349700928, -2.6451756954193115, -2.4283103942871094, -2.211444854736328, -1.9945788383483887, -1.7777132987976074, -1.5608478784561157, -1.343982458114624, -1.1271169185638428, -0.9102513790130615, -0.6933859586715698, -0.4765205383300781, -0.2596549987792969, -0.0427895188331604, 0.17407596111297607, 0.39094144105911255, 0.607806921005249, 0.8246724605560303, 1.041537880897522, 1.2584033012390137, 1.475268840789795, 1.6921343803405762, 1.9089998006820679, 2.1258652210235596, 2.342730760574341, 2.559596300125122, 2.776461601257324, 2.9933271408081055, 3.2101926803588867, 3.427058219909668, 3.643923759460449, 3.8607890605926514, 4.077654838562012, 4.294520378112793, 4.511385440826416, 4.728250980377197, 4.9451165199279785]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 9.0, 5.0, 7.0, 18.0, 12.0, 21.0, 13.0, 23.0, 27.0, 33.0, 27.0, 39.0, 46.0, 51.0, 46.0, 49.0, 60.0, 37.0, 54.0, 47.0, 54.0, 48.0, 39.0, 35.0, 32.0, 34.0, 31.0, 21.0, 14.0, 11.0, 12.0, 7.0, 5.0, 11.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.226373672485352, -4.113289833068848, -4.0002055168151855, -3.8871214389801025, -3.7740373611450195, -3.6609535217285156, -3.5478692054748535, -3.4347853660583496, -3.3217012882232666, -3.2086172103881836, -3.0955331325531006, -2.9824490547180176, -2.8693649768829346, -2.7562808990478516, -2.6431970596313477, -2.5301129817962646, -2.4170289039611816, -2.3039448261260986, -2.1908607482910156, -2.0777766704559326, -1.9646927118301392, -1.8516086339950562, -1.7385245561599731, -1.6254405975341797, -1.5123562812805176, -1.3992722034454346, -1.2861881256103516, -1.1731040477752686, -1.060020089149475, -0.9469360113143921, -0.8338519334793091, -0.7207679152488708, -0.6076838970184326, -0.494599848985672, -0.3815158009529114, -0.26843172311782837, -0.15534767508506775, -0.04226362705230713, 0.07082045078277588, 0.1839044690132141, 0.2969885468482971, 0.41007259488105774, 0.5231566429138184, 0.6362407207489014, 0.7493247985839844, 0.8624088168144226, 0.9754928946495056, 1.0885769128799438, 1.2016609907150269, 1.3147450685501099, 1.4278291463851929, 1.5409131050109863, 1.6539971828460693, 1.7670812606811523, 1.8801653385162354, 1.9932494163513184, 2.1063334941864014, 2.2194175720214844, 2.3325016498565674, 2.4455857276916504, 2.5586698055267334, 2.6717538833618164, 2.7848377227783203, 2.8979218006134033, 3.0110058784484863]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 15.0, 34.0, 26.0, 53.0, 72.0, 111.0, 142.0, 218.0, 359.0, 534.0, 855.0, 1517.0, 2430.0, 4340.0, 8104.0, 15859.0, 33339.0, 75341.0, 183625.0, 340089.0, 215784.0, 88227.0, 38286.0, 18115.0, 9153.0, 4873.0, 2727.0, 1624.0, 979.0, 602.0, 379.0, 246.0, 159.0, 96.0, 71.0, 44.0, 30.0, 25.0, 18.0, 14.0, 6.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.29150390625, -0.28197479248046875, -0.2724456787109375, -0.26291656494140625, -0.253387451171875, -0.24385833740234375, -0.2343292236328125, -0.22480010986328125, -0.21527099609375, -0.20574188232421875, -0.1962127685546875, -0.18668365478515625, -0.177154541015625, -0.16762542724609375, -0.1580963134765625, -0.14856719970703125, -0.1390380859375, -0.12950897216796875, -0.1199798583984375, -0.11045074462890625, -0.100921630859375, -0.09139251708984375, -0.0818634033203125, -0.07233428955078125, -0.06280517578125, -0.05327606201171875, -0.0437469482421875, -0.03421783447265625, -0.024688720703125, -0.01515960693359375, -0.0056304931640625, 0.00389862060546875, 0.013427734375, 0.02295684814453125, 0.0324859619140625, 0.04201507568359375, 0.051544189453125, 0.06107330322265625, 0.0706024169921875, 0.08013153076171875, 0.08966064453125, 0.09918975830078125, 0.1087188720703125, 0.11824798583984375, 0.127777099609375, 0.13730621337890625, 0.1468353271484375, 0.15636444091796875, 0.1658935546875, 0.17542266845703125, 0.1849517822265625, 0.19448089599609375, 0.204010009765625, 0.21353912353515625, 0.2230682373046875, 0.23259735107421875, 0.24212646484375, 0.25165557861328125, 0.2611846923828125, 0.27071380615234375, 0.280242919921875, 0.28977203369140625, 0.2993011474609375, 0.30883026123046875, 0.318359375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 7.0, 14.0, 16.0, 12.0, 17.0, 24.0, 17.0, 28.0, 25.0, 36.0, 46.0, 59.0, 43.0, 39.0, 61.0, 56.0, 46.0, 62.0, 40.0, 46.0, 48.0, 45.0, 32.0, 31.0, 27.0, 21.0, 13.0, 22.0, 8.0, 12.0, 7.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34619140625, -0.33492279052734375, -0.3236541748046875, -0.31238555908203125, -0.301116943359375, -0.28984832763671875, -0.2785797119140625, -0.26731109619140625, -0.25604248046875, -0.24477386474609375, -0.2335052490234375, -0.22223663330078125, -0.210968017578125, -0.19969940185546875, -0.1884307861328125, -0.17716217041015625, -0.1658935546875, -0.15462493896484375, -0.1433563232421875, -0.13208770751953125, -0.120819091796875, -0.10955047607421875, -0.0982818603515625, -0.08701324462890625, -0.07574462890625, -0.06447601318359375, -0.0532073974609375, -0.04193878173828125, -0.030670166015625, -0.01940155029296875, -0.0081329345703125, 0.00313568115234375, 0.014404296875, 0.02567291259765625, 0.0369415283203125, 0.04821014404296875, 0.059478759765625, 0.07074737548828125, 0.0820159912109375, 0.09328460693359375, 0.10455322265625, 0.11582183837890625, 0.1270904541015625, 0.13835906982421875, 0.149627685546875, 0.16089630126953125, 0.1721649169921875, 0.18343353271484375, 0.1947021484375, 0.20597076416015625, 0.2172393798828125, 0.22850799560546875, 0.239776611328125, 0.25104522705078125, 0.2623138427734375, 0.27358245849609375, 0.28485107421875, 0.29611968994140625, 0.3073883056640625, 0.31865692138671875, 0.329925537109375, 0.34119415283203125, 0.3524627685546875, 0.36373138427734375, 0.375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 13.0, 9.0, 11.0, 9.0, 20.0, 31.0, 66.0, 56.0, 123.0, 207.0, 380.0, 702.0, 1894.0, 9539.0, 230640.0, 778746.0, 21190.0, 2877.0, 937.0, 474.0, 250.0, 162.0, 78.0, 55.0, 26.0, 18.0, 18.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.505859375, -1.466400146484375, -1.42694091796875, -1.387481689453125, -1.3480224609375, -1.308563232421875, -1.26910400390625, -1.229644775390625, -1.190185546875, -1.150726318359375, -1.11126708984375, -1.071807861328125, -1.0323486328125, -0.992889404296875, -0.95343017578125, -0.913970947265625, -0.87451171875, -0.835052490234375, -0.79559326171875, -0.756134033203125, -0.7166748046875, -0.677215576171875, -0.63775634765625, -0.598297119140625, -0.558837890625, -0.519378662109375, -0.47991943359375, -0.440460205078125, -0.4010009765625, -0.361541748046875, -0.32208251953125, -0.282623291015625, -0.2431640625, -0.203704833984375, -0.16424560546875, -0.124786376953125, -0.0853271484375, -0.045867919921875, -0.00640869140625, 0.033050537109375, 0.072509765625, 0.111968994140625, 0.15142822265625, 0.190887451171875, 0.2303466796875, 0.269805908203125, 0.30926513671875, 0.348724365234375, 0.38818359375, 0.427642822265625, 0.46710205078125, 0.506561279296875, 0.5460205078125, 0.585479736328125, 0.62493896484375, 0.664398193359375, 0.703857421875, 0.743316650390625, 0.78277587890625, 0.822235107421875, 0.8616943359375, 0.901153564453125, 0.94061279296875, 0.980072021484375, 1.01953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 9.0, 10.0, 8.0, 6.0, 16.0, 23.0, 19.0, 16.0, 25.0, 29.0, 45.0, 59.0, 68.0, 54.0, 52.0, 37.0, 59.0, 56.0, 43.0, 41.0, 41.0, 47.0, 39.0, 43.0, 25.0, 37.0, 16.0, 24.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.34478759765625, -1.2989501953125, -1.25311279296875, -1.207275390625, -1.16143798828125, -1.1156005859375, -1.06976318359375, -1.02392578125, -0.97808837890625, -0.9322509765625, -0.88641357421875, -0.840576171875, -0.79473876953125, -0.7489013671875, -0.70306396484375, -0.6572265625, -0.61138916015625, -0.5655517578125, -0.51971435546875, -0.473876953125, -0.42803955078125, -0.3822021484375, -0.33636474609375, -0.29052734375, -0.24468994140625, -0.1988525390625, -0.15301513671875, -0.107177734375, -0.06134033203125, -0.0155029296875, 0.03033447265625, 0.076171875, 0.12200927734375, 0.1678466796875, 0.21368408203125, 0.259521484375, 0.30535888671875, 0.3511962890625, 0.39703369140625, 0.44287109375, 0.48870849609375, 0.5345458984375, 0.58038330078125, 0.626220703125, 0.67205810546875, 0.7178955078125, 0.76373291015625, 0.8095703125, 0.85540771484375, 0.9012451171875, 0.94708251953125, 0.992919921875, 1.03875732421875, 1.0845947265625, 1.13043212890625, 1.17626953125, 1.22210693359375, 1.2679443359375, 1.31378173828125, 1.359619140625, 1.40545654296875, 1.4512939453125, 1.49713134765625, 1.54296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 12.0, 20.0, 37.0, 58.0, 119.0, 231.0, 770.0, 4367.0, 401056.0, 635590.0, 5009.0, 768.0, 250.0, 105.0, 54.0, 32.0, 24.0, 12.0, 10.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359619140625, -0.3416633605957031, -0.32370758056640625, -0.3057518005371094, -0.2877960205078125, -0.2698402404785156, -0.25188446044921875, -0.23392868041992188, -0.215972900390625, -0.19801712036132812, -0.18006134033203125, -0.16210556030273438, -0.1441497802734375, -0.12619400024414062, -0.10823822021484375, -0.09028244018554688, -0.07232666015625, -0.054370880126953125, -0.03641510009765625, -0.018459320068359375, -0.0005035400390625, 0.017452239990234375, 0.03540802001953125, 0.053363800048828125, 0.071319580078125, 0.08927536010742188, 0.10723114013671875, 0.12518692016601562, 0.1431427001953125, 0.16109848022460938, 0.17905426025390625, 0.19701004028320312, 0.2149658203125, 0.23292160034179688, 0.25087738037109375, 0.2688331604003906, 0.2867889404296875, 0.3047447204589844, 0.32270050048828125, 0.3406562805175781, 0.358612060546875, 0.3765678405761719, 0.39452362060546875, 0.4124794006347656, 0.4304351806640625, 0.4483909606933594, 0.46634674072265625, 0.4843025207519531, 0.50225830078125, 0.5202140808105469, 0.5381698608398438, 0.5561256408691406, 0.5740814208984375, 0.5920372009277344, 0.6099929809570312, 0.6279487609863281, 0.645904541015625, 0.6638603210449219, 0.6818161010742188, 0.6997718811035156, 0.7177276611328125, 0.7356834411621094, 0.7536392211914062, 0.7715950012207031, 0.78955078125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 7.0, 7.0, 15.0, 18.0, 19.0, 20.0, 31.0, 53.0, 62.0, 61.0, 89.0, 103.0, 101.0, 88.0, 84.0, 50.0, 45.0, 27.0, 13.0, 17.0, 21.0, 6.0, 10.0, 5.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.263090133666992e-05, -5.09209930896759e-05, -4.9211084842681885e-05, -4.7501176595687866e-05, -4.579126834869385e-05, -4.408136010169983e-05, -4.237145185470581e-05, -4.066154360771179e-05, -3.8951635360717773e-05, -3.7241727113723755e-05, -3.5531818866729736e-05, -3.382191061973572e-05, -3.21120023727417e-05, -3.040209412574768e-05, -2.8692185878753662e-05, -2.6982277631759644e-05, -2.5272369384765625e-05, -2.3562461137771606e-05, -2.1852552890777588e-05, -2.014264464378357e-05, -1.843273639678955e-05, -1.6722828149795532e-05, -1.5012919902801514e-05, -1.3303011655807495e-05, -1.1593103408813477e-05, -9.883195161819458e-06, -8.17328691482544e-06, -6.463378667831421e-06, -4.753470420837402e-06, -3.043562173843384e-06, -1.3336539268493652e-06, 3.762543201446533e-07, 2.086162567138672e-06, 3.7960708141326904e-06, 5.505979061126709e-06, 7.2158873081207275e-06, 8.925795555114746e-06, 1.0635703802108765e-05, 1.2345612049102783e-05, 1.4055520296096802e-05, 1.576542854309082e-05, 1.747533679008484e-05, 1.9185245037078857e-05, 2.0895153284072876e-05, 2.2605061531066895e-05, 2.4314969778060913e-05, 2.602487802505493e-05, 2.773478627204895e-05, 2.944469451904297e-05, 3.115460276603699e-05, 3.2864511013031006e-05, 3.4574419260025024e-05, 3.628432750701904e-05, 3.799423575401306e-05, 3.970414400100708e-05, 4.14140522480011e-05, 4.312396049499512e-05, 4.4833868741989136e-05, 4.6543776988983154e-05, 4.825368523597717e-05, 4.996359348297119e-05, 5.167350172996521e-05, 5.338340997695923e-05, 5.509331822395325e-05, 5.6803226470947266e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 16.0, 20.0, 31.0, 69.0, 85.0, 157.0, 240.0, 577.0, 1504.0, 5554.0, 49707.0, 855046.0, 123237.0, 8695.0, 2063.0, 729.0, 330.0, 168.0, 105.0, 62.0, 34.0, 29.0, 21.0, 17.0, 9.0, 11.0, 6.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35400390625, -0.3440704345703125, -0.334136962890625, -0.3242034912109375, -0.31427001953125, -0.3043365478515625, -0.294403076171875, -0.2844696044921875, -0.2745361328125, -0.2646026611328125, -0.254669189453125, -0.2447357177734375, -0.23480224609375, -0.2248687744140625, -0.214935302734375, -0.2050018310546875, -0.195068359375, -0.1851348876953125, -0.175201416015625, -0.1652679443359375, -0.15533447265625, -0.1454010009765625, -0.135467529296875, -0.1255340576171875, -0.1156005859375, -0.1056671142578125, -0.095733642578125, -0.0858001708984375, -0.07586669921875, -0.0659332275390625, -0.055999755859375, -0.0460662841796875, -0.0361328125, -0.0261993408203125, -0.016265869140625, -0.0063323974609375, 0.00360107421875, 0.0135345458984375, 0.023468017578125, 0.0334014892578125, 0.0433349609375, 0.0532684326171875, 0.063201904296875, 0.0731353759765625, 0.08306884765625, 0.0930023193359375, 0.102935791015625, 0.1128692626953125, 0.122802734375, 0.1327362060546875, 0.142669677734375, 0.1526031494140625, 0.16253662109375, 0.1724700927734375, 0.182403564453125, 0.1923370361328125, 0.2022705078125, 0.2122039794921875, 0.222137451171875, 0.2320709228515625, 0.24200439453125, 0.2519378662109375, 0.261871337890625, 0.2718048095703125, 0.28173828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 8.0, 8.0, 15.0, 18.0, 24.0, 39.0, 30.0, 51.0, 67.0, 75.0, 76.0, 91.0, 87.0, 64.0, 71.0, 61.0, 39.0, 31.0, 36.0, 20.0, 21.0, 12.0, 11.0, 3.0, 6.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.2310791015625, -0.22271156311035156, -0.21434402465820312, -0.2059764862060547, -0.19760894775390625, -0.1892414093017578, -0.18087387084960938, -0.17250633239746094, -0.1641387939453125, -0.15577125549316406, -0.14740371704101562, -0.1390361785888672, -0.13066864013671875, -0.12230110168457031, -0.11393356323242188, -0.10556602478027344, -0.097198486328125, -0.08883094787597656, -0.08046340942382812, -0.07209587097167969, -0.06372833251953125, -0.05536079406738281, -0.046993255615234375, -0.03862571716308594, -0.0302581787109375, -0.021890640258789062, -0.013523101806640625, -0.0051555633544921875, 0.00321197509765625, 0.011579513549804688, 0.019947052001953125, 0.028314590454101562, 0.03668212890625, 0.04504966735839844, 0.053417205810546875, 0.06178474426269531, 0.07015228271484375, 0.07851982116699219, 0.08688735961914062, 0.09525489807128906, 0.1036224365234375, 0.11198997497558594, 0.12035751342773438, 0.1287250518798828, 0.13709259033203125, 0.1454601287841797, 0.15382766723632812, 0.16219520568847656, 0.170562744140625, 0.17893028259277344, 0.18729782104492188, 0.1956653594970703, 0.20403289794921875, 0.2124004364013672, 0.22076797485351562, 0.22913551330566406, 0.2375030517578125, 0.24587059020996094, 0.2542381286621094, 0.2626056671142578, 0.27097320556640625, 0.2793407440185547, 0.2877082824707031, 0.29607582092285156, 0.304443359375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 8.0, 13.0, 8.0, 56.0, 141.0, 389.0, 296.0, 60.0, 19.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.575984954833984, -5.2640790939331055, -4.952172756195068, -4.640266418457031, -4.328360557556152, -4.016454696655273, -3.7045483589172363, -3.3926422595977783, -3.0807361602783203, -2.7688300609588623, -2.4569239616394043, -2.1450178623199463, -1.8331117630004883, -1.5212056636810303, -1.2092995643615723, -0.8973934650421143, -0.5854873657226562, -0.27358126640319824, 0.038324832916259766, 0.3502309322357178, 0.6621370315551758, 0.9740431308746338, 1.2859492301940918, 1.5978553295135498, 1.9097614288330078, 2.221667528152466, 2.533573627471924, 2.845479726791382, 3.15738582611084, 3.469291925430298, 3.781198024749756, 4.093104362487793, 4.405011177062988, 4.716917037963867, 5.028823375701904, 5.340729713439941, 5.65263557434082, 5.964541435241699, 6.276447772979736, 6.588354110717773, 6.900259971618652, 7.212165832519531, 7.524072170257568, 7.8359785079956055, 8.147884368896484, 8.459790229797363, 8.771696090698242, 9.083602905273438, 9.395508766174316, 9.707414627075195, 10.01932144165039, 10.33122730255127, 10.643133163452148, 10.955039024353027, 11.266944885253906, 11.578851699829102, 11.89075756072998, 12.20266342163086, 12.514570236206055, 12.826476097106934, 13.138381958007812, 13.450287818908691, 13.76219367980957, 14.074100494384766, 14.386006355285645]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 12.0, 15.0, 20.0, 18.0, 19.0, 27.0, 32.0, 45.0, 35.0, 48.0, 46.0, 53.0, 75.0, 63.0, 72.0, 67.0, 49.0, 51.0, 48.0, 38.0, 33.0, 23.0, 24.0, 12.0, 27.0, 18.0, 11.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0], "bins": [-8.951157569885254, -8.741640090942383, -8.532122611999512, -8.32260513305664, -8.113086700439453, -7.903569221496582, -7.694051742553711, -7.48453426361084, -7.275016784667969, -7.065499305725098, -6.855981349945068, -6.646463871002197, -6.436946392059326, -6.227428436279297, -6.017910957336426, -5.808393478393555, -5.598875522613525, -5.389358043670654, -5.179840087890625, -4.970322608947754, -4.760805130004883, -4.551287651062012, -4.341769695281982, -4.132252216339111, -3.922734498977661, -3.713216781616211, -3.50369930267334, -3.2941815853118896, -3.0846638679504395, -2.8751463890075684, -2.665628671646118, -2.456110954284668, -2.246593475341797, -2.0370757579803467, -1.8275582790374756, -1.6180405616760254, -1.4085229635238647, -1.199005365371704, -0.9894876480102539, -0.7799700498580933, -0.5704524517059326, -0.3609348237514496, -0.15141719579696655, 0.05810046195983887, 0.2676180601119995, 0.47713565826416016, 0.6866533756256104, 0.896170973777771, 1.1056885719299316, 1.3152061700820923, 1.524723768234253, 1.7342414855957031, 1.9437590837478638, 2.1532766819000244, 2.3627943992614746, 2.5723118782043457, 2.781829595565796, 2.991347312927246, 3.200864791870117, 3.4103825092315674, 3.6199002265930176, 3.8294177055358887, 4.038935661315918, 4.248453140258789, 4.45797061920166]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 10.0, 21.0, 22.0, 36.0, 34.0, 47.0, 78.0, 96.0, 154.0, 274.0, 576.0, 3393.0, 2916750.0, 1267795.0, 3770.0, 548.0, 218.0, 122.0, 80.0, 58.0, 50.0, 25.0, 23.0, 21.0, 21.0, 8.0, 6.0, 8.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.60546875, -1.550048828125, -1.49462890625, -1.439208984375, -1.3837890625, -1.328369140625, -1.27294921875, -1.217529296875, -1.162109375, -1.106689453125, -1.05126953125, -0.995849609375, -0.9404296875, -0.885009765625, -0.82958984375, -0.774169921875, -0.71875, -0.663330078125, -0.60791015625, -0.552490234375, -0.4970703125, -0.441650390625, -0.38623046875, -0.330810546875, -0.275390625, -0.219970703125, -0.16455078125, -0.109130859375, -0.0537109375, 0.001708984375, 0.05712890625, 0.112548828125, 0.16796875, 0.223388671875, 0.27880859375, 0.334228515625, 0.3896484375, 0.445068359375, 0.50048828125, 0.555908203125, 0.611328125, 0.666748046875, 0.72216796875, 0.777587890625, 0.8330078125, 0.888427734375, 0.94384765625, 0.999267578125, 1.0546875, 1.110107421875, 1.16552734375, 1.220947265625, 1.2763671875, 1.331787109375, 1.38720703125, 1.442626953125, 1.498046875, 1.553466796875, 1.60888671875, 1.664306640625, 1.7197265625, 1.775146484375, 1.83056640625, 1.885986328125, 1.94140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 9.0, 16.0, 26.0, 41.0, 62.0, 71.0, 100.0, 118.0, 123.0, 122.0, 101.0, 88.0, 53.0, 39.0, 18.0, 15.0, 10.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.177734375, -1.1543693542480469, -1.1310043334960938, -1.1076393127441406, -1.0842742919921875, -1.0609092712402344, -1.0375442504882812, -1.0141792297363281, -0.990814208984375, -0.9674491882324219, -0.9440841674804688, -0.9207191467285156, -0.8973541259765625, -0.8739891052246094, -0.8506240844726562, -0.8272590637207031, -0.80389404296875, -0.7805290222167969, -0.7571640014648438, -0.7337989807128906, -0.7104339599609375, -0.6870689392089844, -0.6637039184570312, -0.6403388977050781, -0.616973876953125, -0.5936088562011719, -0.5702438354492188, -0.5468788146972656, -0.5235137939453125, -0.5001487731933594, -0.47678375244140625, -0.4534187316894531, -0.4300537109375, -0.4066886901855469, -0.38332366943359375, -0.3599586486816406, -0.3365936279296875, -0.3132286071777344, -0.28986358642578125, -0.2664985656738281, -0.243133544921875, -0.21976852416992188, -0.19640350341796875, -0.17303848266601562, -0.1496734619140625, -0.12630844116210938, -0.10294342041015625, -0.07957839965820312, -0.05621337890625, -0.032848358154296875, -0.00948333740234375, 0.013881683349609375, 0.0372467041015625, 0.060611724853515625, 0.08397674560546875, 0.10734176635742188, 0.130706787109375, 0.15407180786132812, 0.17743682861328125, 0.20080184936523438, 0.2241668701171875, 0.24753189086914062, 0.27089691162109375, 0.2942619323730469, 0.317626953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 14.0, 9.0, 13.0, 20.0, 38.0, 54.0, 91.0, 120.0, 207.0, 323.0, 559.0, 1003.0, 2158.0, 4897.0, 13425.0, 54437.0, 1470335.0, 2549161.0, 70091.0, 15976.0, 5775.0, 2601.0, 1285.0, 618.0, 400.0, 245.0, 142.0, 103.0, 50.0, 47.0, 22.0, 21.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4271659851074219, -0.41341400146484375, -0.3996620178222656, -0.3859100341796875, -0.3721580505371094, -0.35840606689453125, -0.3446540832519531, -0.330902099609375, -0.3171501159667969, -0.30339813232421875, -0.2896461486816406, -0.2758941650390625, -0.2621421813964844, -0.24839019775390625, -0.23463821411132812, -0.22088623046875, -0.20713424682617188, -0.19338226318359375, -0.17963027954101562, -0.1658782958984375, -0.15212631225585938, -0.13837432861328125, -0.12462234497070312, -0.110870361328125, -0.09711837768554688, -0.08336639404296875, -0.06961441040039062, -0.0558624267578125, -0.042110443115234375, -0.02835845947265625, -0.014606475830078125, -0.0008544921875, 0.012897491455078125, 0.02664947509765625, 0.040401458740234375, 0.0541534423828125, 0.06790542602539062, 0.08165740966796875, 0.09540939331054688, 0.109161376953125, 0.12291336059570312, 0.13666534423828125, 0.15041732788085938, 0.1641693115234375, 0.17792129516601562, 0.19167327880859375, 0.20542526245117188, 0.21917724609375, 0.23292922973632812, 0.24668121337890625, 0.2604331970214844, 0.2741851806640625, 0.2879371643066406, 0.30168914794921875, 0.3154411315917969, 0.329193115234375, 0.3429450988769531, 0.35669708251953125, 0.3704490661621094, 0.3842010498046875, 0.3979530334472656, 0.41170501708984375, 0.4254570007324219, 0.439208984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 8.0, 3.0, 7.0, 13.0, 11.0, 34.0, 36.0, 113.0, 382.0, 1400.0, 1425.0, 384.0, 103.0, 54.0, 29.0, 31.0, 7.0, 4.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.85205078125, -0.8270111083984375, -0.801971435546875, -0.7769317626953125, -0.75189208984375, -0.7268524169921875, -0.701812744140625, -0.6767730712890625, -0.6517333984375, -0.6266937255859375, -0.601654052734375, -0.5766143798828125, -0.55157470703125, -0.5265350341796875, -0.501495361328125, -0.4764556884765625, -0.451416015625, -0.4263763427734375, -0.401336669921875, -0.3762969970703125, -0.35125732421875, -0.3262176513671875, -0.301177978515625, -0.2761383056640625, -0.2510986328125, -0.2260589599609375, -0.201019287109375, -0.1759796142578125, -0.15093994140625, -0.1259002685546875, -0.100860595703125, -0.0758209228515625, -0.05078125, -0.0257415771484375, -0.000701904296875, 0.0243377685546875, 0.04937744140625, 0.0744171142578125, 0.099456787109375, 0.1244964599609375, 0.1495361328125, 0.1745758056640625, 0.199615478515625, 0.2246551513671875, 0.24969482421875, 0.2747344970703125, 0.299774169921875, 0.3248138427734375, 0.349853515625, 0.3748931884765625, 0.399932861328125, 0.4249725341796875, 0.45001220703125, 0.4750518798828125, 0.500091552734375, 0.5251312255859375, 0.5501708984375, 0.5752105712890625, 0.600250244140625, 0.6252899169921875, 0.65032958984375, 0.6753692626953125, 0.700408935546875, 0.7254486083984375, 0.75048828125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 11.0, 33.0, 77.0, 180.0, 327.0, 235.0, 78.0, 32.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.667299270629883, -5.51667594909668, -5.366052627563477, -5.215429306030273, -5.06480598449707, -4.914182662963867, -4.763559341430664, -4.612936019897461, -4.462312698364258, -4.311689376831055, -4.161066055297852, -4.010442733764648, -3.8598194122314453, -3.709196090698242, -3.558572769165039, -3.407949447631836, -3.2573258876800537, -3.1067025661468506, -2.9560792446136475, -2.8054559230804443, -2.654832601547241, -2.504209280014038, -2.353585720062256, -2.2029623985290527, -2.0523390769958496, -1.9017157554626465, -1.7510924339294434, -1.6004691123962402, -1.449845790863037, -1.299222469329834, -1.1485990285873413, -0.9979757070541382, -0.8473525047302246, -0.6967291831970215, -0.5461058616638184, -0.39548248052597046, -0.24485915899276733, -0.09423583745956421, 0.05638754367828369, 0.20701086521148682, 0.35763418674468994, 0.5082575082778931, 0.6588808298110962, 0.8095042109489441, 0.9601275324821472, 1.1107509136199951, 1.2613742351531982, 1.4119975566864014, 1.5626208782196045, 1.7132441997528076, 1.8638675212860107, 2.014490842819214, 2.165114164352417, 2.31573748588562, 2.4663610458374023, 2.6169843673706055, 2.7676076889038086, 2.9182310104370117, 3.068854331970215, 3.219477653503418, 3.370100975036621, 3.520724296569824, 3.6713476181030273, 3.8219709396362305, 3.9725942611694336]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 11.0, 13.0, 20.0, 22.0, 41.0, 52.0, 68.0, 91.0, 77.0, 80.0, 103.0, 84.0, 75.0, 63.0, 46.0, 47.0, 33.0, 28.0, 18.0, 13.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2218856811523438, -2.1032114028930664, -1.9845373630523682, -1.8658630847930908, -1.7471890449523926, -1.6285147666931152, -1.5098406076431274, -1.3911664485931396, -1.2724922895431519, -1.153818130493164, -1.0351439714431763, -0.9164697527885437, -0.7977955937385559, -0.6791214346885681, -0.5604472160339355, -0.44177305698394775, -0.32309889793395996, -0.20442472398281097, -0.08575055003166199, 0.03292363882064819, 0.151597797870636, 0.2702719569206238, 0.38894617557525635, 0.5076203346252441, 0.6262944936752319, 0.7449686527252197, 0.8636428117752075, 0.9823170304298401, 1.1009912490844727, 1.219665288925171, 1.3383395671844482, 1.457013726234436, 1.5756878852844238, 1.6943620443344116, 1.8130362033843994, 1.9317104816436768, 2.050384521484375, 2.1690587997436523, 2.2877330780029297, 2.406407117843628, 2.525081157684326, 2.6437554359436035, 2.7624294757843018, 2.881103754043579, 2.9997777938842773, 3.1184520721435547, 3.237126350402832, 3.3558003902435303, 3.4744746685028076, 3.593148946762085, 3.711822986602783, 3.8304972648620605, 3.949171304702759, 4.067845344543457, 4.186519622802734, 4.305193901062012, 4.423868179321289, 4.542542457580566, 4.661216735839844, 4.779890537261963, 4.89856481552124, 5.017239093780518, 5.135913372039795, 5.254587173461914, 5.373261451721191]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 3.0, 11.0, 14.0, 17.0, 29.0, 40.0, 64.0, 109.0, 147.0, 250.0, 397.0, 710.0, 1205.0, 2547.0, 5061.0, 11733.0, 28457.0, 76295.0, 225806.0, 405289.0, 184016.0, 63088.0, 24010.0, 9930.0, 4365.0, 2175.0, 1136.0, 632.0, 373.0, 239.0, 156.0, 75.0, 70.0, 31.0, 27.0, 13.0, 11.0, 4.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.31201171875, -0.30175018310546875, -0.2914886474609375, -0.28122711181640625, -0.270965576171875, -0.26070404052734375, -0.2504425048828125, -0.24018096923828125, -0.22991943359375, -0.21965789794921875, -0.2093963623046875, -0.19913482666015625, -0.188873291015625, -0.17861175537109375, -0.1683502197265625, -0.15808868408203125, -0.1478271484375, -0.13756561279296875, -0.1273040771484375, -0.11704254150390625, -0.106781005859375, -0.09651947021484375, -0.0862579345703125, -0.07599639892578125, -0.06573486328125, -0.05547332763671875, -0.0452117919921875, -0.03495025634765625, -0.024688720703125, -0.01442718505859375, -0.0041656494140625, 0.00609588623046875, 0.016357421875, 0.02661895751953125, 0.0368804931640625, 0.04714202880859375, 0.057403564453125, 0.06766510009765625, 0.0779266357421875, 0.08818817138671875, 0.09844970703125, 0.10871124267578125, 0.1189727783203125, 0.12923431396484375, 0.139495849609375, 0.14975738525390625, 0.1600189208984375, 0.17028045654296875, 0.1805419921875, 0.19080352783203125, 0.2010650634765625, 0.21132659912109375, 0.221588134765625, 0.23184967041015625, 0.2421112060546875, 0.25237274169921875, 0.26263427734375, 0.27289581298828125, 0.2831573486328125, 0.29341888427734375, 0.303680419921875, 0.31394195556640625, 0.3242034912109375, 0.33446502685546875, 0.3447265625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 10.0, 14.0, 15.0, 15.0, 19.0, 29.0, 20.0, 38.0, 49.0, 44.0, 45.0, 50.0, 52.0, 52.0, 69.0, 64.0, 50.0, 53.0, 44.0, 49.0, 42.0, 36.0, 26.0, 23.0, 24.0, 15.0, 15.0, 12.0, 6.0, 5.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.39892578125, -0.38800811767578125, -0.3770904541015625, -0.36617279052734375, -0.355255126953125, -0.34433746337890625, -0.3334197998046875, -0.32250213623046875, -0.31158447265625, -0.30066680908203125, -0.2897491455078125, -0.27883148193359375, -0.267913818359375, -0.25699615478515625, -0.2460784912109375, -0.23516082763671875, -0.2242431640625, -0.21332550048828125, -0.2024078369140625, -0.19149017333984375, -0.180572509765625, -0.16965484619140625, -0.1587371826171875, -0.14781951904296875, -0.13690185546875, -0.12598419189453125, -0.1150665283203125, -0.10414886474609375, -0.093231201171875, -0.08231353759765625, -0.0713958740234375, -0.06047821044921875, -0.049560546875, -0.03864288330078125, -0.0277252197265625, -0.01680755615234375, -0.005889892578125, 0.00502777099609375, 0.0159454345703125, 0.02686309814453125, 0.03778076171875, 0.04869842529296875, 0.0596160888671875, 0.07053375244140625, 0.081451416015625, 0.09236907958984375, 0.1032867431640625, 0.11420440673828125, 0.1251220703125, 0.13603973388671875, 0.1469573974609375, 0.15787506103515625, 0.168792724609375, 0.17971038818359375, 0.1906280517578125, 0.20154571533203125, 0.21246337890625, 0.22338104248046875, 0.2342987060546875, 0.24521636962890625, 0.256134033203125, 0.26705169677734375, 0.2779693603515625, 0.28888702392578125, 0.2998046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 6.0, 15.0, 25.0, 22.0, 32.0, 49.0, 84.0, 110.0, 158.0, 320.0, 548.0, 1171.0, 3521.0, 22202.0, 405695.0, 580135.0, 27621.0, 4065.0, 1247.0, 546.0, 342.0, 215.0, 128.0, 75.0, 57.0, 40.0, 29.0, 21.0, 11.0, 10.0, 11.0, 9.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.88818359375, -0.8604660034179688, -0.8327484130859375, -0.8050308227539062, -0.777313232421875, -0.7495956420898438, -0.7218780517578125, -0.6941604614257812, -0.66644287109375, -0.6387252807617188, -0.6110076904296875, -0.5832901000976562, -0.555572509765625, -0.5278549194335938, -0.5001373291015625, -0.47241973876953125, -0.4447021484375, -0.41698455810546875, -0.3892669677734375, -0.36154937744140625, -0.333831787109375, -0.30611419677734375, -0.2783966064453125, -0.25067901611328125, -0.22296142578125, -0.19524383544921875, -0.1675262451171875, -0.13980865478515625, -0.112091064453125, -0.08437347412109375, -0.0566558837890625, -0.02893829345703125, -0.001220703125, 0.02649688720703125, 0.0542144775390625, 0.08193206787109375, 0.109649658203125, 0.13736724853515625, 0.1650848388671875, 0.19280242919921875, 0.22052001953125, 0.24823760986328125, 0.2759552001953125, 0.30367279052734375, 0.331390380859375, 0.35910797119140625, 0.3868255615234375, 0.41454315185546875, 0.4422607421875, 0.46997833251953125, 0.4976959228515625, 0.5254135131835938, 0.553131103515625, 0.5808486938476562, 0.6085662841796875, 0.6362838745117188, 0.66400146484375, 0.6917190551757812, 0.7194366455078125, 0.7471542358398438, 0.774871826171875, 0.8025894165039062, 0.8303070068359375, 0.8580245971679688, 0.8857421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 0.0, 7.0, 5.0, 8.0, 12.0, 10.0, 11.0, 14.0, 18.0, 27.0, 42.0, 35.0, 33.0, 42.0, 50.0, 39.0, 41.0, 53.0, 43.0, 55.0, 40.0, 54.0, 58.0, 50.0, 35.0, 34.0, 30.0, 29.0, 26.0, 19.0, 18.0, 17.0, 5.0, 11.0, 6.0, 6.0, 3.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.857421875, -0.8229522705078125, -0.788482666015625, -0.7540130615234375, -0.71954345703125, -0.6850738525390625, -0.650604248046875, -0.6161346435546875, -0.5816650390625, -0.5471954345703125, -0.512725830078125, -0.4782562255859375, -0.44378662109375, -0.4093170166015625, -0.374847412109375, -0.3403778076171875, -0.305908203125, -0.2714385986328125, -0.236968994140625, -0.2024993896484375, -0.16802978515625, -0.1335601806640625, -0.099090576171875, -0.0646209716796875, -0.0301513671875, 0.0043182373046875, 0.038787841796875, 0.0732574462890625, 0.10772705078125, 0.1421966552734375, 0.176666259765625, 0.2111358642578125, 0.24560546875, 0.2800750732421875, 0.314544677734375, 0.3490142822265625, 0.38348388671875, 0.4179534912109375, 0.452423095703125, 0.4868927001953125, 0.5213623046875, 0.5558319091796875, 0.590301513671875, 0.6247711181640625, 0.65924072265625, 0.6937103271484375, 0.728179931640625, 0.7626495361328125, 0.797119140625, 0.8315887451171875, 0.866058349609375, 0.9005279541015625, 0.93499755859375, 0.9694671630859375, 1.003936767578125, 1.0384063720703125, 1.0728759765625, 1.1073455810546875, 1.141815185546875, 1.1762847900390625, 1.21075439453125, 1.2452239990234375, 1.279693603515625, 1.3141632080078125, 1.3486328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 3.0, 7.0, 5.0, 8.0, 16.0, 22.0, 47.0, 86.0, 150.0, 409.0, 1453.0, 11745.0, 910768.0, 118786.0, 3717.0, 745.0, 257.0, 117.0, 69.0, 49.0, 21.0, 21.0, 16.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4324302673339844, -0.41686248779296875, -0.4012947082519531, -0.3857269287109375, -0.3701591491699219, -0.35459136962890625, -0.3390235900878906, -0.323455810546875, -0.3078880310058594, -0.29232025146484375, -0.2767524719238281, -0.2611846923828125, -0.24561691284179688, -0.23004913330078125, -0.21448135375976562, -0.19891357421875, -0.18334579467773438, -0.16777801513671875, -0.15221023559570312, -0.1366424560546875, -0.12107467651367188, -0.10550689697265625, -0.08993911743164062, -0.074371337890625, -0.058803558349609375, -0.04323577880859375, -0.027667999267578125, -0.0121002197265625, 0.003467559814453125, 0.01903533935546875, 0.034603118896484375, 0.0501708984375, 0.06573867797851562, 0.08130645751953125, 0.09687423706054688, 0.1124420166015625, 0.12800979614257812, 0.14357757568359375, 0.15914535522460938, 0.174713134765625, 0.19028091430664062, 0.20584869384765625, 0.22141647338867188, 0.2369842529296875, 0.2525520324707031, 0.26811981201171875, 0.2836875915527344, 0.29925537109375, 0.3148231506347656, 0.33039093017578125, 0.3459587097167969, 0.3615264892578125, 0.3770942687988281, 0.39266204833984375, 0.4082298278808594, 0.423797607421875, 0.4393653869628906, 0.45493316650390625, 0.4705009460449219, 0.4860687255859375, 0.5016365051269531, 0.5172042846679688, 0.5327720642089844, 0.54833984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 7.0, 4.0, 6.0, 12.0, 19.0, 20.0, 24.0, 28.0, 56.0, 61.0, 85.0, 127.0, 95.0, 116.0, 91.0, 69.0, 43.0, 28.0, 21.0, 15.0, 14.0, 7.0, 6.0, 9.0, 4.0, 3.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.608797073364258e-05, -5.430355668067932e-05, -5.2519142627716064e-05, -5.073472857475281e-05, -4.895031452178955e-05, -4.7165900468826294e-05, -4.538148641586304e-05, -4.359707236289978e-05, -4.1812658309936523e-05, -4.0028244256973267e-05, -3.824383020401001e-05, -3.645941615104675e-05, -3.4675002098083496e-05, -3.289058804512024e-05, -3.110617399215698e-05, -2.9321759939193726e-05, -2.753734588623047e-05, -2.5752931833267212e-05, -2.3968517780303955e-05, -2.2184103727340698e-05, -2.039968967437744e-05, -1.8615275621414185e-05, -1.6830861568450928e-05, -1.5046447515487671e-05, -1.3262033462524414e-05, -1.1477619409561157e-05, -9.6932053565979e-06, -7.908791303634644e-06, -6.124377250671387e-06, -4.33996319770813e-06, -2.555549144744873e-06, -7.711350917816162e-07, 1.0132789611816406e-06, 2.7976930141448975e-06, 4.582107067108154e-06, 6.366521120071411e-06, 8.150935173034668e-06, 9.935349225997925e-06, 1.1719763278961182e-05, 1.3504177331924438e-05, 1.5288591384887695e-05, 1.7073005437850952e-05, 1.885741949081421e-05, 2.0641833543777466e-05, 2.2426247596740723e-05, 2.421066164970398e-05, 2.5995075702667236e-05, 2.7779489755630493e-05, 2.956390380859375e-05, 3.134831786155701e-05, 3.3132731914520264e-05, 3.491714596748352e-05, 3.670156002044678e-05, 3.8485974073410034e-05, 4.027038812637329e-05, 4.205480217933655e-05, 4.3839216232299805e-05, 4.562363028526306e-05, 4.740804433822632e-05, 4.9192458391189575e-05, 5.097687244415283e-05, 5.276128649711609e-05, 5.4545700550079346e-05, 5.63301146030426e-05, 5.811452865600586e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 13.0, 18.0, 21.0, 56.0, 110.0, 263.0, 869.0, 6183.0, 416733.0, 615731.0, 7060.0, 965.0, 283.0, 116.0, 62.0, 25.0, 16.0, 10.0, 5.0, 1.0, 1.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5377235412597656, -0.5232009887695312, -0.5086784362792969, -0.4941558837890625, -0.4796333312988281, -0.46511077880859375, -0.4505882263183594, -0.436065673828125, -0.4215431213378906, -0.40702056884765625, -0.3924980163574219, -0.3779754638671875, -0.3634529113769531, -0.34893035888671875, -0.3344078063964844, -0.31988525390625, -0.3053627014160156, -0.29084014892578125, -0.2763175964355469, -0.2617950439453125, -0.24727249145507812, -0.23274993896484375, -0.21822738647460938, -0.203704833984375, -0.18918228149414062, -0.17465972900390625, -0.16013717651367188, -0.1456146240234375, -0.13109207153320312, -0.11656951904296875, -0.10204696655273438, -0.0875244140625, -0.07300186157226562, -0.05847930908203125, -0.043956756591796875, -0.0294342041015625, -0.014911651611328125, -0.00038909912109375, 0.014133453369140625, 0.028656005859375, 0.043178558349609375, 0.05770111083984375, 0.07222366333007812, 0.0867462158203125, 0.10126876831054688, 0.11579132080078125, 0.13031387329101562, 0.14483642578125, 0.15935897827148438, 0.17388153076171875, 0.18840408325195312, 0.2029266357421875, 0.21744918823242188, 0.23197174072265625, 0.24649429321289062, 0.261016845703125, 0.2755393981933594, 0.29006195068359375, 0.3045845031738281, 0.3191070556640625, 0.3336296081542969, 0.34815216064453125, 0.3626747131347656, 0.377197265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 12.0, 17.0, 23.0, 34.0, 47.0, 82.0, 60.0, 114.0, 104.0, 94.0, 112.0, 70.0, 60.0, 40.0, 36.0, 29.0, 10.0, 9.0, 10.0, 7.0, 4.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.288330078125, -0.280914306640625, -0.27349853515625, -0.266082763671875, -0.2586669921875, -0.251251220703125, -0.24383544921875, -0.236419677734375, -0.22900390625, -0.221588134765625, -0.21417236328125, -0.206756591796875, -0.1993408203125, -0.191925048828125, -0.18450927734375, -0.177093505859375, -0.169677734375, -0.162261962890625, -0.15484619140625, -0.147430419921875, -0.1400146484375, -0.132598876953125, -0.12518310546875, -0.117767333984375, -0.1103515625, -0.102935791015625, -0.09552001953125, -0.088104248046875, -0.0806884765625, -0.073272705078125, -0.06585693359375, -0.058441162109375, -0.051025390625, -0.043609619140625, -0.03619384765625, -0.028778076171875, -0.0213623046875, -0.013946533203125, -0.00653076171875, 0.000885009765625, 0.00830078125, 0.015716552734375, 0.02313232421875, 0.030548095703125, 0.0379638671875, 0.045379638671875, 0.05279541015625, 0.060211181640625, 0.067626953125, 0.075042724609375, 0.08245849609375, 0.089874267578125, 0.0972900390625, 0.104705810546875, 0.11212158203125, 0.119537353515625, 0.126953125, 0.134368896484375, 0.14178466796875, 0.149200439453125, 0.1566162109375, 0.164031982421875, 0.17144775390625, 0.178863525390625, 0.186279296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 36.0, 153.0, 488.0, 241.0, 47.0, 13.0, 7.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.478628158569336, -5.1472625732421875, -4.815897464752197, -4.484532356262207, -4.153166770935059, -3.8218014240264893, -3.49043607711792, -3.1590707302093506, -2.8277053833007812, -2.496340036392212, -2.1649746894836426, -1.8336093425750732, -1.502243995666504, -1.1708786487579346, -0.8395133018493652, -0.5081479549407959, -0.17678260803222656, 0.15458273887634277, 0.4859480857849121, 0.8173134326934814, 1.1486787796020508, 1.4800441265106201, 1.8114094734191895, 2.142774820327759, 2.474140167236328, 2.8055055141448975, 3.136870861053467, 3.468236207962036, 3.7996015548706055, 4.130967140197754, 4.462332248687744, 4.793697357177734, 5.125063896179199, 5.456429481506348, 5.787794589996338, 6.119159698486328, 6.450525283813477, 6.781890869140625, 7.113255977630615, 7.4446210861206055, 7.775986671447754, 8.107352256774902, 8.438716888427734, 8.770082473754883, 9.101448059082031, 9.43281364440918, 9.764179229736328, 10.09554386138916, 10.426909446716309, 10.758275032043457, 11.089639663696289, 11.421005249023438, 11.752370834350586, 12.083736419677734, 12.415102005004883, 12.746466636657715, 13.077832221984863, 13.409197807312012, 13.740562438964844, 14.071928024291992, 14.40329360961914, 14.734659194946289, 15.066024780273438, 15.39738941192627, 15.728754997253418]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 14.0, 13.0, 7.0, 16.0, 13.0, 12.0, 29.0, 22.0, 21.0, 38.0, 45.0, 42.0, 46.0, 43.0, 58.0, 73.0, 59.0, 62.0, 57.0, 39.0, 46.0, 31.0, 28.0, 31.0, 28.0, 27.0, 18.0, 15.0, 8.0, 12.0, 7.0, 9.0, 7.0, 5.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.1485066413879395, -5.001501083374023, -4.854495525360107, -4.707489490509033, -4.560483932495117, -4.413478374481201, -4.266472816467285, -4.119467258453369, -3.972461462020874, -3.825455904006958, -3.678450107574463, -3.531444549560547, -3.384438991546631, -3.2374331951141357, -3.0904276371002197, -2.9434218406677246, -2.7964162826538086, -2.6494107246398926, -2.5024049282073975, -2.3553993701934814, -2.2083935737609863, -2.0613880157470703, -1.9143824577331543, -1.7673767805099487, -1.6203711032867432, -1.4733654260635376, -1.326359748840332, -1.179354190826416, -1.0323485136032104, -0.8853428363800049, -0.7383372187614441, -0.5913316011428833, -0.44432640075683594, -0.29732075333595276, -0.15031510591506958, -0.0033094584941864014, 0.14369618892669678, 0.29070186614990234, 0.43770748376846313, 0.5847131013870239, 0.7317187786102295, 0.8787244558334351, 1.0257301330566406, 1.1727356910705566, 1.3197413682937622, 1.4667470455169678, 1.6137526035308838, 1.7607582807540894, 1.907763957977295, 2.054769515991211, 2.201775312423706, 2.348780870437622, 2.495786666870117, 2.642792224884033, 2.789797782897949, 2.9368033409118652, 3.0838091373443604, 3.2308146953582764, 3.3778204917907715, 3.5248260498046875, 3.6718316078186035, 3.8188374042510986, 3.9658429622650146, 4.11284875869751, 4.259854316711426]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 16.0, 17.0, 41.0, 47.0, 62.0, 106.0, 188.0, 368.0, 724.0, 1593.0, 4365.0, 17276.0, 232017.0, 3456607.0, 445604.0, 25747.0, 5792.0, 1884.0, 868.0, 409.0, 223.0, 119.0, 74.0, 45.0, 32.0, 15.0, 19.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4677734375, -0.4542503356933594, -0.44072723388671875, -0.4272041320800781, -0.4136810302734375, -0.4001579284667969, -0.38663482666015625, -0.3731117248535156, -0.359588623046875, -0.3460655212402344, -0.33254241943359375, -0.3190193176269531, -0.3054962158203125, -0.2919731140136719, -0.27845001220703125, -0.2649269104003906, -0.25140380859375, -0.23788070678710938, -0.22435760498046875, -0.21083450317382812, -0.1973114013671875, -0.18378829956054688, -0.17026519775390625, -0.15674209594726562, -0.143218994140625, -0.12969589233398438, -0.11617279052734375, -0.10264968872070312, -0.0891265869140625, -0.07560348510742188, -0.06208038330078125, -0.048557281494140625, -0.0350341796875, -0.021511077880859375, -0.00798797607421875, 0.005535125732421875, 0.0190582275390625, 0.032581329345703125, 0.04610443115234375, 0.059627532958984375, 0.073150634765625, 0.08667373657226562, 0.10019683837890625, 0.11371994018554688, 0.1272430419921875, 0.14076614379882812, 0.15428924560546875, 0.16781234741210938, 0.18133544921875, 0.19485855102539062, 0.20838165283203125, 0.22190475463867188, 0.2354278564453125, 0.24895095825195312, 0.26247406005859375, 0.2759971618652344, 0.289520263671875, 0.3030433654785156, 0.31656646728515625, 0.3300895690917969, 0.3436126708984375, 0.3571357727050781, 0.37065887451171875, 0.3841819763183594, 0.397705078125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 2.0, 8.0, 4.0, 10.0, 7.0, 8.0, 12.0, 18.0, 15.0, 21.0, 27.0, 30.0, 53.0, 48.0, 41.0, 42.0, 54.0, 56.0, 54.0, 54.0, 48.0, 49.0, 34.0, 52.0, 47.0, 31.0, 37.0, 23.0, 33.0, 18.0, 11.0, 14.0, 12.0, 8.0, 9.0, 10.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.24920654296875, -0.2406005859375, -0.23199462890625, -0.223388671875, -0.21478271484375, -0.2061767578125, -0.19757080078125, -0.18896484375, -0.18035888671875, -0.1717529296875, -0.16314697265625, -0.154541015625, -0.14593505859375, -0.1373291015625, -0.12872314453125, -0.1201171875, -0.11151123046875, -0.1029052734375, -0.09429931640625, -0.085693359375, -0.07708740234375, -0.0684814453125, -0.05987548828125, -0.05126953125, -0.04266357421875, -0.0340576171875, -0.02545166015625, -0.016845703125, -0.00823974609375, 0.0003662109375, 0.00897216796875, 0.017578125, 0.02618408203125, 0.0347900390625, 0.04339599609375, 0.052001953125, 0.06060791015625, 0.0692138671875, 0.07781982421875, 0.08642578125, 0.09503173828125, 0.1036376953125, 0.11224365234375, 0.120849609375, 0.12945556640625, 0.1380615234375, 0.14666748046875, 0.1552734375, 0.16387939453125, 0.1724853515625, 0.18109130859375, 0.189697265625, 0.19830322265625, 0.2069091796875, 0.21551513671875, 0.22412109375, 0.23272705078125, 0.2413330078125, 0.24993896484375, 0.258544921875, 0.26715087890625, 0.2757568359375, 0.28436279296875, 0.29296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 21.0, 26.0, 31.0, 39.0, 59.0, 107.0, 163.0, 301.0, 583.0, 1341.0, 3933.0, 15875.0, 96728.0, 3334394.0, 682698.0, 44435.0, 8898.0, 2584.0, 1008.0, 470.0, 221.0, 123.0, 74.0, 45.0, 25.0, 22.0, 21.0, 13.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41455078125, -0.40064239501953125, -0.3867340087890625, -0.37282562255859375, -0.358917236328125, -0.34500885009765625, -0.3311004638671875, -0.31719207763671875, -0.30328369140625, -0.28937530517578125, -0.2754669189453125, -0.26155853271484375, -0.247650146484375, -0.23374176025390625, -0.2198333740234375, -0.20592498779296875, -0.1920166015625, -0.17810821533203125, -0.1641998291015625, -0.15029144287109375, -0.136383056640625, -0.12247467041015625, -0.1085662841796875, -0.09465789794921875, -0.08074951171875, -0.06684112548828125, -0.0529327392578125, -0.03902435302734375, -0.025115966796875, -0.01120758056640625, 0.0027008056640625, 0.01660919189453125, 0.030517578125, 0.04442596435546875, 0.0583343505859375, 0.07224273681640625, 0.086151123046875, 0.10005950927734375, 0.1139678955078125, 0.12787628173828125, 0.14178466796875, 0.15569305419921875, 0.1696014404296875, 0.18350982666015625, 0.197418212890625, 0.21132659912109375, 0.2252349853515625, 0.23914337158203125, 0.2530517578125, 0.26696014404296875, 0.2808685302734375, 0.29477691650390625, 0.308685302734375, 0.32259368896484375, 0.3365020751953125, 0.35041046142578125, 0.36431884765625, 0.37822723388671875, 0.3921356201171875, 0.40604400634765625, 0.419952392578125, 0.43386077880859375, 0.4477691650390625, 0.46167755126953125, 0.4755859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 2.0, 7.0, 7.0, 10.0, 14.0, 27.0, 38.0, 43.0, 73.0, 122.0, 254.0, 677.0, 1209.0, 830.0, 332.0, 141.0, 86.0, 54.0, 43.0, 36.0, 13.0, 20.0, 12.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.61328125, -0.5956039428710938, -0.5779266357421875, -0.5602493286132812, -0.542572021484375, -0.5248947143554688, -0.5072174072265625, -0.48954010009765625, -0.47186279296875, -0.45418548583984375, -0.4365081787109375, -0.41883087158203125, -0.401153564453125, -0.38347625732421875, -0.3657989501953125, -0.34812164306640625, -0.3304443359375, -0.31276702880859375, -0.2950897216796875, -0.27741241455078125, -0.259735107421875, -0.24205780029296875, -0.2243804931640625, -0.20670318603515625, -0.18902587890625, -0.17134857177734375, -0.1536712646484375, -0.13599395751953125, -0.118316650390625, -0.10063934326171875, -0.0829620361328125, -0.06528472900390625, -0.047607421875, -0.02993011474609375, -0.0122528076171875, 0.00542449951171875, 0.023101806640625, 0.04077911376953125, 0.0584564208984375, 0.07613372802734375, 0.09381103515625, 0.11148834228515625, 0.1291656494140625, 0.14684295654296875, 0.164520263671875, 0.18219757080078125, 0.1998748779296875, 0.21755218505859375, 0.2352294921875, 0.25290679931640625, 0.2705841064453125, 0.28826141357421875, 0.305938720703125, 0.32361602783203125, 0.3412933349609375, 0.35897064208984375, 0.37664794921875, 0.39432525634765625, 0.4120025634765625, 0.42967987060546875, 0.447357177734375, 0.46503448486328125, 0.4827117919921875, 0.5003890991210938, 0.51806640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 3.0, 1.0, 6.0, 16.0, 33.0, 98.0, 187.0, 220.0, 235.0, 111.0, 42.0, 15.0, 8.0, 7.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7039122581481934, -3.5741631984710693, -3.4444143772125244, -3.3146653175354004, -3.1849164962768555, -3.0551674365997314, -2.9254183769226074, -2.7956695556640625, -2.6659204959869385, -2.5361714363098145, -2.4064226150512695, -2.2766735553741455, -2.1469244956970215, -2.0171756744384766, -1.8874266147613525, -1.757677674293518, -1.6279287338256836, -1.4981797933578491, -1.3684308528900146, -1.2386817932128906, -1.1089328527450562, -0.9791839122772217, -0.8494349122047424, -0.7196859121322632, -0.5899369716644287, -0.46018800139427185, -0.330439031124115, -0.20069006085395813, -0.07094109058380127, 0.0588078498840332, 0.18855684995651245, 0.3183058500289917, 0.44805431365966797, 0.5778032541275024, 0.7075522541999817, 0.8373012542724609, 0.9670501947402954, 1.0967991352081299, 1.226548194885254, 1.3562971353530884, 1.4860460758209229, 1.6157950162887573, 1.7455439567565918, 1.8752930164337158, 2.00504207611084, 2.1347908973693848, 2.264539957046509, 2.394289016723633, 2.5240378379821777, 2.6537868976593018, 2.7835357189178467, 2.9132847785949707, 3.0430335998535156, 3.1727826595306396, 3.3025317192077637, 3.4322805404663086, 3.5620296001434326, 3.6917786598205566, 3.8215274810791016, 3.9512765407562256, 4.08102560043335, 4.2107744216918945, 4.3405232429504395, 4.470272541046143, 4.6000213623046875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 11.0, 12.0, 24.0, 19.0, 29.0, 27.0, 30.0, 39.0, 39.0, 45.0, 65.0, 64.0, 56.0, 58.0, 59.0, 59.0, 55.0, 46.0, 58.0, 44.0, 29.0, 25.0, 26.0, 21.0, 12.0, 11.0, 4.0, 8.0, 2.0, 11.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8198716640472412, -1.7408299446105957, -1.6617882251739502, -1.5827466249465942, -1.5037049055099487, -1.4246631860733032, -1.3456215858459473, -1.2665798664093018, -1.1875381469726562, -1.1084964275360107, -1.0294547080993652, -0.9504131078720093, -0.8713713884353638, -0.7923296689987183, -0.7132880091667175, -0.6342463493347168, -0.5552046298980713, -0.47616294026374817, -0.39712125062942505, -0.31807956099510193, -0.2390378713607788, -0.1599961817264557, -0.08095449209213257, -0.001912832260131836, 0.07712888717651367, 0.1561705768108368, 0.2352122664451599, 0.31425395607948303, 0.39329564571380615, 0.4723373353481293, 0.5513790249824524, 0.6304206848144531, 0.7094626426696777, 0.7885043621063232, 0.867546021938324, 0.9465876817703247, 1.0256294012069702, 1.1046711206436157, 1.1837127208709717, 1.2627544403076172, 1.3417961597442627, 1.4208378791809082, 1.4998795986175537, 1.5789211988449097, 1.6579629182815552, 1.7370046377182007, 1.8160462379455566, 1.8950879573822021, 1.9741296768188477, 2.053171396255493, 2.1322131156921387, 2.211254835128784, 2.2902965545654297, 2.369338035583496, 2.4483797550201416, 2.527421474456787, 2.6064631938934326, 2.685504913330078, 2.7645466327667236, 2.843588352203369, 2.9226298332214355, 3.001671552658081, 3.0807132720947266, 3.159754991531372, 3.2387967109680176]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 8.0, 7.0, 23.0, 24.0, 40.0, 59.0, 75.0, 150.0, 246.0, 326.0, 664.0, 1112.0, 2051.0, 3969.0, 7979.0, 16053.0, 34439.0, 74984.0, 159115.0, 276252.0, 239778.0, 122667.0, 56494.0, 26253.0, 12378.0, 6140.0, 3244.0, 1716.0, 929.0, 525.0, 314.0, 187.0, 108.0, 78.0, 52.0, 32.0, 23.0, 17.0, 15.0, 8.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.20849609375, -0.20194435119628906, -0.19539260864257812, -0.1888408660888672, -0.18228912353515625, -0.1757373809814453, -0.16918563842773438, -0.16263389587402344, -0.1560821533203125, -0.14953041076660156, -0.14297866821289062, -0.1364269256591797, -0.12987518310546875, -0.12332344055175781, -0.11677169799804688, -0.11021995544433594, -0.103668212890625, -0.09711647033691406, -0.09056472778320312, -0.08401298522949219, -0.07746124267578125, -0.07090950012207031, -0.06435775756835938, -0.05780601501464844, -0.0512542724609375, -0.04470252990722656, -0.038150787353515625, -0.03159904479980469, -0.02504730224609375, -0.018495559692382812, -0.011943817138671875, -0.0053920745849609375, 0.00115966796875, 0.0077114105224609375, 0.014263153076171875, 0.020814895629882812, 0.02736663818359375, 0.03391838073730469, 0.040470123291015625, 0.04702186584472656, 0.0535736083984375, 0.06012535095214844, 0.06667709350585938, 0.07322883605957031, 0.07978057861328125, 0.08633232116699219, 0.09288406372070312, 0.09943580627441406, 0.105987548828125, 0.11253929138183594, 0.11909103393554688, 0.1256427764892578, 0.13219451904296875, 0.1387462615966797, 0.14529800415039062, 0.15184974670410156, 0.1584014892578125, 0.16495323181152344, 0.17150497436523438, 0.1780567169189453, 0.18460845947265625, 0.1911602020263672, 0.19771194458007812, 0.20426368713378906, 0.2108154296875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 7.0, 7.0, 14.0, 7.0, 12.0, 20.0, 19.0, 18.0, 35.0, 48.0, 36.0, 47.0, 49.0, 52.0, 47.0, 50.0, 54.0, 70.0, 46.0, 55.0, 50.0, 42.0, 39.0, 30.0, 33.0, 23.0, 20.0, 17.0, 14.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2646484375, -0.2559623718261719, -0.24727630615234375, -0.23859024047851562, -0.2299041748046875, -0.22121810913085938, -0.21253204345703125, -0.20384597778320312, -0.195159912109375, -0.18647384643554688, -0.17778778076171875, -0.16910171508789062, -0.1604156494140625, -0.15172958374023438, -0.14304351806640625, -0.13435745239257812, -0.12567138671875, -0.11698532104492188, -0.10829925537109375, -0.09961318969726562, -0.0909271240234375, -0.08224105834960938, -0.07355499267578125, -0.06486892700195312, -0.056182861328125, -0.047496795654296875, -0.03881072998046875, -0.030124664306640625, -0.0214385986328125, -0.012752532958984375, -0.00406646728515625, 0.004619598388671875, 0.0133056640625, 0.021991729736328125, 0.03067779541015625, 0.039363861083984375, 0.0480499267578125, 0.056735992431640625, 0.06542205810546875, 0.07410812377929688, 0.082794189453125, 0.09148025512695312, 0.10016632080078125, 0.10885238647460938, 0.1175384521484375, 0.12622451782226562, 0.13491058349609375, 0.14359664916992188, 0.15228271484375, 0.16096878051757812, 0.16965484619140625, 0.17834091186523438, 0.1870269775390625, 0.19571304321289062, 0.20439910888671875, 0.21308517456054688, 0.221771240234375, 0.23045730590820312, 0.23914337158203125, 0.24782943725585938, 0.2565155029296875, 0.2652015686035156, 0.27388763427734375, 0.2825736999511719, 0.291259765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 12.0, 10.0, 21.0, 20.0, 33.0, 37.0, 61.0, 83.0, 101.0, 148.0, 206.0, 239.0, 432.0, 658.0, 1185.0, 3232.0, 18517.0, 479331.0, 518689.0, 18991.0, 3231.0, 1220.0, 595.0, 447.0, 294.0, 188.0, 160.0, 108.0, 90.0, 66.0, 37.0, 28.0, 21.0, 23.0, 15.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72314453125, -0.698211669921875, -0.67327880859375, -0.648345947265625, -0.6234130859375, -0.598480224609375, -0.57354736328125, -0.548614501953125, -0.523681640625, -0.498748779296875, -0.47381591796875, -0.448883056640625, -0.4239501953125, -0.399017333984375, -0.37408447265625, -0.349151611328125, -0.32421875, -0.299285888671875, -0.27435302734375, -0.249420166015625, -0.2244873046875, -0.199554443359375, -0.17462158203125, -0.149688720703125, -0.124755859375, -0.099822998046875, -0.07489013671875, -0.049957275390625, -0.0250244140625, -9.1552734375e-05, 0.02484130859375, 0.049774169921875, 0.07470703125, 0.099639892578125, 0.12457275390625, 0.149505615234375, 0.1744384765625, 0.199371337890625, 0.22430419921875, 0.249237060546875, 0.274169921875, 0.299102783203125, 0.32403564453125, 0.348968505859375, 0.3739013671875, 0.398834228515625, 0.42376708984375, 0.448699951171875, 0.4736328125, 0.498565673828125, 0.52349853515625, 0.548431396484375, 0.5733642578125, 0.598297119140625, 0.62322998046875, 0.648162841796875, 0.673095703125, 0.698028564453125, 0.72296142578125, 0.747894287109375, 0.7728271484375, 0.797760009765625, 0.82269287109375, 0.847625732421875, 0.87255859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 3.0, 5.0, 10.0, 14.0, 13.0, 22.0, 16.0, 21.0, 33.0, 33.0, 56.0, 45.0, 59.0, 42.0, 65.0, 44.0, 58.0, 48.0, 61.0, 52.0, 55.0, 39.0, 37.0, 28.0, 36.0, 27.0, 20.0, 10.0, 11.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98095703125, -0.9457473754882812, -0.9105377197265625, -0.8753280639648438, -0.840118408203125, -0.8049087524414062, -0.7696990966796875, -0.7344894409179688, -0.69927978515625, -0.6640701293945312, -0.6288604736328125, -0.5936508178710938, -0.558441162109375, -0.5232315063476562, -0.4880218505859375, -0.45281219482421875, -0.4176025390625, -0.38239288330078125, -0.3471832275390625, -0.31197357177734375, -0.276763916015625, -0.24155426025390625, -0.2063446044921875, -0.17113494873046875, -0.13592529296875, -0.10071563720703125, -0.0655059814453125, -0.03029632568359375, 0.004913330078125, 0.04012298583984375, 0.0753326416015625, 0.11054229736328125, 0.145751953125, 0.18096160888671875, 0.2161712646484375, 0.25138092041015625, 0.286590576171875, 0.32180023193359375, 0.3570098876953125, 0.39221954345703125, 0.42742919921875, 0.46263885498046875, 0.4978485107421875, 0.5330581665039062, 0.568267822265625, 0.6034774780273438, 0.6386871337890625, 0.6738967895507812, 0.7091064453125, 0.7443161010742188, 0.7795257568359375, 0.8147354125976562, 0.849945068359375, 0.8851547241210938, 0.9203643798828125, 0.9555740356445312, 0.99078369140625, 1.0259933471679688, 1.0612030029296875, 1.0964126586914062, 1.131622314453125, 1.1668319702148438, 1.2020416259765625, 1.2372512817382812, 1.2724609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 4.0, 12.0, 21.0, 45.0, 76.0, 147.0, 314.0, 928.0, 3538.0, 25962.0, 826766.0, 177600.0, 10140.0, 1924.0, 586.0, 227.0, 115.0, 66.0, 31.0, 15.0, 11.0, 13.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3134765625, -0.30446624755859375, -0.2954559326171875, -0.28644561767578125, -0.277435302734375, -0.26842498779296875, -0.2594146728515625, -0.25040435791015625, -0.24139404296875, -0.23238372802734375, -0.2233734130859375, -0.21436309814453125, -0.205352783203125, -0.19634246826171875, -0.1873321533203125, -0.17832183837890625, -0.1693115234375, -0.16030120849609375, -0.1512908935546875, -0.14228057861328125, -0.133270263671875, -0.12425994873046875, -0.1152496337890625, -0.10623931884765625, -0.09722900390625, -0.08821868896484375, -0.0792083740234375, -0.07019805908203125, -0.061187744140625, -0.05217742919921875, -0.0431671142578125, -0.03415679931640625, -0.025146484375, -0.01613616943359375, -0.0071258544921875, 0.00188446044921875, 0.010894775390625, 0.01990509033203125, 0.0289154052734375, 0.03792572021484375, 0.04693603515625, 0.05594635009765625, 0.0649566650390625, 0.07396697998046875, 0.082977294921875, 0.09198760986328125, 0.1009979248046875, 0.11000823974609375, 0.1190185546875, 0.12802886962890625, 0.1370391845703125, 0.14604949951171875, 0.155059814453125, 0.16407012939453125, 0.1730804443359375, 0.18209075927734375, 0.19110107421875, 0.20011138916015625, 0.2091217041015625, 0.21813201904296875, 0.227142333984375, 0.23615264892578125, 0.2451629638671875, 0.25417327880859375, 0.26318359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 3.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 15.0, 18.0, 28.0, 24.0, 28.0, 39.0, 57.0, 71.0, 108.0, 108.0, 97.0, 75.0, 63.0, 50.0, 33.0, 24.0, 21.0, 12.0, 13.0, 13.0, 13.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.449222564697266e-05, -6.256252527236938e-05, -6.063282489776611e-05, -5.870312452316284e-05, -5.677342414855957e-05, -5.48437237739563e-05, -5.291402339935303e-05, -5.0984323024749756e-05, -4.9054622650146484e-05, -4.712492227554321e-05, -4.519522190093994e-05, -4.326552152633667e-05, -4.13358211517334e-05, -3.940612077713013e-05, -3.7476420402526855e-05, -3.5546720027923584e-05, -3.361701965332031e-05, -3.168731927871704e-05, -2.975761890411377e-05, -2.7827918529510498e-05, -2.5898218154907227e-05, -2.3968517780303955e-05, -2.2038817405700684e-05, -2.0109117031097412e-05, -1.817941665649414e-05, -1.624971628189087e-05, -1.4320015907287598e-05, -1.2390315532684326e-05, -1.0460615158081055e-05, -8.530914783477783e-06, -6.601214408874512e-06, -4.67151403427124e-06, -2.7418136596679688e-06, -8.121132850646973e-07, 1.1175870895385742e-06, 3.0472874641418457e-06, 4.976987838745117e-06, 6.906688213348389e-06, 8.83638858795166e-06, 1.0766088962554932e-05, 1.2695789337158203e-05, 1.4625489711761475e-05, 1.6555190086364746e-05, 1.8484890460968018e-05, 2.041459083557129e-05, 2.234429121017456e-05, 2.4273991584777832e-05, 2.6203691959381104e-05, 2.8133392333984375e-05, 3.0063092708587646e-05, 3.199279308319092e-05, 3.392249345779419e-05, 3.585219383239746e-05, 3.778189420700073e-05, 3.9711594581604004e-05, 4.1641294956207275e-05, 4.357099533081055e-05, 4.550069570541382e-05, 4.743039608001709e-05, 4.936009645462036e-05, 5.128979682922363e-05, 5.3219497203826904e-05, 5.5149197578430176e-05, 5.707889795303345e-05, 5.900859832763672e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 10.0, 7.0, 12.0, 27.0, 39.0, 78.0, 116.0, 222.0, 557.0, 1529.0, 6044.0, 44924.0, 859394.0, 121037.0, 10948.0, 2238.0, 730.0, 311.0, 166.0, 81.0, 29.0, 28.0, 16.0, 9.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.222900390625, -0.21484375, -0.206787109375, -0.19873046875, -0.190673828125, -0.1826171875, -0.174560546875, -0.16650390625, -0.158447265625, -0.150390625, -0.142333984375, -0.13427734375, -0.126220703125, -0.1181640625, -0.110107421875, -0.10205078125, -0.093994140625, -0.0859375, -0.077880859375, -0.06982421875, -0.061767578125, -0.0537109375, -0.045654296875, -0.03759765625, -0.029541015625, -0.021484375, -0.013427734375, -0.00537109375, 0.002685546875, 0.0107421875, 0.018798828125, 0.02685546875, 0.034912109375, 0.04296875, 0.051025390625, 0.05908203125, 0.067138671875, 0.0751953125, 0.083251953125, 0.09130859375, 0.099365234375, 0.107421875, 0.115478515625, 0.12353515625, 0.131591796875, 0.1396484375, 0.147705078125, 0.15576171875, 0.163818359375, 0.171875, 0.179931640625, 0.18798828125, 0.196044921875, 0.2041015625, 0.212158203125, 0.22021484375, 0.228271484375, 0.236328125, 0.244384765625, 0.25244140625, 0.260498046875, 0.2685546875, 0.276611328125, 0.28466796875, 0.292724609375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 10.0, 10.0, 16.0, 18.0, 26.0, 17.0, 36.0, 48.0, 45.0, 55.0, 66.0, 67.0, 83.0, 77.0, 57.0, 70.0, 44.0, 36.0, 36.0, 29.0, 27.0, 26.0, 14.0, 16.0, 14.0, 9.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15673828125, -0.1522235870361328, -0.14770889282226562, -0.14319419860839844, -0.13867950439453125, -0.13416481018066406, -0.12965011596679688, -0.1251354217529297, -0.1206207275390625, -0.11610603332519531, -0.11159133911132812, -0.10707664489746094, -0.10256195068359375, -0.09804725646972656, -0.09353256225585938, -0.08901786804199219, -0.084503173828125, -0.07998847961425781, -0.07547378540039062, -0.07095909118652344, -0.06644439697265625, -0.06192970275878906, -0.057415008544921875, -0.05290031433105469, -0.0483856201171875, -0.04387092590332031, -0.039356231689453125, -0.03484153747558594, -0.03032684326171875, -0.025812149047851562, -0.021297454833984375, -0.016782760620117188, -0.01226806640625, -0.0077533721923828125, -0.003238677978515625, 0.0012760162353515625, 0.00579071044921875, 0.010305404663085938, 0.014820098876953125, 0.019334793090820312, 0.0238494873046875, 0.028364181518554688, 0.032878875732421875, 0.03739356994628906, 0.04190826416015625, 0.04642295837402344, 0.050937652587890625, 0.05545234680175781, 0.059967041015625, 0.06448173522949219, 0.06899642944335938, 0.07351112365722656, 0.07802581787109375, 0.08254051208496094, 0.08705520629882812, 0.09156990051269531, 0.0960845947265625, 0.10059928894042969, 0.10511398315429688, 0.10962867736816406, 0.11414337158203125, 0.11865806579589844, 0.12317276000976562, 0.1276874542236328, 0.1322021484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 9.0, 9.0, 24.0, 36.0, 83.0, 175.0, 297.0, 178.0, 94.0, 38.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.317379951477051, -5.1720967292785645, -5.026813507080078, -4.881530284881592, -4.7362470626831055, -4.590964317321777, -4.445681095123291, -4.300397872924805, -4.155114650726318, -4.009831428527832, -3.8645482063293457, -3.7192652225494385, -3.573982000350952, -3.428698778152466, -3.2834157943725586, -3.1381325721740723, -2.992849349975586, -2.8475661277770996, -2.7022829055786133, -2.556999921798706, -2.4117166996002197, -2.2664334774017334, -2.121150493621826, -1.9758672714233398, -1.8305840492248535, -1.6853008270263672, -1.5400177240371704, -1.3947346210479736, -1.2494513988494873, -1.104168176651001, -0.9588850736618042, -0.8136019706726074, -0.6683192253112793, -0.5230360627174377, -0.3777529001235962, -0.23246973752975464, -0.08718657493591309, 0.05809658765792847, 0.20337975025177002, 0.3486628532409668, 0.4939460754394531, 0.6392292380332947, 0.7845124006271362, 0.9297955632209778, 1.0750787258148193, 1.2203619480133057, 1.3656450510025024, 1.5109281539916992, 1.6562113761901855, 1.8014945983886719, 1.9467777013778687, 2.0920608043670654, 2.2373440265655518, 2.382627248764038, 2.5279102325439453, 2.6731934547424316, 2.818476676940918, 2.9637598991394043, 3.1090431213378906, 3.254326105117798, 3.399609327316284, 3.5448925495147705, 3.6901755332946777, 3.835458755493164, 3.9807419776916504]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 8.0, 8.0, 12.0, 10.0, 8.0, 14.0, 14.0, 14.0, 17.0, 17.0, 17.0, 23.0, 27.0, 27.0, 22.0, 28.0, 49.0, 45.0, 63.0, 60.0, 61.0, 40.0, 46.0, 35.0, 35.0, 31.0, 37.0, 23.0, 24.0, 25.0, 19.0, 24.0, 17.0, 11.0, 12.0, 12.0, 9.0, 8.0, 9.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 3.0], "bins": [-2.8981740474700928, -2.8045549392700195, -2.7109358310699463, -2.617316722869873, -2.523697853088379, -2.4300787448883057, -2.3364596366882324, -2.242840528488159, -2.149221420288086, -2.0556023120880127, -1.961983323097229, -1.8683642148971558, -1.774745225906372, -1.6811261177062988, -1.5875070095062256, -1.4938879013061523, -1.4002690315246582, -1.306649923324585, -1.2130309343338013, -1.119411826133728, -1.0257928371429443, -0.9321737289428711, -0.8385546207427979, -0.7449355721473694, -0.6513165235519409, -0.5576974749565125, -0.4640783965587616, -0.37045931816101074, -0.2768402695655823, -0.1832212209701538, -0.08960211277008057, 0.0040169358253479, 0.09763622283935547, 0.19125528633594513, 0.2848743498325348, 0.37849342823028564, 0.4721124768257141, 0.5657315254211426, 0.6593506336212158, 0.7529696822166443, 0.8465887308120728, 0.9402077794075012, 1.0338268280029297, 1.127445936203003, 1.2210650444030762, 1.3146840333938599, 1.408303141593933, 1.5019221305847168, 1.59554123878479, 1.6891603469848633, 1.782779335975647, 1.8763984441757202, 1.970017433166504, 2.063636541366577, 2.1572556495666504, 2.2508747577667236, 2.344493865966797, 2.43811297416687, 2.5317320823669434, 2.6253509521484375, 2.7189700603485107, 2.812589168548584, 2.9062082767486572, 2.9998273849487305, 3.0934462547302246]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 9.0, 8.0, 8.0, 9.0, 17.0, 16.0, 25.0, 37.0, 46.0, 59.0, 76.0, 88.0, 123.0, 203.0, 266.0, 459.0, 759.0, 1453.0, 3203.0, 8427.0, 26571.0, 144425.0, 1106969.0, 2360965.0, 448352.0, 63736.0, 16395.0, 5931.0, 2562.0, 1164.0, 706.0, 341.0, 257.0, 161.0, 115.0, 84.0, 61.0, 46.0, 37.0, 28.0, 16.0, 19.0, 11.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2440185546875, -0.23690032958984375, -0.2297821044921875, -0.22266387939453125, -0.215545654296875, -0.20842742919921875, -0.2013092041015625, -0.19419097900390625, -0.18707275390625, -0.17995452880859375, -0.1728363037109375, -0.16571807861328125, -0.158599853515625, -0.15148162841796875, -0.1443634033203125, -0.13724517822265625, -0.130126953125, -0.12300872802734375, -0.1158905029296875, -0.10877227783203125, -0.101654052734375, -0.09453582763671875, -0.0874176025390625, -0.08029937744140625, -0.07318115234375, -0.06606292724609375, -0.0589447021484375, -0.05182647705078125, -0.044708251953125, -0.03759002685546875, -0.0304718017578125, -0.02335357666015625, -0.0162353515625, -0.00911712646484375, -0.0019989013671875, 0.00511932373046875, 0.012237548828125, 0.01935577392578125, 0.0264739990234375, 0.03359222412109375, 0.04071044921875, 0.04782867431640625, 0.0549468994140625, 0.06206512451171875, 0.069183349609375, 0.07630157470703125, 0.0834197998046875, 0.09053802490234375, 0.09765625, 0.10477447509765625, 0.1118927001953125, 0.11901092529296875, 0.126129150390625, 0.13324737548828125, 0.1403656005859375, 0.14748382568359375, 0.15460205078125, 0.16172027587890625, 0.1688385009765625, 0.17595672607421875, 0.183074951171875, 0.19019317626953125, 0.1973114013671875, 0.20442962646484375, 0.2115478515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 15.0, 6.0, 16.0, 13.0, 16.0, 28.0, 30.0, 38.0, 38.0, 49.0, 53.0, 57.0, 73.0, 56.0, 54.0, 61.0, 60.0, 55.0, 49.0, 40.0, 49.0, 26.0, 26.0, 25.0, 15.0, 18.0, 8.0, 9.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.2731895446777344, -0.26415252685546875, -0.2551155090332031, -0.2460784912109375, -0.23704147338867188, -0.22800445556640625, -0.21896743774414062, -0.209930419921875, -0.20089340209960938, -0.19185638427734375, -0.18281936645507812, -0.1737823486328125, -0.16474533081054688, -0.15570831298828125, -0.14667129516601562, -0.13763427734375, -0.12859725952148438, -0.11956024169921875, -0.11052322387695312, -0.1014862060546875, -0.09244918823242188, -0.08341217041015625, -0.07437515258789062, -0.065338134765625, -0.056301116943359375, -0.04726409912109375, -0.038227081298828125, -0.0291900634765625, -0.020153045654296875, -0.01111602783203125, -0.002079010009765625, 0.0069580078125, 0.015995025634765625, 0.02503204345703125, 0.034069061279296875, 0.0431060791015625, 0.052143096923828125, 0.06118011474609375, 0.07021713256835938, 0.079254150390625, 0.08829116821289062, 0.09732818603515625, 0.10636520385742188, 0.1154022216796875, 0.12443923950195312, 0.13347625732421875, 0.14251327514648438, 0.15155029296875, 0.16058731079101562, 0.16962432861328125, 0.17866134643554688, 0.1876983642578125, 0.19673538208007812, 0.20577239990234375, 0.21480941772460938, 0.223846435546875, 0.23288345336914062, 0.24192047119140625, 0.2509574890136719, 0.2599945068359375, 0.2690315246582031, 0.27806854248046875, 0.2871055603027344, 0.296142578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 22.0, 25.0, 32.0, 45.0, 100.0, 215.0, 400.0, 812.0, 1981.0, 6227.0, 29650.0, 387054.0, 3591285.0, 147931.0, 19799.0, 5183.0, 1851.0, 775.0, 384.0, 199.0, 100.0, 56.0, 43.0, 33.0, 15.0, 8.0, 9.0, 11.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.3269500732421875, -0.314544677734375, -0.3021392822265625, -0.28973388671875, -0.2773284912109375, -0.264923095703125, -0.2525177001953125, -0.2401123046875, -0.2277069091796875, -0.215301513671875, -0.2028961181640625, -0.19049072265625, -0.1780853271484375, -0.165679931640625, -0.1532745361328125, -0.140869140625, -0.1284637451171875, -0.116058349609375, -0.1036529541015625, -0.09124755859375, -0.0788421630859375, -0.066436767578125, -0.0540313720703125, -0.0416259765625, -0.0292205810546875, -0.016815185546875, -0.0044097900390625, 0.00799560546875, 0.0204010009765625, 0.032806396484375, 0.0452117919921875, 0.0576171875, 0.0700225830078125, 0.082427978515625, 0.0948333740234375, 0.10723876953125, 0.1196441650390625, 0.132049560546875, 0.1444549560546875, 0.1568603515625, 0.1692657470703125, 0.181671142578125, 0.1940765380859375, 0.20648193359375, 0.2188873291015625, 0.231292724609375, 0.2436981201171875, 0.256103515625, 0.2685089111328125, 0.280914306640625, 0.2933197021484375, 0.30572509765625, 0.3181304931640625, 0.330535888671875, 0.3429412841796875, 0.3553466796875, 0.3677520751953125, 0.380157470703125, 0.3925628662109375, 0.40496826171875, 0.4173736572265625, 0.429779052734375, 0.4421844482421875, 0.45458984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 8.0, 24.0, 28.0, 49.0, 122.0, 186.0, 400.0, 904.0, 1129.0, 644.0, 267.0, 114.0, 52.0, 31.0, 34.0, 19.0, 8.0, 9.0, 11.0, 1.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.557861328125, -0.54052734375, -0.523193359375, -0.505859375, -0.488525390625, -0.47119140625, -0.453857421875, -0.4365234375, -0.419189453125, -0.40185546875, -0.384521484375, -0.3671875, -0.349853515625, -0.33251953125, -0.315185546875, -0.2978515625, -0.280517578125, -0.26318359375, -0.245849609375, -0.228515625, -0.211181640625, -0.19384765625, -0.176513671875, -0.1591796875, -0.141845703125, -0.12451171875, -0.107177734375, -0.08984375, -0.072509765625, -0.05517578125, -0.037841796875, -0.0205078125, -0.003173828125, 0.01416015625, 0.031494140625, 0.048828125, 0.066162109375, 0.08349609375, 0.100830078125, 0.1181640625, 0.135498046875, 0.15283203125, 0.170166015625, 0.1875, 0.204833984375, 0.22216796875, 0.239501953125, 0.2568359375, 0.274169921875, 0.29150390625, 0.308837890625, 0.326171875, 0.343505859375, 0.36083984375, 0.378173828125, 0.3955078125, 0.412841796875, 0.43017578125, 0.447509765625, 0.46484375, 0.482177734375, 0.49951171875, 0.516845703125, 0.5341796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 12.0, 29.0, 75.0, 174.0, 209.0, 237.0, 126.0, 72.0, 23.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.06421422958374, -4.9465765953063965, -4.828939437866211, -4.711301803588867, -4.593664169311523, -4.47602653503418, -4.358389377593994, -4.24075174331665, -4.123114585876465, -4.005476951599121, -3.8878395557403564, -3.770202159881592, -3.652564525604248, -3.5349271297454834, -3.4172897338867188, -3.299652099609375, -3.1820144653320312, -3.0643770694732666, -2.946739435195923, -2.829102039337158, -2.7114644050598145, -2.59382700920105, -2.476189613342285, -2.3585519790649414, -2.2409145832061768, -2.123277187347412, -2.0056395530700684, -1.8880021572113037, -1.7703646421432495, -1.6527271270751953, -1.5350897312164307, -1.4174522161483765, -1.2998147010803223, -1.182177186012268, -1.0645396709442139, -0.9469022750854492, -0.829264760017395, -0.7116272449493408, -0.5939897894859314, -0.476352334022522, -0.3587148189544678, -0.24107733368873596, -0.12343984842300415, -0.005802363157272339, 0.11183512210845947, 0.22947263717651367, 0.3471100926399231, 0.4647475481033325, 0.5823850631713867, 0.7000225782394409, 0.8176600337028503, 0.9352974891662598, 1.052935004234314, 1.1705725193023682, 1.2882099151611328, 1.405847430229187, 1.5234849452972412, 1.6411224603652954, 1.7587599754333496, 1.8763973712921143, 1.9940348863601685, 2.1116724014282227, 2.2293097972869873, 2.346947193145752, 2.4645848274230957]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 8.0, 6.0, 7.0, 17.0, 17.0, 17.0, 24.0, 19.0, 26.0, 30.0, 44.0, 41.0, 42.0, 49.0, 59.0, 65.0, 49.0, 50.0, 45.0, 57.0, 43.0, 35.0, 44.0, 24.0, 25.0, 32.0, 22.0, 15.0, 15.0, 17.0, 10.0, 12.0, 8.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.379817485809326, -2.3186392784118652, -2.257460832595825, -2.1962826251983643, -2.1351044178009033, -2.0739259719848633, -2.0127477645874023, -1.9515695571899414, -1.890391230583191, -1.8292129039764404, -1.7680346965789795, -1.706856369972229, -1.6456780433654785, -1.5844998359680176, -1.523321509361267, -1.4621431827545166, -1.4009649753570557, -1.3397866487503052, -1.2786084413528442, -1.2174301147460938, -1.1562519073486328, -1.0950735807418823, -1.0338952541351318, -0.9727169871330261, -0.9115387201309204, -0.8503604531288147, -0.789182186126709, -0.7280038595199585, -0.6668255925178528, -0.6056473255157471, -0.5444689989089966, -0.48329073190689087, -0.42211246490478516, -0.36093419790267944, -0.29975590109825134, -0.23857761919498444, -0.17739933729171753, -0.11622107028961182, -0.055042773485183716, 0.006135523319244385, 0.0673137903213501, 0.128492072224617, 0.1896703541278839, 0.250848650932312, 0.3120269179344177, 0.37320518493652344, 0.43438348174095154, 0.49556177854537964, 0.5567400455474854, 0.6179183125495911, 0.6790965795516968, 0.7402749061584473, 0.801453173160553, 0.8626314401626587, 0.9238097667694092, 0.9849880337715149, 1.0461663007736206, 1.107344627380371, 1.168522834777832, 1.2297011613845825, 1.290879487991333, 1.352057695388794, 1.4132360219955444, 1.474414348602295, 1.5355925559997559]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 10.0, 6.0, 7.0, 16.0, 17.0, 26.0, 32.0, 49.0, 71.0, 106.0, 172.0, 260.0, 442.0, 768.0, 1274.0, 2436.0, 4524.0, 9545.0, 21436.0, 50927.0, 126314.0, 289853.0, 304704.0, 136278.0, 55075.0, 22973.0, 10237.0, 5043.0, 2573.0, 1398.0, 755.0, 456.0, 273.0, 169.0, 104.0, 63.0, 39.0, 24.0, 31.0, 18.0, 10.0, 11.0, 7.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.265869140625, -0.25869178771972656, -0.2515144348144531, -0.2443370819091797, -0.23715972900390625, -0.2299823760986328, -0.22280502319335938, -0.21562767028808594, -0.2084503173828125, -0.20127296447753906, -0.19409561157226562, -0.1869182586669922, -0.17974090576171875, -0.1725635528564453, -0.16538619995117188, -0.15820884704589844, -0.151031494140625, -0.14385414123535156, -0.13667678833007812, -0.1294994354248047, -0.12232208251953125, -0.11514472961425781, -0.10796737670898438, -0.10079002380371094, -0.0936126708984375, -0.08643531799316406, -0.07925796508789062, -0.07208061218261719, -0.06490325927734375, -0.05772590637207031, -0.050548553466796875, -0.04337120056152344, -0.03619384765625, -0.029016494750976562, -0.021839141845703125, -0.014661788940429688, -0.00748443603515625, -0.0003070831298828125, 0.006870269775390625, 0.014047622680664062, 0.0212249755859375, 0.028402328491210938, 0.035579681396484375, 0.04275703430175781, 0.04993438720703125, 0.05711174011230469, 0.06428909301757812, 0.07146644592285156, 0.078643798828125, 0.08582115173339844, 0.09299850463867188, 0.10017585754394531, 0.10735321044921875, 0.11453056335449219, 0.12170791625976562, 0.12888526916503906, 0.1360626220703125, 0.14323997497558594, 0.15041732788085938, 0.1575946807861328, 0.16477203369140625, 0.1719493865966797, 0.17912673950195312, 0.18630409240722656, 0.1934814453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 13.0, 13.0, 17.0, 14.0, 29.0, 31.0, 29.0, 34.0, 52.0, 60.0, 61.0, 62.0, 59.0, 60.0, 54.0, 62.0, 47.0, 50.0, 60.0, 40.0, 35.0, 27.0, 20.0, 18.0, 15.0, 7.0, 8.0, 9.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.268798828125, -0.2599372863769531, -0.25107574462890625, -0.24221420288085938, -0.2333526611328125, -0.22449111938476562, -0.21562957763671875, -0.20676803588867188, -0.197906494140625, -0.18904495239257812, -0.18018341064453125, -0.17132186889648438, -0.1624603271484375, -0.15359878540039062, -0.14473724365234375, -0.13587570190429688, -0.12701416015625, -0.11815261840820312, -0.10929107666015625, -0.10042953491210938, -0.0915679931640625, -0.08270645141601562, -0.07384490966796875, -0.06498336791992188, -0.056121826171875, -0.047260284423828125, -0.03839874267578125, -0.029537200927734375, -0.0206756591796875, -0.011814117431640625, -0.00295257568359375, 0.005908966064453125, 0.0147705078125, 0.023632049560546875, 0.03249359130859375, 0.041355133056640625, 0.0502166748046875, 0.059078216552734375, 0.06793975830078125, 0.07680130004882812, 0.085662841796875, 0.09452438354492188, 0.10338592529296875, 0.11224746704101562, 0.1211090087890625, 0.12997055053710938, 0.13883209228515625, 0.14769363403320312, 0.15655517578125, 0.16541671752929688, 0.17427825927734375, 0.18313980102539062, 0.1920013427734375, 0.20086288452148438, 0.20972442626953125, 0.21858596801757812, 0.227447509765625, 0.23630905151367188, 0.24517059326171875, 0.2540321350097656, 0.2628936767578125, 0.2717552185058594, 0.28061676025390625, 0.2894783020019531, 0.29833984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 8.0, 8.0, 9.0, 21.0, 22.0, 28.0, 45.0, 50.0, 58.0, 109.0, 143.0, 192.0, 242.0, 327.0, 518.0, 875.0, 1711.0, 4832.0, 31766.0, 648754.0, 329762.0, 20877.0, 4085.0, 1525.0, 769.0, 470.0, 348.0, 270.0, 175.0, 141.0, 114.0, 89.0, 61.0, 35.0, 34.0, 21.0, 17.0, 5.0, 10.0, 7.0, 9.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.57415771484375, -0.5535888671875, -0.53302001953125, -0.512451171875, -0.49188232421875, -0.4713134765625, -0.45074462890625, -0.43017578125, -0.40960693359375, -0.3890380859375, -0.36846923828125, -0.347900390625, -0.32733154296875, -0.3067626953125, -0.28619384765625, -0.265625, -0.24505615234375, -0.2244873046875, -0.20391845703125, -0.183349609375, -0.16278076171875, -0.1422119140625, -0.12164306640625, -0.10107421875, -0.08050537109375, -0.0599365234375, -0.03936767578125, -0.018798828125, 0.00177001953125, 0.0223388671875, 0.04290771484375, 0.0634765625, 0.08404541015625, 0.1046142578125, 0.12518310546875, 0.145751953125, 0.16632080078125, 0.1868896484375, 0.20745849609375, 0.22802734375, 0.24859619140625, 0.2691650390625, 0.28973388671875, 0.310302734375, 0.33087158203125, 0.3514404296875, 0.37200927734375, 0.392578125, 0.41314697265625, 0.4337158203125, 0.45428466796875, 0.474853515625, 0.49542236328125, 0.5159912109375, 0.53656005859375, 0.55712890625, 0.57769775390625, 0.5982666015625, 0.61883544921875, 0.639404296875, 0.65997314453125, 0.6805419921875, 0.70111083984375, 0.7216796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 13.0, 12.0, 18.0, 10.0, 16.0, 26.0, 30.0, 30.0, 36.0, 38.0, 33.0, 57.0, 44.0, 58.0, 60.0, 49.0, 50.0, 52.0, 47.0, 40.0, 37.0, 33.0, 31.0, 29.0, 25.0, 27.0, 23.0, 22.0, 10.0, 6.0, 5.0, 7.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70166015625, -0.67529296875, -0.64892578125, -0.62255859375, -0.59619140625, -0.56982421875, -0.54345703125, -0.51708984375, -0.49072265625, -0.46435546875, -0.43798828125, -0.41162109375, -0.38525390625, -0.35888671875, -0.33251953125, -0.30615234375, -0.27978515625, -0.25341796875, -0.22705078125, -0.20068359375, -0.17431640625, -0.14794921875, -0.12158203125, -0.09521484375, -0.06884765625, -0.04248046875, -0.01611328125, 0.01025390625, 0.03662109375, 0.06298828125, 0.08935546875, 0.11572265625, 0.14208984375, 0.16845703125, 0.19482421875, 0.22119140625, 0.24755859375, 0.27392578125, 0.30029296875, 0.32666015625, 0.35302734375, 0.37939453125, 0.40576171875, 0.43212890625, 0.45849609375, 0.48486328125, 0.51123046875, 0.53759765625, 0.56396484375, 0.59033203125, 0.61669921875, 0.64306640625, 0.66943359375, 0.69580078125, 0.72216796875, 0.74853515625, 0.77490234375, 0.80126953125, 0.82763671875, 0.85400390625, 0.88037109375, 0.90673828125, 0.93310546875, 0.95947265625, 0.98583984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 7.0, 5.0, 8.0, 10.0, 13.0, 19.0, 22.0, 45.0, 78.0, 154.0, 364.0, 1106.0, 7554.0, 181899.0, 828228.0, 25593.0, 2389.0, 557.0, 229.0, 91.0, 56.0, 35.0, 26.0, 23.0, 16.0, 4.0, 7.0, 7.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.246826171875, -0.23865890502929688, -0.23049163818359375, -0.22232437133789062, -0.2141571044921875, -0.20598983764648438, -0.19782257080078125, -0.18965530395507812, -0.181488037109375, -0.17332077026367188, -0.16515350341796875, -0.15698623657226562, -0.1488189697265625, -0.14065170288085938, -0.13248443603515625, -0.12431716918945312, -0.11614990234375, -0.10798263549804688, -0.09981536865234375, -0.09164810180664062, -0.0834808349609375, -0.07531356811523438, -0.06714630126953125, -0.058979034423828125, -0.050811767578125, -0.042644500732421875, -0.03447723388671875, -0.026309967041015625, -0.0181427001953125, -0.009975433349609375, -0.00180816650390625, 0.006359100341796875, 0.0145263671875, 0.022693634033203125, 0.03086090087890625, 0.039028167724609375, 0.0471954345703125, 0.055362701416015625, 0.06352996826171875, 0.07169723510742188, 0.079864501953125, 0.08803176879882812, 0.09619903564453125, 0.10436630249023438, 0.1125335693359375, 0.12070083618164062, 0.12886810302734375, 0.13703536987304688, 0.14520263671875, 0.15336990356445312, 0.16153717041015625, 0.16970443725585938, 0.1778717041015625, 0.18603897094726562, 0.19420623779296875, 0.20237350463867188, 0.210540771484375, 0.21870803833007812, 0.22687530517578125, 0.23504257202148438, 0.2432098388671875, 0.2513771057128906, 0.25954437255859375, 0.2677116394042969, 0.27587890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 9.0, 5.0, 12.0, 15.0, 18.0, 31.0, 43.0, 52.0, 70.0, 105.0, 131.0, 117.0, 86.0, 88.0, 41.0, 34.0, 27.0, 19.0, 8.0, 6.0, 17.0, 10.0, 4.0, 7.0, 6.0, 4.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.687641143798828e-05, -6.476230919361115e-05, -6.264820694923401e-05, -6.053410470485687e-05, -5.8420002460479736e-05, -5.63059002161026e-05, -5.4191797971725464e-05, -5.207769572734833e-05, -4.996359348297119e-05, -4.7849491238594055e-05, -4.573538899421692e-05, -4.362128674983978e-05, -4.1507184505462646e-05, -3.939308226108551e-05, -3.7278980016708374e-05, -3.516487777233124e-05, -3.30507755279541e-05, -3.0936673283576965e-05, -2.882257103919983e-05, -2.6708468794822693e-05, -2.4594366550445557e-05, -2.248026430606842e-05, -2.0366162061691284e-05, -1.8252059817314148e-05, -1.6137957572937012e-05, -1.4023855328559875e-05, -1.190975308418274e-05, -9.795650839805603e-06, -7.681548595428467e-06, -5.5674463510513306e-06, -3.4533441066741943e-06, -1.339241862297058e-06, 7.748603820800781e-07, 2.8889626264572144e-06, 5.003064870834351e-06, 7.117167115211487e-06, 9.231269359588623e-06, 1.134537160396576e-05, 1.3459473848342896e-05, 1.5573576092720032e-05, 1.7687678337097168e-05, 1.9801780581474304e-05, 2.191588282585144e-05, 2.4029985070228577e-05, 2.6144087314605713e-05, 2.825818955898285e-05, 3.0372291803359985e-05, 3.248639404773712e-05, 3.460049629211426e-05, 3.6714598536491394e-05, 3.882870078086853e-05, 4.0942803025245667e-05, 4.30569052696228e-05, 4.517100751399994e-05, 4.7285109758377075e-05, 4.939921200275421e-05, 5.151331424713135e-05, 5.3627416491508484e-05, 5.574151873588562e-05, 5.7855620980262756e-05, 5.996972322463989e-05, 6.208382546901703e-05, 6.419792771339417e-05, 6.63120299577713e-05, 6.842613220214844e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 4.0, 6.0, 8.0, 11.0, 23.0, 20.0, 48.0, 63.0, 132.0, 206.0, 334.0, 639.0, 1481.0, 4523.0, 23280.0, 226260.0, 714068.0, 63876.0, 9161.0, 2370.0, 962.0, 458.0, 216.0, 149.0, 92.0, 50.0, 43.0, 23.0, 18.0, 12.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1873779296875, -0.1824779510498047, -0.17757797241210938, -0.17267799377441406, -0.16777801513671875, -0.16287803649902344, -0.15797805786132812, -0.1530780792236328, -0.1481781005859375, -0.1432781219482422, -0.13837814331054688, -0.13347816467285156, -0.12857818603515625, -0.12367820739746094, -0.11877822875976562, -0.11387825012207031, -0.108978271484375, -0.10407829284667969, -0.09917831420898438, -0.09427833557128906, -0.08937835693359375, -0.08447837829589844, -0.07957839965820312, -0.07467842102050781, -0.0697784423828125, -0.06487846374511719, -0.059978485107421875, -0.05507850646972656, -0.05017852783203125, -0.04527854919433594, -0.040378570556640625, -0.03547859191894531, -0.03057861328125, -0.025678634643554688, -0.020778656005859375, -0.015878677368164062, -0.01097869873046875, -0.0060787200927734375, -0.001178741455078125, 0.0037212371826171875, 0.0086212158203125, 0.013521194458007812, 0.018421173095703125, 0.023321151733398438, 0.02822113037109375, 0.03312110900878906, 0.038021087646484375, 0.04292106628417969, 0.047821044921875, 0.05272102355957031, 0.057621002197265625, 0.06252098083496094, 0.06742095947265625, 0.07232093811035156, 0.07722091674804688, 0.08212089538574219, 0.0870208740234375, 0.09192085266113281, 0.09682083129882812, 0.10172080993652344, 0.10662078857421875, 0.11152076721191406, 0.11642074584960938, 0.12132072448730469, 0.126220703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 6.0, 12.0, 14.0, 14.0, 24.0, 28.0, 33.0, 58.0, 79.0, 114.0, 121.0, 98.0, 117.0, 72.0, 64.0, 43.0, 36.0, 22.0, 21.0, 11.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26123046875, -0.255340576171875, -0.24945068359375, -0.243560791015625, -0.2376708984375, -0.231781005859375, -0.22589111328125, -0.220001220703125, -0.214111328125, -0.208221435546875, -0.20233154296875, -0.196441650390625, -0.1905517578125, -0.184661865234375, -0.17877197265625, -0.172882080078125, -0.1669921875, -0.161102294921875, -0.15521240234375, -0.149322509765625, -0.1434326171875, -0.137542724609375, -0.13165283203125, -0.125762939453125, -0.119873046875, -0.113983154296875, -0.10809326171875, -0.102203369140625, -0.0963134765625, -0.090423583984375, -0.08453369140625, -0.078643798828125, -0.07275390625, -0.066864013671875, -0.06097412109375, -0.055084228515625, -0.0491943359375, -0.043304443359375, -0.03741455078125, -0.031524658203125, -0.025634765625, -0.019744873046875, -0.01385498046875, -0.007965087890625, -0.0020751953125, 0.003814697265625, 0.00970458984375, 0.015594482421875, 0.021484375, 0.027374267578125, 0.03326416015625, 0.039154052734375, 0.0450439453125, 0.050933837890625, 0.05682373046875, 0.062713623046875, 0.068603515625, 0.074493408203125, 0.08038330078125, 0.086273193359375, 0.0921630859375, 0.098052978515625, 0.10394287109375, 0.109832763671875, 0.11572265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 14.0, 28.0, 63.0, 155.0, 339.0, 207.0, 94.0, 37.0, 18.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.472559928894043, -4.334954261779785, -4.197348594665527, -4.059742450714111, -3.9221367835998535, -3.7845311164855957, -3.646925449371338, -3.50931978225708, -3.371713876724243, -3.2341082096099854, -3.0965023040771484, -2.9588966369628906, -2.821290969848633, -2.683685064315796, -2.546079397201538, -2.408473491668701, -2.2708678245544434, -2.1332621574401855, -1.9956562519073486, -1.8580505847930908, -1.7204447984695435, -1.582839012145996, -1.4452333450317383, -1.307627558708191, -1.1700217723846436, -1.0324159860610962, -0.8948102593421936, -0.757204532623291, -0.6195987462997437, -0.4819929599761963, -0.3443872332572937, -0.2067815065383911, -0.06917619705200195, 0.06842955946922302, 0.206035315990448, 0.343641072511673, 0.48124682903289795, 0.6188526153564453, 0.7564583420753479, 0.8940640687942505, 1.0316698551177979, 1.1692756414413452, 1.3068814277648926, 1.4444870948791504, 1.5820928812026978, 1.7196986675262451, 1.857304334640503, 1.9949101209640503, 2.1325159072875977, 2.2701215744018555, 2.4077274799346924, 2.54533314704895, 2.682939052581787, 2.820544719696045, 2.9581503868103027, 3.0957560539245605, 3.2333619594573975, 3.3709676265716553, 3.508573532104492, 3.64617919921875, 3.783784866333008, 3.9213907718658447, 4.058996677398682, 4.1966023445129395, 4.334208011627197]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 8.0, 14.0, 13.0, 13.0, 15.0, 22.0, 23.0, 27.0, 30.0, 41.0, 49.0, 53.0, 59.0, 76.0, 111.0, 69.0, 63.0, 45.0, 42.0, 40.0, 27.0, 28.0, 23.0, 19.0, 19.0, 18.0, 15.0, 11.0, 10.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.347200870513916, -3.2330715656280518, -3.1189424991607666, -3.0048131942749023, -2.890684127807617, -2.776554822921753, -2.6624255180358887, -2.5482964515686035, -2.4341673851013184, -2.320038080215454, -2.205909013748169, -2.0917797088623047, -1.9776506423950195, -1.8635213375091553, -1.7493921518325806, -1.6352629661560059, -1.5211336612701416, -1.407004475593567, -1.2928752899169922, -1.178745985031128, -1.0646169185638428, -0.9504876732826233, -0.8363584280014038, -0.7222292423248291, -0.6081000566482544, -0.4939708709716797, -0.3798416554927826, -0.2657124400138855, -0.1515832543373108, -0.037454068660736084, 0.0766751766204834, 0.1908043622970581, 0.3049333095550537, 0.4190624952316284, 0.5331916809082031, 0.6473209261894226, 0.7614501118659973, 0.875579297542572, 0.9897085428237915, 1.1038377285003662, 1.217966914176941, 1.3320960998535156, 1.4462252855300903, 1.560354471206665, 1.6744837760925293, 1.7886128425598145, 1.9027421474456787, 2.016871452331543, 2.131000518798828, 2.2451298236846924, 2.3592588901519775, 2.473388195037842, 2.587517261505127, 2.701646566390991, 2.8157758712768555, 2.9299049377441406, 3.044034004211426, 3.15816330909729, 3.272292375564575, 3.3864216804504395, 3.5005507469177246, 3.614680051803589, 3.728809356689453, 3.8429384231567383, 3.9570677280426025]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 7.0, 10.0, 26.0, 38.0, 31.0, 64.0, 95.0, 148.0, 263.0, 573.0, 1607.0, 6485.0, 57089.0, 1948131.0, 2102848.0, 65662.0, 8003.0, 1824.0, 660.0, 288.0, 153.0, 79.0, 60.0, 45.0, 17.0, 24.0, 20.0, 9.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36376953125, -0.3516502380371094, -0.33953094482421875, -0.3274116516113281, -0.3152923583984375, -0.3031730651855469, -0.29105377197265625, -0.2789344787597656, -0.266815185546875, -0.2546958923339844, -0.24257659912109375, -0.23045730590820312, -0.2183380126953125, -0.20621871948242188, -0.19409942626953125, -0.18198013305664062, -0.16986083984375, -0.15774154663085938, -0.14562225341796875, -0.13350296020507812, -0.1213836669921875, -0.10926437377929688, -0.09714508056640625, -0.08502578735351562, -0.072906494140625, -0.060787200927734375, -0.04866790771484375, -0.036548614501953125, -0.0244293212890625, -0.012310028076171875, -0.00019073486328125, 0.011928558349609375, 0.0240478515625, 0.036167144775390625, 0.04828643798828125, 0.060405731201171875, 0.0725250244140625, 0.08464431762695312, 0.09676361083984375, 0.10888290405273438, 0.121002197265625, 0.13312149047851562, 0.14524078369140625, 0.15736007690429688, 0.1694793701171875, 0.18159866333007812, 0.19371795654296875, 0.20583724975585938, 0.21795654296875, 0.23007583618164062, 0.24219512939453125, 0.2543144226074219, 0.2664337158203125, 0.2785530090332031, 0.29067230224609375, 0.3027915954589844, 0.314910888671875, 0.3270301818847656, 0.33914947509765625, 0.3512687683105469, 0.3633880615234375, 0.3755073547363281, 0.38762664794921875, 0.3997459411621094, 0.411865234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 9.0, 17.0, 21.0, 20.0, 26.0, 28.0, 40.0, 43.0, 61.0, 55.0, 78.0, 80.0, 55.0, 68.0, 74.0, 50.0, 54.0, 41.0, 43.0, 37.0, 27.0, 21.0, 16.0, 11.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.263702392578125, -0.25469970703125, -0.245697021484375, -0.2366943359375, -0.227691650390625, -0.21868896484375, -0.209686279296875, -0.20068359375, -0.191680908203125, -0.18267822265625, -0.173675537109375, -0.1646728515625, -0.155670166015625, -0.14666748046875, -0.137664794921875, -0.128662109375, -0.119659423828125, -0.11065673828125, -0.101654052734375, -0.0926513671875, -0.083648681640625, -0.07464599609375, -0.065643310546875, -0.056640625, -0.047637939453125, -0.03863525390625, -0.029632568359375, -0.0206298828125, -0.011627197265625, -0.00262451171875, 0.006378173828125, 0.015380859375, 0.024383544921875, 0.03338623046875, 0.042388916015625, 0.0513916015625, 0.060394287109375, 0.06939697265625, 0.078399658203125, 0.08740234375, 0.096405029296875, 0.10540771484375, 0.114410400390625, 0.1234130859375, 0.132415771484375, 0.14141845703125, 0.150421142578125, 0.159423828125, 0.168426513671875, 0.17742919921875, 0.186431884765625, 0.1954345703125, 0.204437255859375, 0.21343994140625, 0.222442626953125, 0.2314453125, 0.240447998046875, 0.24945068359375, 0.258453369140625, 0.2674560546875, 0.276458740234375, 0.28546142578125, 0.294464111328125, 0.303466796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 6.0, 15.0, 28.0, 63.0, 125.0, 255.0, 571.0, 1952.0, 11668.0, 562236.0, 3584142.0, 27898.0, 3629.0, 1051.0, 363.0, 138.0, 73.0, 26.0, 11.0, 12.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.63232421875, -0.612030029296875, -0.59173583984375, -0.571441650390625, -0.5511474609375, -0.530853271484375, -0.51055908203125, -0.490264892578125, -0.469970703125, -0.449676513671875, -0.42938232421875, -0.409088134765625, -0.3887939453125, -0.368499755859375, -0.34820556640625, -0.327911376953125, -0.3076171875, -0.287322998046875, -0.26702880859375, -0.246734619140625, -0.2264404296875, -0.206146240234375, -0.18585205078125, -0.165557861328125, -0.145263671875, -0.124969482421875, -0.10467529296875, -0.084381103515625, -0.0640869140625, -0.043792724609375, -0.02349853515625, -0.003204345703125, 0.01708984375, 0.037384033203125, 0.05767822265625, 0.077972412109375, 0.0982666015625, 0.118560791015625, 0.13885498046875, 0.159149169921875, 0.179443359375, 0.199737548828125, 0.22003173828125, 0.240325927734375, 0.2606201171875, 0.280914306640625, 0.30120849609375, 0.321502685546875, 0.341796875, 0.362091064453125, 0.38238525390625, 0.402679443359375, 0.4229736328125, 0.443267822265625, 0.46356201171875, 0.483856201171875, 0.504150390625, 0.524444580078125, 0.54473876953125, 0.565032958984375, 0.5853271484375, 0.605621337890625, 0.62591552734375, 0.646209716796875, 0.66650390625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 13.0, 22.0, 33.0, 42.0, 104.0, 217.0, 553.0, 1135.0, 1087.0, 456.0, 200.0, 95.0, 48.0, 19.0, 13.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.559539794921875, -0.54193115234375, -0.524322509765625, -0.5067138671875, -0.489105224609375, -0.47149658203125, -0.453887939453125, -0.436279296875, -0.418670654296875, -0.40106201171875, -0.383453369140625, -0.3658447265625, -0.348236083984375, -0.33062744140625, -0.313018798828125, -0.29541015625, -0.277801513671875, -0.26019287109375, -0.242584228515625, -0.2249755859375, -0.207366943359375, -0.18975830078125, -0.172149658203125, -0.154541015625, -0.136932373046875, -0.11932373046875, -0.101715087890625, -0.0841064453125, -0.066497802734375, -0.04888916015625, -0.031280517578125, -0.013671875, 0.003936767578125, 0.02154541015625, 0.039154052734375, 0.0567626953125, 0.074371337890625, 0.09197998046875, 0.109588623046875, 0.127197265625, 0.144805908203125, 0.16241455078125, 0.180023193359375, 0.1976318359375, 0.215240478515625, 0.23284912109375, 0.250457763671875, 0.26806640625, 0.285675048828125, 0.30328369140625, 0.320892333984375, 0.3385009765625, 0.356109619140625, 0.37371826171875, 0.391326904296875, 0.408935546875, 0.426544189453125, 0.44415283203125, 0.461761474609375, 0.4793701171875, 0.496978759765625, 0.51458740234375, 0.532196044921875, 0.5498046875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 12.0, 12.0, 47.0, 185.0, 404.0, 247.0, 62.0, 17.0, 9.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7105021476745605, -4.518747329711914, -4.326992511749268, -4.135237693786621, -3.9434828758239746, -3.751728057861328, -3.5599732398986816, -3.368218421936035, -3.1764636039733887, -2.984708786010742, -2.7929539680480957, -2.601199150085449, -2.4094443321228027, -2.2176895141601562, -2.0259346961975098, -1.8341798782348633, -1.6424250602722168, -1.4506702423095703, -1.2589154243469238, -1.0671606063842773, -0.8754057884216309, -0.6836509704589844, -0.4918961524963379, -0.3001413345336914, -0.10838651657104492, 0.08336830139160156, 0.27512311935424805, 0.46687793731689453, 0.658632755279541, 0.8503875732421875, 1.042142391204834, 1.2338972091674805, 1.4256515502929688, 1.6174063682556152, 1.8091611862182617, 2.000916004180908, 2.1926708221435547, 2.384425640106201, 2.5761804580688477, 2.767935276031494, 2.9596900939941406, 3.151444911956787, 3.3431997299194336, 3.53495454788208, 3.7267093658447266, 3.918464183807373, 4.1102190017700195, 4.301973819732666, 4.4937286376953125, 4.685483455657959, 4.8772382736206055, 5.068993091583252, 5.260747909545898, 5.452502727508545, 5.644257545471191, 5.836012363433838, 6.027767181396484, 6.219521999359131, 6.411276817321777, 6.603031635284424, 6.79478645324707, 6.986541271209717, 7.178296089172363, 7.37005090713501, 7.561805725097656]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 1.0, 2.0, 4.0, 7.0, 16.0, 12.0, 17.0, 25.0, 29.0, 28.0, 40.0, 52.0, 61.0, 59.0, 49.0, 48.0, 68.0, 49.0, 60.0, 48.0, 50.0, 56.0, 34.0, 40.0, 32.0, 23.0, 16.0, 19.0, 15.0, 9.0, 9.0, 9.0, 6.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.606874465942383, -2.5371897220611572, -2.4675049781799316, -2.397820234298706, -2.3281354904174805, -2.258450746536255, -2.1887660026550293, -2.1190812587738037, -2.049396514892578, -1.9797117710113525, -1.910027027130127, -1.8403422832489014, -1.7706575393676758, -1.7009727954864502, -1.6312880516052246, -1.561603307723999, -1.4919184446334839, -1.4222337007522583, -1.3525489568710327, -1.2828642129898071, -1.2131794691085815, -1.143494725227356, -1.0738098621368408, -1.0041251182556152, -0.9344404339790344, -0.8647556900978088, -0.7950709462165833, -0.7253861427307129, -0.6557013988494873, -0.5860166549682617, -0.5163319110870361, -0.44664716720581055, -0.37696242332458496, -0.3072776794433594, -0.2375929206609726, -0.16790816187858582, -0.09822341799736023, -0.028538674116134644, 0.04114609956741333, 0.11083084344863892, 0.1805155873298645, 0.2502003312110901, 0.3198850750923157, 0.38956984877586365, 0.45925459265708923, 0.5289393663406372, 0.5986241102218628, 0.6683088541030884, 0.737993597984314, 0.8076783418655396, 0.8773630857467651, 0.9470478296279907, 1.0167325735092163, 1.086417317390442, 1.156102180480957, 1.2257869243621826, 1.2954716682434082, 1.3651564121246338, 1.4348411560058594, 1.504525899887085, 1.5742106437683105, 1.6438953876495361, 1.7135801315307617, 1.7832648754119873, 1.852949619293213]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 17.0, 18.0, 32.0, 52.0, 79.0, 137.0, 323.0, 544.0, 1305.0, 3127.0, 8953.0, 30398.0, 125894.0, 438162.0, 329125.0, 79084.0, 20514.0, 6426.0, 2271.0, 1017.0, 483.0, 233.0, 148.0, 53.0, 45.0, 26.0, 14.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.332275390625, -0.3221588134765625, -0.312042236328125, -0.3019256591796875, -0.29180908203125, -0.2816925048828125, -0.271575927734375, -0.2614593505859375, -0.2513427734375, -0.2412261962890625, -0.231109619140625, -0.2209930419921875, -0.21087646484375, -0.2007598876953125, -0.190643310546875, -0.1805267333984375, -0.17041015625, -0.1602935791015625, -0.150177001953125, -0.1400604248046875, -0.12994384765625, -0.1198272705078125, -0.109710693359375, -0.0995941162109375, -0.0894775390625, -0.0793609619140625, -0.069244384765625, -0.0591278076171875, -0.04901123046875, -0.0388946533203125, -0.028778076171875, -0.0186614990234375, -0.008544921875, 0.0015716552734375, 0.011688232421875, 0.0218048095703125, 0.03192138671875, 0.0420379638671875, 0.052154541015625, 0.0622711181640625, 0.0723876953125, 0.0825042724609375, 0.092620849609375, 0.1027374267578125, 0.11285400390625, 0.1229705810546875, 0.133087158203125, 0.1432037353515625, 0.1533203125, 0.1634368896484375, 0.173553466796875, 0.1836700439453125, 0.19378662109375, 0.2039031982421875, 0.214019775390625, 0.2241363525390625, 0.2342529296875, 0.2443695068359375, 0.254486083984375, 0.2646026611328125, 0.27471923828125, 0.2848358154296875, 0.294952392578125, 0.3050689697265625, 0.315185546875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 21.0, 21.0, 24.0, 47.0, 44.0, 49.0, 55.0, 68.0, 67.0, 74.0, 60.0, 67.0, 56.0, 43.0, 64.0, 48.0, 45.0, 31.0, 24.0, 22.0, 15.0, 7.0, 10.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.270263671875, -0.261260986328125, -0.25225830078125, -0.243255615234375, -0.2342529296875, -0.225250244140625, -0.21624755859375, -0.207244873046875, -0.1982421875, -0.189239501953125, -0.18023681640625, -0.171234130859375, -0.1622314453125, -0.153228759765625, -0.14422607421875, -0.135223388671875, -0.126220703125, -0.117218017578125, -0.10821533203125, -0.099212646484375, -0.0902099609375, -0.081207275390625, -0.07220458984375, -0.063201904296875, -0.05419921875, -0.045196533203125, -0.03619384765625, -0.027191162109375, -0.0181884765625, -0.009185791015625, -0.00018310546875, 0.008819580078125, 0.017822265625, 0.026824951171875, 0.03582763671875, 0.044830322265625, 0.0538330078125, 0.062835693359375, 0.07183837890625, 0.080841064453125, 0.08984375, 0.098846435546875, 0.10784912109375, 0.116851806640625, 0.1258544921875, 0.134857177734375, 0.14385986328125, 0.152862548828125, 0.161865234375, 0.170867919921875, 0.17987060546875, 0.188873291015625, 0.1978759765625, 0.206878662109375, 0.21588134765625, 0.224884033203125, 0.23388671875, 0.242889404296875, 0.25189208984375, 0.260894775390625, 0.2698974609375, 0.278900146484375, 0.28790283203125, 0.296905517578125, 0.305908203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 5.0, 10.0, 14.0, 3.0, 8.0, 11.0, 10.0, 32.0, 33.0, 46.0, 69.0, 72.0, 117.0, 182.0, 318.0, 603.0, 1420.0, 4335.0, 17485.0, 104056.0, 693736.0, 188225.0, 27785.0, 6213.0, 1944.0, 761.0, 366.0, 197.0, 148.0, 97.0, 54.0, 54.0, 39.0, 25.0, 18.0, 14.0, 7.0, 7.0, 11.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.399169921875, -0.38570404052734375, -0.3722381591796875, -0.35877227783203125, -0.345306396484375, -0.33184051513671875, -0.3183746337890625, -0.30490875244140625, -0.29144287109375, -0.27797698974609375, -0.2645111083984375, -0.25104522705078125, -0.237579345703125, -0.22411346435546875, -0.2106475830078125, -0.19718170166015625, -0.1837158203125, -0.17024993896484375, -0.1567840576171875, -0.14331817626953125, -0.129852294921875, -0.11638641357421875, -0.1029205322265625, -0.08945465087890625, -0.07598876953125, -0.06252288818359375, -0.0490570068359375, -0.03559112548828125, -0.022125244140625, -0.00865936279296875, 0.0048065185546875, 0.01827239990234375, 0.03173828125, 0.04520416259765625, 0.0586700439453125, 0.07213592529296875, 0.085601806640625, 0.09906768798828125, 0.1125335693359375, 0.12599945068359375, 0.13946533203125, 0.15293121337890625, 0.1663970947265625, 0.17986297607421875, 0.193328857421875, 0.20679473876953125, 0.2202606201171875, 0.23372650146484375, 0.2471923828125, 0.26065826416015625, 0.2741241455078125, 0.28759002685546875, 0.301055908203125, 0.31452178955078125, 0.3279876708984375, 0.34145355224609375, 0.35491943359375, 0.36838531494140625, 0.3818511962890625, 0.39531707763671875, 0.408782958984375, 0.42224884033203125, 0.4357147216796875, 0.44918060302734375, 0.462646484375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 13.0, 8.0, 11.0, 7.0, 6.0, 19.0, 22.0, 22.0, 24.0, 23.0, 37.0, 27.0, 44.0, 49.0, 65.0, 45.0, 51.0, 50.0, 43.0, 52.0, 40.0, 34.0, 29.0, 32.0, 33.0, 26.0, 34.0, 23.0, 17.0, 24.0, 16.0, 11.0, 11.0, 6.0, 7.0, 8.0, 7.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.62799072265625, -0.6075439453125, -0.58709716796875, -0.566650390625, -0.54620361328125, -0.5257568359375, -0.50531005859375, -0.48486328125, -0.46441650390625, -0.4439697265625, -0.42352294921875, -0.403076171875, -0.38262939453125, -0.3621826171875, -0.34173583984375, -0.3212890625, -0.30084228515625, -0.2803955078125, -0.25994873046875, -0.239501953125, -0.21905517578125, -0.1986083984375, -0.17816162109375, -0.15771484375, -0.13726806640625, -0.1168212890625, -0.09637451171875, -0.075927734375, -0.05548095703125, -0.0350341796875, -0.01458740234375, 0.005859375, 0.02630615234375, 0.0467529296875, 0.06719970703125, 0.087646484375, 0.10809326171875, 0.1285400390625, 0.14898681640625, 0.16943359375, 0.18988037109375, 0.2103271484375, 0.23077392578125, 0.251220703125, 0.27166748046875, 0.2921142578125, 0.31256103515625, 0.3330078125, 0.35345458984375, 0.3739013671875, 0.39434814453125, 0.414794921875, 0.43524169921875, 0.4556884765625, 0.47613525390625, 0.49658203125, 0.51702880859375, 0.5374755859375, 0.55792236328125, 0.578369140625, 0.59881591796875, 0.6192626953125, 0.63970947265625, 0.66015625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 6.0, 13.0, 15.0, 29.0, 51.0, 116.0, 269.0, 753.0, 2577.0, 12042.0, 82742.0, 742912.0, 179063.0, 22074.0, 4113.0, 1083.0, 367.0, 147.0, 78.0, 36.0, 25.0, 19.0, 9.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1612548828125, -0.1564655303955078, -0.15167617797851562, -0.14688682556152344, -0.14209747314453125, -0.13730812072753906, -0.13251876831054688, -0.1277294158935547, -0.1229400634765625, -0.11815071105957031, -0.11336135864257812, -0.10857200622558594, -0.10378265380859375, -0.09899330139160156, -0.09420394897460938, -0.08941459655761719, -0.084625244140625, -0.07983589172363281, -0.07504653930664062, -0.07025718688964844, -0.06546783447265625, -0.06067848205566406, -0.055889129638671875, -0.05109977722167969, -0.0463104248046875, -0.04152107238769531, -0.036731719970703125, -0.03194236755371094, -0.02715301513671875, -0.022363662719726562, -0.017574310302734375, -0.012784957885742188, -0.00799560546875, -0.0032062530517578125, 0.001583099365234375, 0.0063724517822265625, 0.01116180419921875, 0.015951156616210938, 0.020740509033203125, 0.025529861450195312, 0.0303192138671875, 0.03510856628417969, 0.039897918701171875, 0.04468727111816406, 0.04947662353515625, 0.05426597595214844, 0.059055328369140625, 0.06384468078613281, 0.068634033203125, 0.07342338562011719, 0.07821273803710938, 0.08300209045410156, 0.08779144287109375, 0.09258079528808594, 0.09737014770507812, 0.10215950012207031, 0.1069488525390625, 0.11173820495605469, 0.11652755737304688, 0.12131690979003906, 0.12610626220703125, 0.13089561462402344, 0.13568496704101562, 0.1404743194580078, 0.145263671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 12.0, 8.0, 14.0, 24.0, 20.0, 15.0, 30.0, 44.0, 61.0, 77.0, 77.0, 75.0, 79.0, 89.0, 65.0, 66.0, 54.0, 47.0, 30.0, 21.0, 25.0, 17.0, 11.0, 5.0, 3.0, 5.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.088878631591797e-05, -3.963429480791092e-05, -3.837980329990387e-05, -3.712531179189682e-05, -3.587082028388977e-05, -3.461632877588272e-05, -3.336183726787567e-05, -3.210734575986862e-05, -3.085285425186157e-05, -2.9598362743854523e-05, -2.8343871235847473e-05, -2.7089379727840424e-05, -2.5834888219833374e-05, -2.4580396711826324e-05, -2.3325905203819275e-05, -2.2071413695812225e-05, -2.0816922187805176e-05, -1.9562430679798126e-05, -1.8307939171791077e-05, -1.7053447663784027e-05, -1.5798956155776978e-05, -1.4544464647769928e-05, -1.3289973139762878e-05, -1.2035481631755829e-05, -1.078099012374878e-05, -9.52649861574173e-06, -8.27200710773468e-06, -7.017515599727631e-06, -5.763024091720581e-06, -4.5085325837135315e-06, -3.254041075706482e-06, -1.9995495676994324e-06, -7.450580596923828e-07, 5.094334483146667e-07, 1.7639249563217163e-06, 3.018416464328766e-06, 4.2729079723358154e-06, 5.527399480342865e-06, 6.7818909883499146e-06, 8.036382496356964e-06, 9.290874004364014e-06, 1.0545365512371063e-05, 1.1799857020378113e-05, 1.3054348528385162e-05, 1.4308840036392212e-05, 1.556333154439926e-05, 1.681782305240631e-05, 1.807231456041336e-05, 1.932680606842041e-05, 2.058129757642746e-05, 2.183578908443451e-05, 2.309028059244156e-05, 2.434477210044861e-05, 2.5599263608455658e-05, 2.6853755116462708e-05, 2.8108246624469757e-05, 2.9362738132476807e-05, 3.0617229640483856e-05, 3.1871721148490906e-05, 3.3126212656497955e-05, 3.4380704164505005e-05, 3.5635195672512054e-05, 3.6889687180519104e-05, 3.8144178688526154e-05, 3.93986701965332e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 8.0, 18.0, 28.0, 30.0, 74.0, 114.0, 216.0, 507.0, 1433.0, 5988.0, 35643.0, 358562.0, 592340.0, 44064.0, 6808.0, 1656.0, 534.0, 235.0, 119.0, 73.0, 32.0, 20.0, 12.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1549072265625, -0.1499176025390625, -0.144927978515625, -0.1399383544921875, -0.13494873046875, -0.1299591064453125, -0.124969482421875, -0.1199798583984375, -0.114990234375, -0.1100006103515625, -0.105010986328125, -0.1000213623046875, -0.09503173828125, -0.0900421142578125, -0.085052490234375, -0.0800628662109375, -0.0750732421875, -0.0700836181640625, -0.065093994140625, -0.0601043701171875, -0.05511474609375, -0.0501251220703125, -0.045135498046875, -0.0401458740234375, -0.03515625, -0.0301666259765625, -0.025177001953125, -0.0201873779296875, -0.01519775390625, -0.0102081298828125, -0.005218505859375, -0.0002288818359375, 0.0047607421875, 0.0097503662109375, 0.014739990234375, 0.0197296142578125, 0.02471923828125, 0.0297088623046875, 0.034698486328125, 0.0396881103515625, 0.044677734375, 0.0496673583984375, 0.054656982421875, 0.0596466064453125, 0.06463623046875, 0.0696258544921875, 0.074615478515625, 0.0796051025390625, 0.0845947265625, 0.0895843505859375, 0.094573974609375, 0.0995635986328125, 0.10455322265625, 0.1095428466796875, 0.114532470703125, 0.1195220947265625, 0.12451171875, 0.1295013427734375, 0.134490966796875, 0.1394805908203125, 0.14447021484375, 0.1494598388671875, 0.154449462890625, 0.1594390869140625, 0.1644287109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 5.0, 17.0, 15.0, 29.0, 24.0, 50.0, 56.0, 64.0, 80.0, 103.0, 92.0, 99.0, 78.0, 61.0, 60.0, 44.0, 31.0, 25.0, 11.0, 7.0, 10.0, 7.0, 4.0, 8.0, 1.0, 4.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1793212890625, -0.17478561401367188, -0.17024993896484375, -0.16571426391601562, -0.1611785888671875, -0.15664291381835938, -0.15210723876953125, -0.14757156372070312, -0.143035888671875, -0.13850021362304688, -0.13396453857421875, -0.12942886352539062, -0.1248931884765625, -0.12035751342773438, -0.11582183837890625, -0.11128616333007812, -0.10675048828125, -0.10221481323242188, -0.09767913818359375, -0.09314346313476562, -0.0886077880859375, -0.08407211303710938, -0.07953643798828125, -0.07500076293945312, -0.070465087890625, -0.06592941284179688, -0.06139373779296875, -0.056858062744140625, -0.0523223876953125, -0.047786712646484375, -0.04325103759765625, -0.038715362548828125, -0.0341796875, -0.029644012451171875, -0.02510833740234375, -0.020572662353515625, -0.0160369873046875, -0.011501312255859375, -0.00696563720703125, -0.002429962158203125, 0.002105712890625, 0.006641387939453125, 0.01117706298828125, 0.015712738037109375, 0.0202484130859375, 0.024784088134765625, 0.02931976318359375, 0.033855438232421875, 0.03839111328125, 0.042926788330078125, 0.04746246337890625, 0.051998138427734375, 0.0565338134765625, 0.061069488525390625, 0.06560516357421875, 0.07014083862304688, 0.074676513671875, 0.07921218872070312, 0.08374786376953125, 0.08828353881835938, 0.0928192138671875, 0.09735488891601562, 0.10189056396484375, 0.10642623901367188, 0.1109619140625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 12.0, 12.0, 41.0, 109.0, 297.0, 272.0, 136.0, 51.0, 24.0, 15.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.741288185119629, -2.6102638244628906, -2.4792394638061523, -2.348215103149414, -2.217190742492676, -2.0861663818359375, -1.9551421403884888, -1.8241177797317505, -1.6930934190750122, -1.562069058418274, -1.4310446977615356, -1.300020456314087, -1.1689960956573486, -1.0379717350006104, -0.9069473743438721, -0.7759230136871338, -0.6448986530303955, -0.5138742923736572, -0.38284996151924133, -0.25182563066482544, -0.12080127000808716, 0.010223090648651123, 0.14124739170074463, 0.2722717523574829, 0.4032961130142212, 0.5343204736709595, 0.6653448343276978, 0.7963691353797913, 0.9273934960365295, 1.058417797088623, 1.1894421577453613, 1.3204665184020996, 1.451490879058838, 1.5825152397155762, 1.7135396003723145, 1.8445639610290527, 1.975588321685791, 2.1066126823425293, 2.2376370429992676, 2.368661403656006, 2.499685764312744, 2.6307101249694824, 2.7617344856262207, 2.892758846282959, 3.0237832069396973, 3.1548075675964355, 3.285831928253174, 3.416856288909912, 3.5478804111480713, 3.6789047718048096, 3.809929132461548, 3.940953493118286, 4.071977615356445, 4.203001976013184, 4.334026336669922, 4.46505069732666, 4.596075057983398, 4.727099418640137, 4.858123779296875, 4.989148139953613, 5.120172500610352, 5.25119686126709, 5.382221221923828, 5.513245582580566, 5.644269943237305]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 12.0, 3.0, 5.0, 9.0, 13.0, 13.0, 20.0, 18.0, 22.0, 33.0, 24.0, 20.0, 28.0, 50.0, 48.0, 68.0, 71.0, 83.0, 82.0, 46.0, 45.0, 32.0, 46.0, 28.0, 20.0, 28.0, 26.0, 23.0, 15.0, 10.0, 16.0, 11.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7512314319610596, -2.662660598754883, -2.574089765548706, -2.4855189323425293, -2.3969478607177734, -2.3083770275115967, -2.21980619430542, -2.131235361099243, -2.0426645278930664, -1.9540936946868896, -1.865522861480713, -1.7769519090652466, -1.6883810758590698, -1.599810242652893, -1.5112392902374268, -1.42266845703125, -1.3340976238250732, -1.2455267906188965, -1.1569559574127197, -1.0683850049972534, -0.9798141717910767, -0.8912433385848999, -0.8026724457740784, -0.7141015529632568, -0.6255307197570801, -0.5369598865509033, -0.4483889937400818, -0.35981813073158264, -0.2712472677230835, -0.18267640471458435, -0.0941055417060852, -0.005534648895263672, 0.08303594589233398, 0.17160680890083313, 0.2601776719093323, 0.3487485349178314, 0.43731939792633057, 0.5258902311325073, 0.6144611239433289, 0.7030320167541504, 0.7916028499603271, 0.8801736831665039, 0.9687445759773254, 1.057315468788147, 1.1458863019943237, 1.2344571352005005, 1.3230280876159668, 1.4115989208221436, 1.5001697540283203, 1.588740587234497, 1.6773114204406738, 1.7658823728561401, 1.854453206062317, 1.9430240392684937, 2.03159499168396, 2.1201658248901367, 2.2087366580963135, 2.2973074913024902, 2.385878324508667, 2.4744491577148438, 2.5630202293395996, 2.6515910625457764, 2.740161895751953, 2.82873272895813, 2.9173035621643066]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 11.0, 8.0, 14.0, 23.0, 31.0, 30.0, 52.0, 82.0, 142.0, 211.0, 362.0, 641.0, 1375.0, 3330.0, 9631.0, 44013.0, 377073.0, 2360043.0, 1218643.0, 143936.0, 23383.0, 6474.0, 2433.0, 989.0, 490.0, 284.0, 202.0, 121.0, 74.0, 61.0, 37.0, 28.0, 14.0, 11.0, 9.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.205322265625, -0.1984272003173828, -0.19153213500976562, -0.18463706970214844, -0.17774200439453125, -0.17084693908691406, -0.16395187377929688, -0.1570568084716797, -0.1501617431640625, -0.1432666778564453, -0.13637161254882812, -0.12947654724121094, -0.12258148193359375, -0.11568641662597656, -0.10879135131835938, -0.10189628601074219, -0.095001220703125, -0.08810615539550781, -0.08121109008789062, -0.07431602478027344, -0.06742095947265625, -0.06052589416503906, -0.053630828857421875, -0.04673576354980469, -0.0398406982421875, -0.03294563293457031, -0.026050567626953125, -0.019155502319335938, -0.01226043701171875, -0.0053653717041015625, 0.001529693603515625, 0.008424758911132812, 0.01531982421875, 0.022214889526367188, 0.029109954833984375, 0.03600502014160156, 0.04290008544921875, 0.04979515075683594, 0.056690216064453125, 0.06358528137207031, 0.0704803466796875, 0.07737541198730469, 0.08427047729492188, 0.09116554260253906, 0.09806060791015625, 0.10495567321777344, 0.11185073852539062, 0.11874580383300781, 0.125640869140625, 0.1325359344482422, 0.13943099975585938, 0.14632606506347656, 0.15322113037109375, 0.16011619567871094, 0.16701126098632812, 0.1739063262939453, 0.1808013916015625, 0.1876964569091797, 0.19459152221679688, 0.20148658752441406, 0.20838165283203125, 0.21527671813964844, 0.22217178344726562, 0.2290668487548828, 0.2359619140625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 3.0, 10.0, 8.0, 17.0, 24.0, 19.0, 27.0, 38.0, 55.0, 55.0, 75.0, 67.0, 65.0, 79.0, 81.0, 70.0, 54.0, 53.0, 45.0, 48.0, 28.0, 24.0, 22.0, 14.0, 7.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.2565345764160156, -0.24744415283203125, -0.23835372924804688, -0.2292633056640625, -0.22017288208007812, -0.21108245849609375, -0.20199203491210938, -0.192901611328125, -0.18381118774414062, -0.17472076416015625, -0.16563034057617188, -0.1565399169921875, -0.14744949340820312, -0.13835906982421875, -0.12926864624023438, -0.12017822265625, -0.11108779907226562, -0.10199737548828125, -0.09290695190429688, -0.0838165283203125, -0.07472610473632812, -0.06563568115234375, -0.056545257568359375, -0.047454833984375, -0.038364410400390625, -0.02927398681640625, -0.020183563232421875, -0.0110931396484375, -0.002002716064453125, 0.00708770751953125, 0.016178131103515625, 0.0252685546875, 0.034358978271484375, 0.04344940185546875, 0.052539825439453125, 0.0616302490234375, 0.07072067260742188, 0.07981109619140625, 0.08890151977539062, 0.097991943359375, 0.10708236694335938, 0.11617279052734375, 0.12526321411132812, 0.1343536376953125, 0.14344406127929688, 0.15253448486328125, 0.16162490844726562, 0.17071533203125, 0.17980575561523438, 0.18889617919921875, 0.19798660278320312, 0.2070770263671875, 0.21616744995117188, 0.22525787353515625, 0.23434829711914062, 0.243438720703125, 0.2525291442871094, 0.26161956787109375, 0.2707099914550781, 0.2798004150390625, 0.2888908386230469, 0.29798126220703125, 0.3070716857910156, 0.316162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 13.0, 18.0, 22.0, 52.0, 111.0, 296.0, 837.0, 3742.0, 63409.0, 3996318.0, 123052.0, 4890.0, 950.0, 328.0, 121.0, 49.0, 19.0, 26.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.638671875, -0.6190643310546875, -0.599456787109375, -0.5798492431640625, -0.56024169921875, -0.5406341552734375, -0.521026611328125, -0.5014190673828125, -0.4818115234375, -0.4622039794921875, -0.442596435546875, -0.4229888916015625, -0.40338134765625, -0.3837738037109375, -0.364166259765625, -0.3445587158203125, -0.324951171875, -0.3053436279296875, -0.285736083984375, -0.2661285400390625, -0.24652099609375, -0.2269134521484375, -0.207305908203125, -0.1876983642578125, -0.1680908203125, -0.1484832763671875, -0.128875732421875, -0.1092681884765625, -0.08966064453125, -0.0700531005859375, -0.050445556640625, -0.0308380126953125, -0.01123046875, 0.0083770751953125, 0.027984619140625, 0.0475921630859375, 0.06719970703125, 0.0868072509765625, 0.106414794921875, 0.1260223388671875, 0.1456298828125, 0.1652374267578125, 0.184844970703125, 0.2044525146484375, 0.22406005859375, 0.2436676025390625, 0.263275146484375, 0.2828826904296875, 0.302490234375, 0.3220977783203125, 0.341705322265625, 0.3613128662109375, 0.38092041015625, 0.4005279541015625, 0.420135498046875, 0.4397430419921875, 0.4593505859375, 0.4789581298828125, 0.498565673828125, 0.5181732177734375, 0.53778076171875, 0.5573883056640625, 0.576995849609375, 0.5966033935546875, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 5.0, 5.0, 6.0, 7.0, 6.0, 18.0, 37.0, 55.0, 69.0, 106.0, 196.0, 362.0, 670.0, 820.0, 711.0, 418.0, 245.0, 123.0, 76.0, 53.0, 33.0, 21.0, 13.0, 5.0, 5.0, 1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38037109375, -0.36904144287109375, -0.3577117919921875, -0.34638214111328125, -0.335052490234375, -0.32372283935546875, -0.3123931884765625, -0.30106353759765625, -0.28973388671875, -0.27840423583984375, -0.2670745849609375, -0.25574493408203125, -0.244415283203125, -0.23308563232421875, -0.2217559814453125, -0.21042633056640625, -0.1990966796875, -0.18776702880859375, -0.1764373779296875, -0.16510772705078125, -0.153778076171875, -0.14244842529296875, -0.1311187744140625, -0.11978912353515625, -0.10845947265625, -0.09712982177734375, -0.0858001708984375, -0.07447052001953125, -0.063140869140625, -0.05181121826171875, -0.0404815673828125, -0.02915191650390625, -0.017822265625, -0.00649261474609375, 0.0048370361328125, 0.01616668701171875, 0.027496337890625, 0.03882598876953125, 0.0501556396484375, 0.06148529052734375, 0.07281494140625, 0.08414459228515625, 0.0954742431640625, 0.10680389404296875, 0.118133544921875, 0.12946319580078125, 0.1407928466796875, 0.15212249755859375, 0.1634521484375, 0.17478179931640625, 0.1861114501953125, 0.19744110107421875, 0.208770751953125, 0.22010040283203125, 0.2314300537109375, 0.24275970458984375, 0.25408935546875, 0.26541900634765625, 0.2767486572265625, 0.28807830810546875, 0.299407958984375, 0.31073760986328125, 0.3220672607421875, 0.33339691162109375, 0.3447265625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 16.0, 63.0, 147.0, 260.0, 260.0, 132.0, 67.0, 28.0, 14.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.03072452545166, -5.904982566833496, -5.779240131378174, -5.65349817276001, -5.527756214141846, -5.402013778686523, -5.276271820068359, -5.150529861450195, -5.024787902832031, -4.899045944213867, -4.773303508758545, -4.647561550140381, -4.521819591522217, -4.3960771560668945, -4.2703351974487305, -4.144593238830566, -4.018850803375244, -3.893108606338501, -3.767366647720337, -3.6416244506835938, -3.5158824920654297, -3.3901402950286865, -3.2643980979919434, -3.1386561393737793, -3.012913942337036, -2.887171745300293, -2.761429786682129, -2.6356875896453857, -2.5099453926086426, -2.3842034339904785, -2.2584612369537354, -2.132719039916992, -2.006977081298828, -1.8812350034713745, -1.755492925643921, -1.6297507286071777, -1.5040086507797241, -1.3782665729522705, -1.2525243759155273, -1.1267822980880737, -1.0010402202606201, -0.8752981424331665, -0.7495560050010681, -0.6238138675689697, -0.4980717897415161, -0.3723297119140625, -0.2465875744819641, -0.12084543704986572, 0.004896640777587891, 0.1306387484073639, 0.2563808560371399, 0.3821229636669159, 0.5078650712966919, 0.6336071491241455, 0.7593492865562439, 0.8850914239883423, 1.010833501815796, 1.1365755796432495, 1.2623176574707031, 1.3880598545074463, 1.5138019323349, 1.6395440101623535, 1.7652862071990967, 1.8910282850265503, 2.016770362854004]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 3.0, 4.0, 9.0, 15.0, 11.0, 10.0, 16.0, 16.0, 16.0, 28.0, 20.0, 30.0, 49.0, 41.0, 41.0, 46.0, 50.0, 56.0, 69.0, 45.0, 45.0, 58.0, 35.0, 47.0, 27.0, 36.0, 33.0, 24.0, 16.0, 16.0, 17.0, 19.0, 5.0, 9.0, 7.0, 5.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4121918678283691, -1.3658236265182495, -1.3194552659988403, -1.2730870246887207, -1.2267186641693115, -1.180350422859192, -1.1339821815490723, -1.087613821029663, -1.041245460510254, -0.9948771595954895, -0.9485088586807251, -0.9021406173706055, -0.8557722568511963, -0.8094040155410767, -0.7630357146263123, -0.7166674137115479, -0.6702991724014282, -0.6239308714866638, -0.5775625705718994, -0.5311943292617798, -0.484825998544693, -0.4384576976299286, -0.3920894265174866, -0.34572112560272217, -0.29935282468795776, -0.25298452377319336, -0.20661623775959015, -0.16024795174598694, -0.11387965083122253, -0.06751134991645813, -0.021143078804016113, 0.02522522211074829, 0.07159340381622314, 0.11796169728040695, 0.16432999074459076, 0.21069827675819397, 0.2570665776729584, 0.3034348785877228, 0.3498031497001648, 0.3961714506149292, 0.4425397515296936, 0.488908052444458, 0.5352763533592224, 0.5816446542739868, 0.6280128955841064, 0.6743812561035156, 0.7207494974136353, 0.7671177983283997, 0.8134860992431641, 0.8598544001579285, 0.9062227010726929, 0.9525909423828125, 0.9989593029022217, 1.0453275442123413, 1.091695785522461, 1.1380641460418701, 1.1844325065612793, 1.230800747871399, 1.277169108390808, 1.3235373497009277, 1.369905710220337, 1.4162739515304565, 1.4626421928405762, 1.5090105533599854, 1.555378794670105]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 10.0, 6.0, 15.0, 12.0, 26.0, 40.0, 69.0, 82.0, 120.0, 161.0, 235.0, 423.0, 758.0, 1434.0, 2821.0, 6093.0, 14520.0, 37390.0, 103375.0, 287266.0, 358851.0, 147177.0, 52044.0, 19799.0, 8228.0, 3647.0, 1669.0, 914.0, 508.0, 280.0, 196.0, 137.0, 65.0, 48.0, 35.0, 33.0, 14.0, 12.0, 7.0, 8.0, 13.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20068359375, -0.194244384765625, -0.18780517578125, -0.181365966796875, -0.1749267578125, -0.168487548828125, -0.16204833984375, -0.155609130859375, -0.149169921875, -0.142730712890625, -0.13629150390625, -0.129852294921875, -0.1234130859375, -0.116973876953125, -0.11053466796875, -0.104095458984375, -0.09765625, -0.091217041015625, -0.08477783203125, -0.078338623046875, -0.0718994140625, -0.065460205078125, -0.05902099609375, -0.052581787109375, -0.046142578125, -0.039703369140625, -0.03326416015625, -0.026824951171875, -0.0203857421875, -0.013946533203125, -0.00750732421875, -0.001068115234375, 0.00537109375, 0.011810302734375, 0.01824951171875, 0.024688720703125, 0.0311279296875, 0.037567138671875, 0.04400634765625, 0.050445556640625, 0.056884765625, 0.063323974609375, 0.06976318359375, 0.076202392578125, 0.0826416015625, 0.089080810546875, 0.09552001953125, 0.101959228515625, 0.1083984375, 0.114837646484375, 0.12127685546875, 0.127716064453125, 0.1341552734375, 0.140594482421875, 0.14703369140625, 0.153472900390625, 0.159912109375, 0.166351318359375, 0.17279052734375, 0.179229736328125, 0.1856689453125, 0.192108154296875, 0.19854736328125, 0.204986572265625, 0.21142578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 7.0, 10.0, 22.0, 19.0, 27.0, 39.0, 45.0, 48.0, 64.0, 76.0, 88.0, 65.0, 74.0, 55.0, 57.0, 64.0, 48.0, 48.0, 28.0, 30.0, 30.0, 11.0, 19.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265625, -0.2566871643066406, -0.24774932861328125, -0.23881149291992188, -0.2298736572265625, -0.22093582153320312, -0.21199798583984375, -0.20306015014648438, -0.194122314453125, -0.18518447875976562, -0.17624664306640625, -0.16730880737304688, -0.1583709716796875, -0.14943313598632812, -0.14049530029296875, -0.13155746459960938, -0.12261962890625, -0.11368179321289062, -0.10474395751953125, -0.09580612182617188, -0.0868682861328125, -0.07793045043945312, -0.06899261474609375, -0.060054779052734375, -0.051116943359375, -0.042179107666015625, -0.03324127197265625, -0.024303436279296875, -0.0153656005859375, -0.006427764892578125, 0.00251007080078125, 0.011447906494140625, 0.0203857421875, 0.029323577880859375, 0.03826141357421875, 0.047199249267578125, 0.0561370849609375, 0.06507492065429688, 0.07401275634765625, 0.08295059204101562, 0.091888427734375, 0.10082626342773438, 0.10976409912109375, 0.11870193481445312, 0.1276397705078125, 0.13657760620117188, 0.14551544189453125, 0.15445327758789062, 0.16339111328125, 0.17232894897460938, 0.18126678466796875, 0.19020462036132812, 0.1991424560546875, 0.20808029174804688, 0.21701812744140625, 0.22595596313476562, 0.234893798828125, 0.24383163452148438, 0.25276947021484375, 0.2617073059082031, 0.2706451416015625, 0.2795829772949219, 0.28852081298828125, 0.2974586486816406, 0.306396484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 7.0, 8.0, 7.0, 15.0, 11.0, 16.0, 25.0, 37.0, 31.0, 52.0, 81.0, 130.0, 148.0, 213.0, 307.0, 445.0, 737.0, 1569.0, 4468.0, 20885.0, 185139.0, 749846.0, 68463.0, 10148.0, 2696.0, 1128.0, 577.0, 372.0, 281.0, 198.0, 148.0, 85.0, 67.0, 56.0, 30.0, 33.0, 23.0, 16.0, 9.0, 7.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.47900390625, -0.46503448486328125, -0.4510650634765625, -0.43709564208984375, -0.423126220703125, -0.40915679931640625, -0.3951873779296875, -0.38121795654296875, -0.36724853515625, -0.35327911376953125, -0.3393096923828125, -0.32534027099609375, -0.311370849609375, -0.29740142822265625, -0.2834320068359375, -0.26946258544921875, -0.2554931640625, -0.24152374267578125, -0.2275543212890625, -0.21358489990234375, -0.199615478515625, -0.18564605712890625, -0.1716766357421875, -0.15770721435546875, -0.14373779296875, -0.12976837158203125, -0.1157989501953125, -0.10182952880859375, -0.087860107421875, -0.07389068603515625, -0.0599212646484375, -0.04595184326171875, -0.031982421875, -0.01801300048828125, -0.0040435791015625, 0.00992584228515625, 0.023895263671875, 0.03786468505859375, 0.0518341064453125, 0.06580352783203125, 0.07977294921875, 0.09374237060546875, 0.1077117919921875, 0.12168121337890625, 0.135650634765625, 0.14962005615234375, 0.1635894775390625, 0.17755889892578125, 0.1915283203125, 0.20549774169921875, 0.2194671630859375, 0.23343658447265625, 0.247406005859375, 0.26137542724609375, 0.2753448486328125, 0.28931427001953125, 0.30328369140625, 0.31725311279296875, 0.3312225341796875, 0.34519195556640625, 0.359161376953125, 0.37313079833984375, 0.3871002197265625, 0.40106964111328125, 0.4150390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 13.0, 13.0, 16.0, 21.0, 24.0, 33.0, 37.0, 28.0, 49.0, 47.0, 61.0, 77.0, 53.0, 61.0, 63.0, 53.0, 50.0, 50.0, 39.0, 36.0, 29.0, 26.0, 20.0, 19.0, 16.0, 8.0, 7.0, 9.0, 8.0, 8.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7920150756835938, -0.7681121826171875, -0.7442092895507812, -0.720306396484375, -0.6964035034179688, -0.6725006103515625, -0.6485977172851562, -0.62469482421875, -0.6007919311523438, -0.5768890380859375, -0.5529861450195312, -0.529083251953125, -0.5051803588867188, -0.4812774658203125, -0.45737457275390625, -0.4334716796875, -0.40956878662109375, -0.3856658935546875, -0.36176300048828125, -0.337860107421875, -0.31395721435546875, -0.2900543212890625, -0.26615142822265625, -0.24224853515625, -0.21834564208984375, -0.1944427490234375, -0.17053985595703125, -0.146636962890625, -0.12273406982421875, -0.0988311767578125, -0.07492828369140625, -0.051025390625, -0.02712249755859375, -0.0032196044921875, 0.02068328857421875, 0.044586181640625, 0.06848907470703125, 0.0923919677734375, 0.11629486083984375, 0.14019775390625, 0.16410064697265625, 0.1880035400390625, 0.21190643310546875, 0.235809326171875, 0.25971221923828125, 0.2836151123046875, 0.30751800537109375, 0.3314208984375, 0.35532379150390625, 0.3792266845703125, 0.40312957763671875, 0.427032470703125, 0.45093536376953125, 0.4748382568359375, 0.49874114990234375, 0.52264404296875, 0.5465469360351562, 0.5704498291015625, 0.5943527221679688, 0.618255615234375, 0.6421585083007812, 0.6660614013671875, 0.6899642944335938, 0.7138671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 13.0, 13.0, 10.0, 24.0, 18.0, 54.0, 100.0, 168.0, 312.0, 725.0, 2059.0, 6908.0, 29040.0, 169001.0, 737141.0, 80028.0, 16109.0, 4292.0, 1356.0, 553.0, 260.0, 130.0, 74.0, 43.0, 25.0, 17.0, 15.0, 13.0, 13.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.107666015625, -0.10372352600097656, -0.09978103637695312, -0.09583854675292969, -0.09189605712890625, -0.08795356750488281, -0.08401107788085938, -0.08006858825683594, -0.0761260986328125, -0.07218360900878906, -0.06824111938476562, -0.06429862976074219, -0.06035614013671875, -0.05641365051269531, -0.052471160888671875, -0.04852867126464844, -0.044586181640625, -0.04064369201660156, -0.036701202392578125, -0.03275871276855469, -0.02881622314453125, -0.024873733520507812, -0.020931243896484375, -0.016988754272460938, -0.0130462646484375, -0.009103775024414062, -0.005161285400390625, -0.0012187957763671875, 0.00272369384765625, 0.0066661834716796875, 0.010608673095703125, 0.014551162719726562, 0.01849365234375, 0.022436141967773438, 0.026378631591796875, 0.030321121215820312, 0.03426361083984375, 0.03820610046386719, 0.042148590087890625, 0.04609107971191406, 0.0500335693359375, 0.05397605895996094, 0.057918548583984375, 0.06186103820800781, 0.06580352783203125, 0.06974601745605469, 0.07368850708007812, 0.07763099670410156, 0.081573486328125, 0.08551597595214844, 0.08945846557617188, 0.09340095520019531, 0.09734344482421875, 0.10128593444824219, 0.10522842407226562, 0.10917091369628906, 0.1131134033203125, 0.11705589294433594, 0.12099838256835938, 0.12494087219238281, 0.12888336181640625, 0.1328258514404297, 0.13676834106445312, 0.14071083068847656, 0.1446533203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 10.0, 4.0, 8.0, 12.0, 12.0, 9.0, 17.0, 25.0, 21.0, 21.0, 33.0, 35.0, 53.0, 48.0, 76.0, 68.0, 82.0, 91.0, 71.0, 52.0, 44.0, 41.0, 36.0, 21.0, 16.0, 16.0, 17.0, 17.0, 14.0, 6.0, 8.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.3272430300712585e-05, -3.227218985557556e-05, -3.127194941043854e-05, -3.0271708965301514e-05, -2.927146852016449e-05, -2.8271228075027466e-05, -2.7270987629890442e-05, -2.6270747184753418e-05, -2.5270506739616394e-05, -2.427026629447937e-05, -2.3270025849342346e-05, -2.2269785404205322e-05, -2.12695449590683e-05, -2.0269304513931274e-05, -1.926906406879425e-05, -1.8268823623657227e-05, -1.7268583178520203e-05, -1.626834273338318e-05, -1.5268102288246155e-05, -1.4267861843109131e-05, -1.3267621397972107e-05, -1.2267380952835083e-05, -1.1267140507698059e-05, -1.0266900062561035e-05, -9.266659617424011e-06, -8.266419172286987e-06, -7.266178727149963e-06, -6.2659382820129395e-06, -5.2656978368759155e-06, -4.265457391738892e-06, -3.2652169466018677e-06, -2.2649765014648438e-06, -1.2647360563278198e-06, -2.644956111907959e-07, 7.35744833946228e-07, 1.735985279083252e-06, 2.736225724220276e-06, 3.7364661693573e-06, 4.736706614494324e-06, 5.736947059631348e-06, 6.737187504768372e-06, 7.737427949905396e-06, 8.73766839504242e-06, 9.737908840179443e-06, 1.0738149285316467e-05, 1.1738389730453491e-05, 1.2738630175590515e-05, 1.3738870620727539e-05, 1.4739111065864563e-05, 1.5739351511001587e-05, 1.673959195613861e-05, 1.7739832401275635e-05, 1.874007284641266e-05, 1.9740313291549683e-05, 2.0740553736686707e-05, 2.174079418182373e-05, 2.2741034626960754e-05, 2.374127507209778e-05, 2.4741515517234802e-05, 2.5741755962371826e-05, 2.674199640750885e-05, 2.7742236852645874e-05, 2.8742477297782898e-05, 2.9742717742919922e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 7.0, 9.0, 10.0, 10.0, 19.0, 25.0, 34.0, 96.0, 119.0, 200.0, 375.0, 623.0, 1455.0, 4131.0, 14641.0, 67919.0, 647172.0, 255069.0, 41527.0, 9637.0, 3021.0, 1212.0, 512.0, 292.0, 157.0, 98.0, 53.0, 48.0, 22.0, 17.0, 14.0, 10.0, 7.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.110595703125, -0.10712337493896484, -0.10365104675292969, -0.10017871856689453, -0.09670639038085938, -0.09323406219482422, -0.08976173400878906, -0.0862894058227539, -0.08281707763671875, -0.0793447494506836, -0.07587242126464844, -0.07240009307861328, -0.06892776489257812, -0.06545543670654297, -0.06198310852050781, -0.058510780334472656, -0.0550384521484375, -0.051566123962402344, -0.04809379577636719, -0.04462146759033203, -0.041149139404296875, -0.03767681121826172, -0.03420448303222656, -0.030732154846191406, -0.02725982666015625, -0.023787498474121094, -0.020315170288085938, -0.01684284210205078, -0.013370513916015625, -0.009898185729980469, -0.0064258575439453125, -0.0029535293579101562, 0.000518798828125, 0.003991127014160156, 0.0074634552001953125, 0.010935783386230469, 0.014408111572265625, 0.01788043975830078, 0.021352767944335938, 0.024825096130371094, 0.02829742431640625, 0.031769752502441406, 0.03524208068847656, 0.03871440887451172, 0.042186737060546875, 0.04565906524658203, 0.04913139343261719, 0.052603721618652344, 0.0560760498046875, 0.059548377990722656, 0.06302070617675781, 0.06649303436279297, 0.06996536254882812, 0.07343769073486328, 0.07691001892089844, 0.0803823471069336, 0.08385467529296875, 0.0873270034790039, 0.09079933166503906, 0.09427165985107422, 0.09774398803710938, 0.10121631622314453, 0.10468864440917969, 0.10816097259521484, 0.11163330078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 9.0, 11.0, 14.0, 17.0, 21.0, 27.0, 48.0, 58.0, 74.0, 115.0, 129.0, 125.0, 87.0, 82.0, 53.0, 23.0, 27.0, 21.0, 16.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1861572265625, -0.18160629272460938, -0.17705535888671875, -0.17250442504882812, -0.1679534912109375, -0.16340255737304688, -0.15885162353515625, -0.15430068969726562, -0.149749755859375, -0.14519882202148438, -0.14064788818359375, -0.13609695434570312, -0.1315460205078125, -0.12699508666992188, -0.12244415283203125, -0.11789321899414062, -0.11334228515625, -0.10879135131835938, -0.10424041748046875, -0.09968948364257812, -0.0951385498046875, -0.09058761596679688, -0.08603668212890625, -0.08148574829101562, -0.076934814453125, -0.07238388061523438, -0.06783294677734375, -0.06328201293945312, -0.0587310791015625, -0.054180145263671875, -0.04962921142578125, -0.045078277587890625, -0.04052734375, -0.035976409912109375, -0.03142547607421875, -0.026874542236328125, -0.0223236083984375, -0.017772674560546875, -0.01322174072265625, -0.008670806884765625, -0.004119873046875, 0.000431060791015625, 0.00498199462890625, 0.009532928466796875, 0.0140838623046875, 0.018634796142578125, 0.02318572998046875, 0.027736663818359375, 0.03228759765625, 0.036838531494140625, 0.04138946533203125, 0.045940399169921875, 0.0504913330078125, 0.055042266845703125, 0.05959320068359375, 0.06414413452148438, 0.068695068359375, 0.07324600219726562, 0.07779693603515625, 0.08234786987304688, 0.0868988037109375, 0.09144973754882812, 0.09600067138671875, 0.10055160522460938, 0.1051025390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 12.0, 22.0, 47.0, 89.0, 297.0, 273.0, 117.0, 66.0, 30.0, 15.0, 7.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.2032394409179688, -2.093127489089966, -1.9830154180526733, -1.8729033470153809, -1.762791395187378, -1.6526793241500854, -1.542567253112793, -1.43245530128479, -1.3223432302474976, -1.212231159210205, -1.1021192073822021, -0.9920071363449097, -0.881895124912262, -0.7717831134796143, -0.6616710424423218, -0.5515590310096741, -0.44144701957702637, -0.33133500814437866, -0.22122296690940857, -0.11111092567443848, -0.0009989142417907715, 0.10911309719085693, 0.21922516822814941, 0.3293371796607971, 0.4394491910934448, 0.5495612025260925, 0.6596732139587402, 0.7697852849960327, 0.8798972964286804, 0.9900093078613281, 1.1001213788986206, 1.210233449935913, 1.320345401763916, 1.4304574728012085, 1.5405694246292114, 1.650681495666504, 1.7607934474945068, 1.8709055185317993, 1.9810175895690918, 2.0911295413970947, 2.2012414932250977, 2.3113534450531006, 2.4214656352996826, 2.5315775871276855, 2.6416895389556885, 2.7518014907836914, 2.8619136810302734, 2.9720256328582764, 3.0821378231048584, 3.1922497749328613, 3.3023619651794434, 3.4124739170074463, 3.522585868835449, 3.6326980590820312, 3.742810010910034, 3.852921962738037, 3.963034152984619, 4.073146343231201, 4.183258056640625, 4.293370246887207, 4.403482437133789, 4.513594150543213, 4.623706340789795, 4.733818531036377, 4.843930244445801]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 11.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 14.0, 19.0, 15.0, 17.0, 22.0, 20.0, 29.0, 25.0, 25.0, 36.0, 57.0, 69.0, 102.0, 97.0, 57.0, 41.0, 26.0, 36.0, 24.0, 29.0, 24.0, 22.0, 16.0, 17.0, 11.0, 11.0, 13.0, 7.0, 10.0, 8.0, 5.0, 11.0, 6.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.97845458984375, -1.909497857093811, -1.840541124343872, -1.771584391593933, -1.7026276588439941, -1.6336709260940552, -1.5647141933441162, -1.4957575798034668, -1.4268007278442383, -1.3578439950942993, -1.2888872623443604, -1.2199305295944214, -1.1509737968444824, -1.0820170640945435, -1.0130603313446045, -0.9441036581993103, -0.8751469850540161, -0.8061902523040771, -0.7372335195541382, -0.6682767868041992, -0.5993200540542603, -0.5303633213043213, -0.4614066481590271, -0.39244991540908813, -0.32349318265914917, -0.2545364499092102, -0.18557973206043243, -0.11662301421165466, -0.0476662814617157, 0.021290451288223267, 0.09024715423583984, 0.1592038869857788, 0.22816061973571777, 0.29711735248565674, 0.3660740852355957, 0.4350307881832123, 0.5039875507354736, 0.5729442834854126, 0.6419009566307068, 0.7108576893806458, 0.7798144221305847, 0.8487711548805237, 0.9177278876304626, 0.9866845607757568, 1.0556412935256958, 1.1245980262756348, 1.1935547590255737, 1.2625114917755127, 1.3314682245254517, 1.4004249572753906, 1.4693816900253296, 1.5383384227752686, 1.6072951555252075, 1.6762518882751465, 1.745208501815796, 1.8141653537750244, 1.8831219673156738, 1.9520787000656128, 2.0210354328155518, 2.089992046356201, 2.1589488983154297, 2.227905511856079, 2.2968623638153076, 2.365818977355957, 2.4347758293151855]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 10.0, 8.0, 11.0, 21.0, 19.0, 25.0, 54.0, 63.0, 75.0, 109.0, 167.0, 258.0, 346.0, 590.0, 1312.0, 2850.0, 7708.0, 28274.0, 174845.0, 1177710.0, 2177794.0, 520985.0, 75410.0, 15974.0, 5138.0, 2053.0, 983.0, 515.0, 295.0, 224.0, 127.0, 96.0, 49.0, 38.0, 40.0, 27.0, 21.0, 15.0, 9.0, 4.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.206298828125, -0.1999073028564453, -0.19351577758789062, -0.18712425231933594, -0.18073272705078125, -0.17434120178222656, -0.16794967651367188, -0.1615581512451172, -0.1551666259765625, -0.1487751007080078, -0.14238357543945312, -0.13599205017089844, -0.12960052490234375, -0.12320899963378906, -0.11681747436523438, -0.11042594909667969, -0.104034423828125, -0.09764289855957031, -0.09125137329101562, -0.08485984802246094, -0.07846832275390625, -0.07207679748535156, -0.06568527221679688, -0.05929374694824219, -0.0529022216796875, -0.04651069641113281, -0.040119171142578125, -0.03372764587402344, -0.02733612060546875, -0.020944595336914062, -0.014553070068359375, -0.008161544799804688, -0.00177001953125, 0.0046215057373046875, 0.011013031005859375, 0.017404556274414062, 0.02379608154296875, 0.030187606811523438, 0.036579132080078125, 0.04297065734863281, 0.0493621826171875, 0.05575370788574219, 0.062145233154296875, 0.06853675842285156, 0.07492828369140625, 0.08131980895996094, 0.08771133422851562, 0.09410285949707031, 0.100494384765625, 0.10688591003417969, 0.11327743530273438, 0.11966896057128906, 0.12606048583984375, 0.13245201110839844, 0.13884353637695312, 0.1452350616455078, 0.1516265869140625, 0.1580181121826172, 0.16440963745117188, 0.17080116271972656, 0.17719268798828125, 0.18358421325683594, 0.18997573852539062, 0.1963672637939453, 0.2027587890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 9.0, 13.0, 17.0, 14.0, 21.0, 32.0, 27.0, 28.0, 47.0, 62.0, 57.0, 64.0, 75.0, 72.0, 74.0, 50.0, 47.0, 72.0, 40.0, 44.0, 29.0, 26.0, 20.0, 21.0, 15.0, 10.0, 6.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.203369140625, -0.19536209106445312, -0.18735504150390625, -0.17934799194335938, -0.1713409423828125, -0.16333389282226562, -0.15532684326171875, -0.14731979370117188, -0.139312744140625, -0.13130569458007812, -0.12329864501953125, -0.11529159545898438, -0.1072845458984375, -0.09927749633789062, -0.09127044677734375, -0.08326339721679688, -0.07525634765625, -0.06724929809570312, -0.05924224853515625, -0.051235198974609375, -0.0432281494140625, -0.035221099853515625, -0.02721405029296875, -0.019207000732421875, -0.011199951171875, -0.003192901611328125, 0.00481414794921875, 0.012821197509765625, 0.0208282470703125, 0.028835296630859375, 0.03684234619140625, 0.044849395751953125, 0.0528564453125, 0.060863494873046875, 0.06887054443359375, 0.07687759399414062, 0.0848846435546875, 0.09289169311523438, 0.10089874267578125, 0.10890579223632812, 0.116912841796875, 0.12491989135742188, 0.13292694091796875, 0.14093399047851562, 0.1489410400390625, 0.15694808959960938, 0.16495513916015625, 0.17296218872070312, 0.18096923828125, 0.18897628784179688, 0.19698333740234375, 0.20499038696289062, 0.2129974365234375, 0.22100448608398438, 0.22901153564453125, 0.23701858520507812, 0.245025634765625, 0.2530326843261719, 0.26103973388671875, 0.2690467834472656, 0.2770538330078125, 0.2850608825683594, 0.29306793212890625, 0.3010749816894531, 0.30908203125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 10.0, 11.0, 13.0, 27.0, 36.0, 74.0, 130.0, 243.0, 544.0, 1428.0, 6617.0, 78117.0, 3743166.0, 346954.0, 13349.0, 2199.0, 719.0, 260.0, 155.0, 89.0, 48.0, 23.0, 17.0, 9.0, 11.0, 8.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43212890625, -0.4165191650390625, -0.400909423828125, -0.3852996826171875, -0.36968994140625, -0.3540802001953125, -0.338470458984375, -0.3228607177734375, -0.3072509765625, -0.2916412353515625, -0.276031494140625, -0.2604217529296875, -0.24481201171875, -0.2292022705078125, -0.213592529296875, -0.1979827880859375, -0.182373046875, -0.1667633056640625, -0.151153564453125, -0.1355438232421875, -0.11993408203125, -0.1043243408203125, -0.088714599609375, -0.0731048583984375, -0.0574951171875, -0.0418853759765625, -0.026275634765625, -0.0106658935546875, 0.00494384765625, 0.0205535888671875, 0.036163330078125, 0.0517730712890625, 0.0673828125, 0.0829925537109375, 0.098602294921875, 0.1142120361328125, 0.12982177734375, 0.1454315185546875, 0.161041259765625, 0.1766510009765625, 0.1922607421875, 0.2078704833984375, 0.223480224609375, 0.2390899658203125, 0.25469970703125, 0.2703094482421875, 0.285919189453125, 0.3015289306640625, 0.317138671875, 0.3327484130859375, 0.348358154296875, 0.3639678955078125, 0.37957763671875, 0.3951873779296875, 0.410797119140625, 0.4264068603515625, 0.4420166015625, 0.4576263427734375, 0.473236083984375, 0.4888458251953125, 0.50445556640625, 0.5200653076171875, 0.535675048828125, 0.5512847900390625, 0.56689453125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 12.0, 5.0, 16.0, 21.0, 32.0, 42.0, 61.0, 118.0, 179.0, 325.0, 558.0, 700.0, 738.0, 501.0, 310.0, 167.0, 88.0, 70.0, 40.0, 25.0, 27.0, 12.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.38146209716796875, -0.3691253662109375, -0.35678863525390625, -0.344451904296875, -0.33211517333984375, -0.3197784423828125, -0.30744171142578125, -0.29510498046875, -0.28276824951171875, -0.2704315185546875, -0.25809478759765625, -0.245758056640625, -0.23342132568359375, -0.2210845947265625, -0.20874786376953125, -0.1964111328125, -0.18407440185546875, -0.1717376708984375, -0.15940093994140625, -0.147064208984375, -0.13472747802734375, -0.1223907470703125, -0.11005401611328125, -0.09771728515625, -0.08538055419921875, -0.0730438232421875, -0.06070709228515625, -0.048370361328125, -0.03603363037109375, -0.0236968994140625, -0.01136016845703125, 0.0009765625, 0.01331329345703125, 0.0256500244140625, 0.03798675537109375, 0.050323486328125, 0.06266021728515625, 0.0749969482421875, 0.08733367919921875, 0.09967041015625, 0.11200714111328125, 0.1243438720703125, 0.13668060302734375, 0.149017333984375, 0.16135406494140625, 0.1736907958984375, 0.18602752685546875, 0.1983642578125, 0.21070098876953125, 0.2230377197265625, 0.23537445068359375, 0.247711181640625, 0.26004791259765625, 0.2723846435546875, 0.28472137451171875, 0.29705810546875, 0.30939483642578125, 0.3217315673828125, 0.33406829833984375, 0.346405029296875, 0.35874176025390625, 0.3710784912109375, 0.38341522216796875, 0.395751953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 20.0, 29.0, 79.0, 180.0, 250.0, 244.0, 113.0, 38.0, 21.0, 11.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.871633529663086, -5.746171951293945, -5.620710372924805, -5.495249271392822, -5.369787693023682, -5.244326114654541, -5.1188645362854, -4.993403434753418, -4.867941856384277, -4.742480278015137, -4.617018699645996, -4.491557598114014, -4.366096019744873, -4.240634441375732, -4.115172863006592, -3.9897115230560303, -3.8642499446868896, -3.738788366317749, -3.6133270263671875, -3.487865447998047, -3.3624041080474854, -3.2369425296783447, -3.111481189727783, -2.9860196113586426, -2.860558032989502, -2.7350964546203613, -2.6096351146698, -2.484173536300659, -2.3587121963500977, -2.233250617980957, -2.1077890396118164, -1.9823276996612549, -1.8568665981292725, -1.7314051389694214, -1.6059436798095703, -1.4804821014404297, -1.3550207614898682, -1.2295591831207275, -1.1040977239608765, -0.9786362648010254, -0.8531748056411743, -0.7277133464813232, -0.6022518873214722, -0.4767903685569763, -0.35132890939712524, -0.22586745023727417, -0.10040593147277832, 0.025055527687072754, 0.15051698684692383, 0.2759784460067749, 0.40143993496894836, 0.5269014239311218, 0.6523628830909729, 0.777824342250824, 0.9032858610153198, 1.028747320175171, 1.154208779335022, 1.279670238494873, 1.4051316976547241, 1.5305931568145752, 1.6560547351837158, 1.7815160751342773, 1.906977653503418, 2.0324392318725586, 2.15790057182312]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 6.0, 7.0, 17.0, 12.0, 15.0, 11.0, 26.0, 27.0, 24.0, 27.0, 45.0, 38.0, 36.0, 40.0, 54.0, 57.0, 54.0, 57.0, 57.0, 37.0, 48.0, 43.0, 39.0, 32.0, 21.0, 26.0, 16.0, 26.0, 19.0, 14.0, 15.0, 10.0, 10.0, 12.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.664239764213562, -1.614546537399292, -1.564853310585022, -1.515160083770752, -1.465466856956482, -1.415773630142212, -1.366080403327942, -1.3163871765136719, -1.2666939496994019, -1.2170007228851318, -1.1673074960708618, -1.1176142692565918, -1.0679210424423218, -1.0182278156280518, -0.9685345888137817, -0.9188413619995117, -0.8691480755805969, -0.8194548487663269, -0.7697616219520569, -0.7200683951377869, -0.6703751683235168, -0.6206819415092468, -0.570988655090332, -0.521295428276062, -0.4716022312641144, -0.42190900444984436, -0.37221577763557434, -0.32252252101898193, -0.2728292942047119, -0.2231360822916031, -0.17344284057617188, -0.12374961376190186, -0.07405638694763184, -0.024363156408071518, 0.0253300741314888, 0.07502330839633942, 0.12471653521060944, 0.17440976202487946, 0.22410300374031067, 0.2737962305545807, 0.3234894573688507, 0.3731826841831207, 0.42287591099739075, 0.47256916761398315, 0.5222623944282532, 0.5719556212425232, 0.6216488480567932, 0.6713420748710632, 0.7210353016853333, 0.7707285284996033, 0.8204217553138733, 0.8701149821281433, 0.9198082089424133, 0.9695014357566833, 1.0191947221755981, 1.0688879489898682, 1.1185811758041382, 1.1682744026184082, 1.2179676294326782, 1.2676608562469482, 1.3173540830612183, 1.3670473098754883, 1.4167405366897583, 1.4664337635040283, 1.5161269903182983]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 9.0, 11.0, 21.0, 33.0, 51.0, 77.0, 143.0, 240.0, 478.0, 861.0, 1828.0, 4058.0, 10379.0, 33465.0, 149784.0, 547650.0, 228858.0, 47517.0, 13533.0, 5055.0, 2190.0, 1070.0, 540.0, 288.0, 156.0, 114.0, 52.0, 31.0, 21.0, 15.0, 9.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125, -0.3019523620605469, -0.29140472412109375, -0.2808570861816406, -0.2703094482421875, -0.2597618103027344, -0.24921417236328125, -0.23866653442382812, -0.228118896484375, -0.21757125854492188, -0.20702362060546875, -0.19647598266601562, -0.1859283447265625, -0.17538070678710938, -0.16483306884765625, -0.15428543090820312, -0.14373779296875, -0.13319015502929688, -0.12264251708984375, -0.11209487915039062, -0.1015472412109375, -0.09099960327148438, -0.08045196533203125, -0.06990432739257812, -0.059356689453125, -0.048809051513671875, -0.03826141357421875, -0.027713775634765625, -0.0171661376953125, -0.006618499755859375, 0.00392913818359375, 0.014476776123046875, 0.0250244140625, 0.035572052001953125, 0.04611968994140625, 0.056667327880859375, 0.0672149658203125, 0.07776260375976562, 0.08831024169921875, 0.09885787963867188, 0.109405517578125, 0.11995315551757812, 0.13050079345703125, 0.14104843139648438, 0.1515960693359375, 0.16214370727539062, 0.17269134521484375, 0.18323898315429688, 0.19378662109375, 0.20433425903320312, 0.21488189697265625, 0.22542953491210938, 0.2359771728515625, 0.24652481079101562, 0.25707244873046875, 0.2676200866699219, 0.278167724609375, 0.2887153625488281, 0.29926300048828125, 0.3098106384277344, 0.3203582763671875, 0.3309059143066406, 0.34145355224609375, 0.3520011901855469, 0.362548828125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 10.0, 27.0, 19.0, 10.0, 29.0, 31.0, 29.0, 49.0, 59.0, 66.0, 71.0, 68.0, 58.0, 54.0, 61.0, 66.0, 48.0, 49.0, 30.0, 41.0, 28.0, 32.0, 21.0, 10.0, 7.0, 10.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.1964244842529297, -0.18838119506835938, -0.18033790588378906, -0.17229461669921875, -0.16425132751464844, -0.15620803833007812, -0.1481647491455078, -0.1401214599609375, -0.1320781707763672, -0.12403488159179688, -0.11599159240722656, -0.10794830322265625, -0.09990501403808594, -0.09186172485351562, -0.08381843566894531, -0.075775146484375, -0.06773185729980469, -0.059688568115234375, -0.05164527893066406, -0.04360198974609375, -0.03555870056152344, -0.027515411376953125, -0.019472122192382812, -0.0114288330078125, -0.0033855438232421875, 0.004657745361328125, 0.012701034545898438, 0.02074432373046875, 0.028787612915039062, 0.036830902099609375, 0.04487419128417969, 0.05291748046875, 0.06096076965332031, 0.06900405883789062, 0.07704734802246094, 0.08509063720703125, 0.09313392639160156, 0.10117721557617188, 0.10922050476074219, 0.1172637939453125, 0.1253070831298828, 0.13335037231445312, 0.14139366149902344, 0.14943695068359375, 0.15748023986816406, 0.16552352905273438, 0.1735668182373047, 0.181610107421875, 0.1896533966064453, 0.19769668579101562, 0.20573997497558594, 0.21378326416015625, 0.22182655334472656, 0.22986984252929688, 0.2379131317138672, 0.2459564208984375, 0.2539997100830078, 0.2620429992675781, 0.27008628845214844, 0.27812957763671875, 0.28617286682128906, 0.2942161560058594, 0.3022594451904297, 0.310302734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 13.0, 16.0, 34.0, 24.0, 44.0, 60.0, 80.0, 84.0, 121.0, 173.0, 249.0, 325.0, 551.0, 872.0, 1541.0, 4059.0, 27822.0, 785126.0, 208547.0, 12377.0, 2801.0, 1247.0, 739.0, 468.0, 326.0, 207.0, 157.0, 110.0, 102.0, 63.0, 54.0, 27.0, 33.0, 19.0, 10.0, 18.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5339508056640625, -0.516632080078125, -0.4993133544921875, -0.48199462890625, -0.4646759033203125, -0.447357177734375, -0.4300384521484375, -0.4127197265625, -0.3954010009765625, -0.378082275390625, -0.3607635498046875, -0.34344482421875, -0.3261260986328125, -0.308807373046875, -0.2914886474609375, -0.274169921875, -0.2568511962890625, -0.239532470703125, -0.2222137451171875, -0.20489501953125, -0.1875762939453125, -0.170257568359375, -0.1529388427734375, -0.1356201171875, -0.1183013916015625, -0.100982666015625, -0.0836639404296875, -0.06634521484375, -0.0490264892578125, -0.031707763671875, -0.0143890380859375, 0.0029296875, 0.0202484130859375, 0.037567138671875, 0.0548858642578125, 0.07220458984375, 0.0895233154296875, 0.106842041015625, 0.1241607666015625, 0.1414794921875, 0.1587982177734375, 0.176116943359375, 0.1934356689453125, 0.21075439453125, 0.2280731201171875, 0.245391845703125, 0.2627105712890625, 0.280029296875, 0.2973480224609375, 0.314666748046875, 0.3319854736328125, 0.34930419921875, 0.3666229248046875, 0.383941650390625, 0.4012603759765625, 0.4185791015625, 0.4358978271484375, 0.453216552734375, 0.4705352783203125, 0.48785400390625, 0.5051727294921875, 0.522491455078125, 0.5398101806640625, 0.55712890625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 5.0, 3.0, 3.0, 8.0, 9.0, 13.0, 18.0, 13.0, 22.0, 22.0, 21.0, 26.0, 34.0, 35.0, 48.0, 55.0, 39.0, 45.0, 49.0, 48.0, 41.0, 51.0, 42.0, 54.0, 39.0, 37.0, 34.0, 28.0, 25.0, 24.0, 17.0, 9.0, 16.0, 12.0, 14.0, 14.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5295791625976562, -0.5103302001953125, -0.49108123779296875, -0.471832275390625, -0.45258331298828125, -0.4333343505859375, -0.41408538818359375, -0.39483642578125, -0.37558746337890625, -0.3563385009765625, -0.33708953857421875, -0.317840576171875, -0.29859161376953125, -0.2793426513671875, -0.26009368896484375, -0.2408447265625, -0.22159576416015625, -0.2023468017578125, -0.18309783935546875, -0.163848876953125, -0.14459991455078125, -0.1253509521484375, -0.10610198974609375, -0.08685302734375, -0.06760406494140625, -0.0483551025390625, -0.02910614013671875, -0.009857177734375, 0.00939178466796875, 0.0286407470703125, 0.04788970947265625, 0.067138671875, 0.08638763427734375, 0.1056365966796875, 0.12488555908203125, 0.144134521484375, 0.16338348388671875, 0.1826324462890625, 0.20188140869140625, 0.22113037109375, 0.24037933349609375, 0.2596282958984375, 0.27887725830078125, 0.298126220703125, 0.31737518310546875, 0.3366241455078125, 0.35587310791015625, 0.3751220703125, 0.39437103271484375, 0.4136199951171875, 0.43286895751953125, 0.452117919921875, 0.47136688232421875, 0.4906158447265625, 0.5098648071289062, 0.52911376953125, 0.5483627319335938, 0.5676116943359375, 0.5868606567382812, 0.606109619140625, 0.6253585815429688, 0.6446075439453125, 0.6638565063476562, 0.68310546875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 11.0, 22.0, 28.0, 42.0, 98.0, 157.0, 340.0, 1118.0, 5878.0, 98221.0, 915068.0, 23655.0, 2667.0, 652.0, 232.0, 130.0, 71.0, 55.0, 28.0, 21.0, 8.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23583984375, -0.229156494140625, -0.22247314453125, -0.215789794921875, -0.2091064453125, -0.202423095703125, -0.19573974609375, -0.189056396484375, -0.182373046875, -0.175689697265625, -0.16900634765625, -0.162322998046875, -0.1556396484375, -0.148956298828125, -0.14227294921875, -0.135589599609375, -0.12890625, -0.122222900390625, -0.11553955078125, -0.108856201171875, -0.1021728515625, -0.095489501953125, -0.08880615234375, -0.082122802734375, -0.075439453125, -0.068756103515625, -0.06207275390625, -0.055389404296875, -0.0487060546875, -0.042022705078125, -0.03533935546875, -0.028656005859375, -0.02197265625, -0.015289306640625, -0.00860595703125, -0.001922607421875, 0.0047607421875, 0.011444091796875, 0.01812744140625, 0.024810791015625, 0.031494140625, 0.038177490234375, 0.04486083984375, 0.051544189453125, 0.0582275390625, 0.064910888671875, 0.07159423828125, 0.078277587890625, 0.0849609375, 0.091644287109375, 0.09832763671875, 0.105010986328125, 0.1116943359375, 0.118377685546875, 0.12506103515625, 0.131744384765625, 0.138427734375, 0.145111083984375, 0.15179443359375, 0.158477783203125, 0.1651611328125, 0.171844482421875, 0.17852783203125, 0.185211181640625, 0.19189453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 14.0, 11.0, 28.0, 36.0, 51.0, 84.0, 98.0, 145.0, 119.0, 122.0, 79.0, 56.0, 44.0, 17.0, 11.0, 13.0, 6.0, 10.0, 5.0, 4.0, 3.0, 5.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.104873657226562e-05, -6.913114339113235e-05, -6.721355020999908e-05, -6.529595702886581e-05, -6.337836384773254e-05, -6.146077066659927e-05, -5.9543177485466003e-05, -5.762558430433273e-05, -5.570799112319946e-05, -5.379039794206619e-05, -5.187280476093292e-05, -4.995521157979965e-05, -4.803761839866638e-05, -4.612002521753311e-05, -4.420243203639984e-05, -4.228483885526657e-05, -4.03672456741333e-05, -3.844965249300003e-05, -3.653205931186676e-05, -3.461446613073349e-05, -3.269687294960022e-05, -3.077927976846695e-05, -2.886168658733368e-05, -2.694409340620041e-05, -2.502650022506714e-05, -2.310890704393387e-05, -2.1191313862800598e-05, -1.9273720681667328e-05, -1.7356127500534058e-05, -1.5438534319400787e-05, -1.3520941138267517e-05, -1.1603347957134247e-05, -9.685754776000977e-06, -7.768161594867706e-06, -5.850568413734436e-06, -3.932975232601166e-06, -2.0153820514678955e-06, -9.778887033462524e-08, 1.819804310798645e-06, 3.7373974919319153e-06, 5.6549906730651855e-06, 7.572583854198456e-06, 9.490177035331726e-06, 1.1407770216464996e-05, 1.3325363397598267e-05, 1.5242956578731537e-05, 1.7160549759864807e-05, 1.9078142940998077e-05, 2.0995736122131348e-05, 2.2913329303264618e-05, 2.4830922484397888e-05, 2.674851566553116e-05, 2.866610884666443e-05, 3.05837020277977e-05, 3.250129520893097e-05, 3.441888839006424e-05, 3.633648157119751e-05, 3.825407475233078e-05, 4.017166793346405e-05, 4.208926111459732e-05, 4.400685429573059e-05, 4.592444747686386e-05, 4.784204065799713e-05, 4.97596338391304e-05, 5.167722702026367e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 8.0, 10.0, 6.0, 11.0, 28.0, 36.0, 47.0, 69.0, 92.0, 153.0, 206.0, 374.0, 722.0, 1586.0, 4441.0, 19073.0, 146880.0, 790390.0, 67681.0, 11080.0, 3056.0, 1168.0, 549.0, 335.0, 187.0, 125.0, 65.0, 50.0, 36.0, 32.0, 30.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11065673828125, -0.10723400115966797, -0.10381126403808594, -0.1003885269165039, -0.09696578979492188, -0.09354305267333984, -0.09012031555175781, -0.08669757843017578, -0.08327484130859375, -0.07985210418701172, -0.07642936706542969, -0.07300662994384766, -0.06958389282226562, -0.0661611557006836, -0.06273841857910156, -0.05931568145751953, -0.0558929443359375, -0.05247020721435547, -0.04904747009277344, -0.045624732971191406, -0.042201995849609375, -0.038779258728027344, -0.03535652160644531, -0.03193378448486328, -0.02851104736328125, -0.02508831024169922, -0.021665573120117188, -0.018242835998535156, -0.014820098876953125, -0.011397361755371094, -0.007974624633789062, -0.004551887512207031, -0.001129150390625, 0.0022935867309570312, 0.0057163238525390625, 0.009139060974121094, 0.012561798095703125, 0.015984535217285156, 0.019407272338867188, 0.02283000946044922, 0.02625274658203125, 0.02967548370361328, 0.03309822082519531, 0.036520957946777344, 0.039943695068359375, 0.043366432189941406, 0.04678916931152344, 0.05021190643310547, 0.0536346435546875, 0.05705738067626953, 0.06048011779785156, 0.0639028549194336, 0.06732559204101562, 0.07074832916259766, 0.07417106628417969, 0.07759380340576172, 0.08101654052734375, 0.08443927764892578, 0.08786201477050781, 0.09128475189208984, 0.09470748901367188, 0.0981302261352539, 0.10155296325683594, 0.10497570037841797, 0.1083984375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 6.0, 5.0, 9.0, 14.0, 16.0, 18.0, 20.0, 20.0, 33.0, 47.0, 41.0, 52.0, 68.0, 65.0, 97.0, 80.0, 66.0, 47.0, 57.0, 31.0, 24.0, 23.0, 20.0, 22.0, 18.0, 16.0, 10.0, 12.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0806884765625, -0.07828521728515625, -0.0758819580078125, -0.07347869873046875, -0.071075439453125, -0.06867218017578125, -0.0662689208984375, -0.06386566162109375, -0.06146240234375, -0.05905914306640625, -0.0566558837890625, -0.05425262451171875, -0.051849365234375, -0.04944610595703125, -0.0470428466796875, -0.04463958740234375, -0.042236328125, -0.03983306884765625, -0.0374298095703125, -0.03502655029296875, -0.032623291015625, -0.03022003173828125, -0.0278167724609375, -0.02541351318359375, -0.02301025390625, -0.02060699462890625, -0.0182037353515625, -0.01580047607421875, -0.013397216796875, -0.01099395751953125, -0.0085906982421875, -0.00618743896484375, -0.0037841796875, -0.00138092041015625, 0.0010223388671875, 0.00342559814453125, 0.005828857421875, 0.00823211669921875, 0.0106353759765625, 0.01303863525390625, 0.01544189453125, 0.01784515380859375, 0.0202484130859375, 0.02265167236328125, 0.025054931640625, 0.02745819091796875, 0.0298614501953125, 0.03226470947265625, 0.03466796875, 0.03707122802734375, 0.0394744873046875, 0.04187774658203125, 0.044281005859375, 0.04668426513671875, 0.0490875244140625, 0.05149078369140625, 0.05389404296875, 0.05629730224609375, 0.0587005615234375, 0.06110382080078125, 0.063507080078125, 0.06591033935546875, 0.0683135986328125, 0.07071685791015625, 0.0731201171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 24.0, 108.0, 595.0, 231.0, 30.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1179704666137695, -6.862144470214844, -6.606318473815918, -6.350492477416992, -6.094666481018066, -5.838840484619141, -5.583014488220215, -5.327188491821289, -5.071362495422363, -4.8155364990234375, -4.559710502624512, -4.303884506225586, -4.04805850982666, -3.7922325134277344, -3.5364065170288086, -3.280580520629883, -3.024754524230957, -2.7689285278320312, -2.5131025314331055, -2.2572765350341797, -2.001450538635254, -1.7456245422363281, -1.4897985458374023, -1.2339725494384766, -0.9781465530395508, -0.722320556640625, -0.4664945602416992, -0.21066856384277344, 0.045157432556152344, 0.3009834289550781, 0.5568094253540039, 0.8126354217529297, 1.0684623718261719, 1.3242883682250977, 1.5801143646240234, 1.8359403610229492, 2.091766357421875, 2.347592353820801, 2.6034183502197266, 2.8592443466186523, 3.115070343017578, 3.370896339416504, 3.6267223358154297, 3.8825483322143555, 4.138374328613281, 4.394200325012207, 4.650026321411133, 4.905852317810059, 5.161678314208984, 5.41750431060791, 5.673330307006836, 5.929156303405762, 6.1849822998046875, 6.440808296203613, 6.696634292602539, 6.952460289001465, 7.208286285400391, 7.464112281799316, 7.719938278198242, 7.975764274597168, 8.231590270996094, 8.48741626739502, 8.743242263793945, 8.999068260192871, 9.254894256591797]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 7.0, 5.0, 8.0, 12.0, 9.0, 12.0, 13.0, 14.0, 20.0, 18.0, 22.0, 30.0, 19.0, 24.0, 30.0, 24.0, 45.0, 110.0, 163.0, 83.0, 38.0, 23.0, 29.0, 27.0, 21.0, 25.0, 24.0, 22.0, 22.0, 15.0, 16.0, 10.0, 6.0, 9.0, 8.0, 3.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.0402026176452637, -1.9682003259658813, -1.896198034286499, -1.8241957426071167, -1.7521934509277344, -1.6801910400390625, -1.6081887483596802, -1.5361864566802979, -1.4641841650009155, -1.3921818733215332, -1.3201795816421509, -1.2481772899627686, -1.1761748790740967, -1.104172706604004, -1.032170295715332, -0.9601680040359497, -0.8881657123565674, -0.8161634206771851, -0.7441611289978027, -0.6721587777137756, -0.6001564860343933, -0.528154194355011, -0.4561518728733063, -0.38414955139160156, -0.31214725971221924, -0.24014495313167572, -0.1681426465511322, -0.09614033997058868, -0.024138033390045166, 0.04786425828933716, 0.11986657977104187, 0.19186890125274658, 0.2638711929321289, 0.33587348461151123, 0.40787580609321594, 0.47987812757492065, 0.551880419254303, 0.6238827109336853, 0.6958850622177124, 0.7678873538970947, 0.839889645576477, 0.9118919372558594, 0.9838942289352417, 1.055896520614624, 1.127898931503296, 1.1999011039733887, 1.2719035148620605, 1.3439058065414429, 1.4159080982208252, 1.4879103899002075, 1.5599126815795898, 1.6319149732589722, 1.7039172649383545, 1.7759196758270264, 1.8479219675064087, 1.919924259185791, 1.9919265508651733, 2.0639288425445557, 2.1359312534332275, 2.2079334259033203, 2.279935836791992, 2.351938009262085, 2.423940420150757, 2.4959425926208496, 2.5679450035095215]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 4.0, 8.0, 15.0, 20.0, 28.0, 49.0, 76.0, 92.0, 151.0, 255.0, 377.0, 681.0, 1230.0, 2382.0, 5082.0, 12733.0, 49112.0, 277720.0, 1187424.0, 1828594.0, 661232.0, 123972.0, 26615.0, 8745.0, 3593.0, 1797.0, 941.0, 507.0, 275.0, 222.0, 122.0, 76.0, 44.0, 29.0, 20.0, 15.0, 13.0, 7.0, 9.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21826171875, -0.21128273010253906, -0.20430374145507812, -0.1973247528076172, -0.19034576416015625, -0.1833667755126953, -0.17638778686523438, -0.16940879821777344, -0.1624298095703125, -0.15545082092285156, -0.14847183227539062, -0.1414928436279297, -0.13451385498046875, -0.1275348663330078, -0.12055587768554688, -0.11357688903808594, -0.106597900390625, -0.09961891174316406, -0.09263992309570312, -0.08566093444824219, -0.07868194580078125, -0.07170295715332031, -0.06472396850585938, -0.05774497985839844, -0.0507659912109375, -0.04378700256347656, -0.036808013916015625, -0.029829025268554688, -0.02285003662109375, -0.015871047973632812, -0.008892059326171875, -0.0019130706787109375, 0.00506591796875, 0.012044906616210938, 0.019023895263671875, 0.026002883911132812, 0.03298187255859375, 0.03996086120605469, 0.046939849853515625, 0.05391883850097656, 0.0608978271484375, 0.06787681579589844, 0.07485580444335938, 0.08183479309082031, 0.08881378173828125, 0.09579277038574219, 0.10277175903320312, 0.10975074768066406, 0.116729736328125, 0.12370872497558594, 0.13068771362304688, 0.1376667022705078, 0.14464569091796875, 0.1516246795654297, 0.15860366821289062, 0.16558265686035156, 0.1725616455078125, 0.17954063415527344, 0.18651962280273438, 0.1934986114501953, 0.20047760009765625, 0.2074565887451172, 0.21443557739257812, 0.22141456604003906, 0.2283935546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 5.0, 11.0, 20.0, 16.0, 28.0, 34.0, 39.0, 59.0, 45.0, 67.0, 66.0, 64.0, 69.0, 73.0, 61.0, 44.0, 53.0, 52.0, 33.0, 32.0, 32.0, 26.0, 20.0, 15.0, 9.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19610595703125, -0.1881103515625, -0.18011474609375, -0.172119140625, -0.16412353515625, -0.1561279296875, -0.14813232421875, -0.14013671875, -0.13214111328125, -0.1241455078125, -0.11614990234375, -0.108154296875, -0.10015869140625, -0.0921630859375, -0.08416748046875, -0.076171875, -0.06817626953125, -0.0601806640625, -0.05218505859375, -0.044189453125, -0.03619384765625, -0.0281982421875, -0.02020263671875, -0.01220703125, -0.00421142578125, 0.0037841796875, 0.01177978515625, 0.019775390625, 0.02777099609375, 0.0357666015625, 0.04376220703125, 0.0517578125, 0.05975341796875, 0.0677490234375, 0.07574462890625, 0.083740234375, 0.09173583984375, 0.0997314453125, 0.10772705078125, 0.11572265625, 0.12371826171875, 0.1317138671875, 0.13970947265625, 0.147705078125, 0.15570068359375, 0.1636962890625, 0.17169189453125, 0.1796875, 0.18768310546875, 0.1956787109375, 0.20367431640625, 0.211669921875, 0.21966552734375, 0.2276611328125, 0.23565673828125, 0.24365234375, 0.25164794921875, 0.2596435546875, 0.26763916015625, 0.275634765625, 0.28363037109375, 0.2916259765625, 0.29962158203125, 0.3076171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 8.0, 7.0, 9.0, 23.0, 40.0, 33.0, 69.0, 83.0, 140.0, 258.0, 394.0, 736.0, 1533.0, 4139.0, 18929.0, 889736.0, 3242241.0, 28174.0, 4574.0, 1423.0, 705.0, 369.0, 227.0, 125.0, 86.0, 55.0, 33.0, 31.0, 25.0, 10.0, 9.0, 8.0, 7.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.74853515625, -0.7236709594726562, -0.6988067626953125, -0.6739425659179688, -0.649078369140625, -0.6242141723632812, -0.5993499755859375, -0.5744857788085938, -0.54962158203125, -0.5247573852539062, -0.4998931884765625, -0.47502899169921875, -0.450164794921875, -0.42530059814453125, -0.4004364013671875, -0.37557220458984375, -0.3507080078125, -0.32584381103515625, -0.3009796142578125, -0.27611541748046875, -0.251251220703125, -0.22638702392578125, -0.2015228271484375, -0.17665863037109375, -0.15179443359375, -0.12693023681640625, -0.1020660400390625, -0.07720184326171875, -0.052337646484375, -0.02747344970703125, -0.0026092529296875, 0.02225494384765625, 0.047119140625, 0.07198333740234375, 0.0968475341796875, 0.12171173095703125, 0.146575927734375, 0.17144012451171875, 0.1963043212890625, 0.22116851806640625, 0.24603271484375, 0.27089691162109375, 0.2957611083984375, 0.32062530517578125, 0.345489501953125, 0.37035369873046875, 0.3952178955078125, 0.42008209228515625, 0.4449462890625, 0.46981048583984375, 0.4946746826171875, 0.5195388793945312, 0.544403076171875, 0.5692672729492188, 0.5941314697265625, 0.6189956665039062, 0.64385986328125, 0.6687240600585938, 0.6935882568359375, 0.7184524536132812, 0.743316650390625, 0.7681808471679688, 0.7930450439453125, 0.8179092407226562, 0.8427734375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 7.0, 8.0, 11.0, 12.0, 25.0, 26.0, 32.0, 52.0, 76.0, 116.0, 143.0, 231.0, 374.0, 556.0, 682.0, 631.0, 407.0, 238.0, 145.0, 113.0, 69.0, 28.0, 27.0, 16.0, 15.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7333984375, -0.7138290405273438, -0.6942596435546875, -0.6746902465820312, -0.655120849609375, -0.6355514526367188, -0.6159820556640625, -0.5964126586914062, -0.57684326171875, -0.5572738647460938, -0.5377044677734375, -0.5181350708007812, -0.498565673828125, -0.47899627685546875, -0.4594268798828125, -0.43985748291015625, -0.4202880859375, -0.40071868896484375, -0.3811492919921875, -0.36157989501953125, -0.342010498046875, -0.32244110107421875, -0.3028717041015625, -0.28330230712890625, -0.26373291015625, -0.24416351318359375, -0.2245941162109375, -0.20502471923828125, -0.185455322265625, -0.16588592529296875, -0.1463165283203125, -0.12674713134765625, -0.107177734375, -0.08760833740234375, -0.0680389404296875, -0.04846954345703125, -0.028900146484375, -0.00933074951171875, 0.0102386474609375, 0.02980804443359375, 0.04937744140625, 0.06894683837890625, 0.0885162353515625, 0.10808563232421875, 0.127655029296875, 0.14722442626953125, 0.1667938232421875, 0.18636322021484375, 0.2059326171875, 0.22550201416015625, 0.2450714111328125, 0.26464080810546875, 0.284210205078125, 0.30377960205078125, 0.3233489990234375, 0.34291839599609375, 0.36248779296875, 0.38205718994140625, 0.4016265869140625, 0.42119598388671875, 0.440765380859375, 0.46033477783203125, 0.4799041748046875, 0.49947357177734375, 0.51904296875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 33.0, 61.0, 221.0, 432.0, 178.0, 50.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.28878402709961, -24.83358383178711, -24.37838363647461, -23.923181533813477, -23.467981338500977, -23.012781143188477, -22.557579040527344, -22.102378845214844, -21.647178649902344, -21.191978454589844, -20.736778259277344, -20.28157615661621, -19.82637596130371, -19.37117576599121, -18.915973663330078, -18.460773468017578, -18.005573272705078, -17.550373077392578, -17.095172882080078, -16.639970779418945, -16.184770584106445, -15.729570388793945, -15.274369239807129, -14.819168090820312, -14.363967895507812, -13.908767700195312, -13.453566551208496, -12.99836540222168, -12.54316520690918, -12.08796501159668, -11.632763862609863, -11.177562713623047, -10.722362518310547, -10.267162322998047, -9.81196117401123, -9.356760025024414, -8.901559829711914, -8.446359634399414, -7.991158485412598, -7.5359578132629395, -7.080757141113281, -6.625556468963623, -6.170355796813965, -5.715155124664307, -5.259954452514648, -4.80475378036499, -4.349553108215332, -3.894352436065674, -3.4391515254974365, -2.9839508533477783, -2.52875018119812, -2.073549509048462, -1.6183488368988037, -1.1631481647491455, -0.7079474925994873, -0.2527468204498291, 0.2024538516998291, 0.6576545238494873, 1.1128551959991455, 1.5680558681488037, 2.023256540298462, 2.47845721244812, 2.9336578845977783, 3.3888585567474365, 3.8440592288970947]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 8.0, 7.0, 6.0, 29.0, 27.0, 32.0, 55.0, 78.0, 91.0, 115.0, 120.0, 113.0, 101.0, 71.0, 56.0, 37.0, 22.0, 10.0, 16.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.560724258422852, -8.33340835571289, -8.106093406677246, -7.878777503967285, -7.651461601257324, -7.4241461753845215, -7.196830749511719, -6.969514846801758, -6.742198944091797, -6.514883518218994, -6.287567615509033, -6.0602521896362305, -5.8329362869262695, -5.605620861053467, -5.378305435180664, -5.150989532470703, -4.9236741065979, -4.696358680725098, -4.469042778015137, -4.241727352142334, -4.014411449432373, -3.7870960235595703, -3.5597803592681885, -3.3324646949768066, -3.105149030685425, -2.877833366394043, -2.650517702102661, -2.4232020378112793, -2.1958866119384766, -1.9685708284378052, -1.741255283355713, -1.513939619064331, -1.2866239547729492, -1.0593082904815674, -0.8319926857948303, -0.6046770811080933, -0.3773614168167114, -0.1500457525253296, 0.0772697925567627, 0.30458545684814453, 0.5319011211395264, 0.7592167854309082, 0.9865323901176453, 1.2138479948043823, 1.4411636590957642, 1.668479323387146, 1.8957948684692383, 2.12311053276062, 2.350426197052002, 2.577741861343384, 2.8050575256347656, 3.0323729515075684, 3.2596888542175293, 3.487004280090332, 3.714319944381714, 3.9416356086730957, 4.168951034545898, 4.396266460418701, 4.623582363128662, 4.850897789001465, 5.078213691711426, 5.3055291175842285, 5.532844543457031, 5.760160446166992, 5.987476348876953]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 10.0, 6.0, 7.0, 17.0, 28.0, 36.0, 42.0, 62.0, 134.0, 312.0, 779.0, 2406.0, 8840.0, 49230.0, 716536.0, 237999.0, 24144.0, 5323.0, 1557.0, 526.0, 234.0, 119.0, 61.0, 34.0, 25.0, 19.0, 14.0, 7.0, 9.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.472900390625, -0.45891571044921875, -0.4449310302734375, -0.43094635009765625, -0.416961669921875, -0.40297698974609375, -0.3889923095703125, -0.37500762939453125, -0.36102294921875, -0.34703826904296875, -0.3330535888671875, -0.31906890869140625, -0.305084228515625, -0.29109954833984375, -0.2771148681640625, -0.26313018798828125, -0.2491455078125, -0.23516082763671875, -0.2211761474609375, -0.20719146728515625, -0.193206787109375, -0.17922210693359375, -0.1652374267578125, -0.15125274658203125, -0.13726806640625, -0.12328338623046875, -0.1092987060546875, -0.09531402587890625, -0.081329345703125, -0.06734466552734375, -0.0533599853515625, -0.03937530517578125, -0.025390625, -0.01140594482421875, 0.0025787353515625, 0.01656341552734375, 0.030548095703125, 0.04453277587890625, 0.0585174560546875, 0.07250213623046875, 0.08648681640625, 0.10047149658203125, 0.1144561767578125, 0.12844085693359375, 0.142425537109375, 0.15641021728515625, 0.1703948974609375, 0.18437957763671875, 0.1983642578125, 0.21234893798828125, 0.2263336181640625, 0.24031829833984375, 0.254302978515625, 0.26828765869140625, 0.2822723388671875, 0.29625701904296875, 0.31024169921875, 0.32422637939453125, 0.3382110595703125, 0.35219573974609375, 0.366180419921875, 0.38016510009765625, 0.3941497802734375, 0.40813446044921875, 0.422119140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 14.0, 21.0, 37.0, 59.0, 98.0, 113.0, 123.0, 125.0, 118.0, 99.0, 64.0, 58.0, 38.0, 14.0, 10.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7641830444335938, -0.7456512451171875, -0.7271194458007812, -0.708587646484375, -0.6900558471679688, -0.6715240478515625, -0.6529922485351562, -0.63446044921875, -0.6159286499023438, -0.5973968505859375, -0.5788650512695312, -0.560333251953125, -0.5418014526367188, -0.5232696533203125, -0.5047378540039062, -0.4862060546875, -0.46767425537109375, -0.4491424560546875, -0.43061065673828125, -0.412078857421875, -0.39354705810546875, -0.3750152587890625, -0.35648345947265625, -0.33795166015625, -0.31941986083984375, -0.3008880615234375, -0.28235626220703125, -0.263824462890625, -0.24529266357421875, -0.2267608642578125, -0.20822906494140625, -0.189697265625, -0.17116546630859375, -0.1526336669921875, -0.13410186767578125, -0.115570068359375, -0.09703826904296875, -0.0785064697265625, -0.05997467041015625, -0.04144287109375, -0.02291107177734375, -0.0043792724609375, 0.01415252685546875, 0.032684326171875, 0.05121612548828125, 0.0697479248046875, 0.08827972412109375, 0.1068115234375, 0.12534332275390625, 0.1438751220703125, 0.16240692138671875, 0.180938720703125, 0.19947052001953125, 0.2180023193359375, 0.23653411865234375, 0.25506591796875, 0.27359771728515625, 0.2921295166015625, 0.31066131591796875, 0.329193115234375, 0.34772491455078125, 0.3662567138671875, 0.38478851318359375, 0.4033203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 16.0, 18.0, 30.0, 56.0, 76.0, 151.0, 240.0, 518.0, 1360.0, 6928.0, 341472.0, 687974.0, 7173.0, 1340.0, 556.0, 245.0, 142.0, 82.0, 66.0, 39.0, 26.0, 9.0, 13.0, 12.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.599609375, -0.5796279907226562, -0.5596466064453125, -0.5396652221679688, -0.519683837890625, -0.49970245361328125, -0.4797210693359375, -0.45973968505859375, -0.43975830078125, -0.41977691650390625, -0.3997955322265625, -0.37981414794921875, -0.359832763671875, -0.33985137939453125, -0.3198699951171875, -0.29988861083984375, -0.2799072265625, -0.25992584228515625, -0.2399444580078125, -0.21996307373046875, -0.199981689453125, -0.18000030517578125, -0.1600189208984375, -0.14003753662109375, -0.12005615234375, -0.10007476806640625, -0.0800933837890625, -0.06011199951171875, -0.040130615234375, -0.02014923095703125, -0.0001678466796875, 0.01981353759765625, 0.039794921875, 0.05977630615234375, 0.0797576904296875, 0.09973907470703125, 0.119720458984375, 0.13970184326171875, 0.1596832275390625, 0.17966461181640625, 0.19964599609375, 0.21962738037109375, 0.2396087646484375, 0.25959014892578125, 0.279571533203125, 0.29955291748046875, 0.3195343017578125, 0.33951568603515625, 0.3594970703125, 0.37947845458984375, 0.3994598388671875, 0.41944122314453125, 0.439422607421875, 0.45940399169921875, 0.4793853759765625, 0.49936676025390625, 0.51934814453125, 0.5393295288085938, 0.5593109130859375, 0.5792922973632812, 0.599273681640625, 0.6192550659179688, 0.6392364501953125, 0.6592178344726562, 0.67919921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 13.0, 10.0, 12.0, 19.0, 19.0, 30.0, 21.0, 52.0, 46.0, 71.0, 87.0, 95.0, 88.0, 74.0, 57.0, 46.0, 40.0, 42.0, 34.0, 24.0, 14.0, 23.0, 15.0, 10.0, 6.0, 11.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0966796875, -1.0644149780273438, -1.0321502685546875, -0.9998855590820312, -0.967620849609375, -0.9353561401367188, -0.9030914306640625, -0.8708267211914062, -0.83856201171875, -0.8062973022460938, -0.7740325927734375, -0.7417678833007812, -0.709503173828125, -0.6772384643554688, -0.6449737548828125, -0.6127090454101562, -0.5804443359375, -0.5481796264648438, -0.5159149169921875, -0.48365020751953125, -0.451385498046875, -0.41912078857421875, -0.3868560791015625, -0.35459136962890625, -0.32232666015625, -0.29006195068359375, -0.2577972412109375, -0.22553253173828125, -0.193267822265625, -0.16100311279296875, -0.1287384033203125, -0.09647369384765625, -0.064208984375, -0.03194427490234375, 0.0003204345703125, 0.03258514404296875, 0.064849853515625, 0.09711456298828125, 0.1293792724609375, 0.16164398193359375, 0.19390869140625, 0.22617340087890625, 0.2584381103515625, 0.29070281982421875, 0.322967529296875, 0.35523223876953125, 0.3874969482421875, 0.41976165771484375, 0.4520263671875, 0.48429107666015625, 0.5165557861328125, 0.5488204956054688, 0.581085205078125, 0.6133499145507812, 0.6456146240234375, 0.6778793334960938, 0.71014404296875, 0.7424087524414062, 0.7746734619140625, 0.8069381713867188, 0.839202880859375, 0.8714675903320312, 0.9037322998046875, 0.9359970092773438, 0.96826171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 10.0, 9.0, 8.0, 11.0, 9.0, 13.0, 27.0, 34.0, 58.0, 94.0, 195.0, 397.0, 824.0, 2592.0, 11199.0, 112698.0, 887798.0, 25612.0, 4581.0, 1274.0, 496.0, 254.0, 118.0, 67.0, 48.0, 33.0, 28.0, 21.0, 11.0, 10.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.07623291015625, -0.0737905502319336, -0.07134819030761719, -0.06890583038330078, -0.06646347045898438, -0.06402111053466797, -0.06157875061035156, -0.059136390686035156, -0.05669403076171875, -0.054251670837402344, -0.05180931091308594, -0.04936695098876953, -0.046924591064453125, -0.04448223114013672, -0.04203987121582031, -0.039597511291503906, -0.0371551513671875, -0.034712791442871094, -0.03227043151855469, -0.02982807159423828, -0.027385711669921875, -0.02494335174560547, -0.022500991821289062, -0.020058631896972656, -0.01761627197265625, -0.015173912048339844, -0.012731552124023438, -0.010289192199707031, -0.007846832275390625, -0.005404472351074219, -0.0029621124267578125, -0.0005197525024414062, 0.001922607421875, 0.004364967346191406, 0.0068073272705078125, 0.009249687194824219, 0.011692047119140625, 0.014134407043457031, 0.016576766967773438, 0.019019126892089844, 0.02146148681640625, 0.023903846740722656, 0.026346206665039062, 0.02878856658935547, 0.031230926513671875, 0.03367328643798828, 0.03611564636230469, 0.038558006286621094, 0.0410003662109375, 0.043442726135253906, 0.04588508605957031, 0.04832744598388672, 0.050769805908203125, 0.05321216583251953, 0.05565452575683594, 0.058096885681152344, 0.06053924560546875, 0.06298160552978516, 0.06542396545410156, 0.06786632537841797, 0.07030868530273438, 0.07275104522705078, 0.07519340515136719, 0.0776357650756836, 0.080078125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 2.0, 4.0, 4.0, 2.0, 6.0, 2.0, 5.0, 4.0, 5.0, 18.0, 12.0, 15.0, 19.0, 27.0, 24.0, 34.0, 37.0, 34.0, 59.0, 69.0, 76.0, 55.0, 73.0, 57.0, 56.0, 52.0, 40.0, 37.0, 32.0, 25.0, 26.0, 13.0, 18.0, 6.0, 4.0, 6.0, 10.0, 5.0, 6.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0], "bins": [-2.9981136322021484e-05, -2.916250377893448e-05, -2.8343871235847473e-05, -2.7525238692760468e-05, -2.6706606149673462e-05, -2.5887973606586456e-05, -2.506934106349945e-05, -2.4250708520412445e-05, -2.343207597732544e-05, -2.2613443434238434e-05, -2.1794810891151428e-05, -2.0976178348064423e-05, -2.0157545804977417e-05, -1.933891326189041e-05, -1.8520280718803406e-05, -1.77016481757164e-05, -1.6883015632629395e-05, -1.606438308954239e-05, -1.5245750546455383e-05, -1.4427118003368378e-05, -1.3608485460281372e-05, -1.2789852917194366e-05, -1.197122037410736e-05, -1.1152587831020355e-05, -1.033395528793335e-05, -9.515322744846344e-06, -8.696690201759338e-06, -7.878057658672333e-06, -7.059425115585327e-06, -6.2407925724983215e-06, -5.422160029411316e-06, -4.60352748632431e-06, -3.7848949432373047e-06, -2.966262400150299e-06, -2.1476298570632935e-06, -1.3289973139762878e-06, -5.103647708892822e-07, 3.082677721977234e-07, 1.126900315284729e-06, 1.9455328583717346e-06, 2.7641654014587402e-06, 3.582797944545746e-06, 4.4014304876327515e-06, 5.220063030719757e-06, 6.038695573806763e-06, 6.857328116893768e-06, 7.675960659980774e-06, 8.49459320306778e-06, 9.313225746154785e-06, 1.013185828924179e-05, 1.0950490832328796e-05, 1.1769123375415802e-05, 1.2587755918502808e-05, 1.3406388461589813e-05, 1.4225021004676819e-05, 1.5043653547763824e-05, 1.586228609085083e-05, 1.6680918633937836e-05, 1.749955117702484e-05, 1.8318183720111847e-05, 1.9136816263198853e-05, 1.9955448806285858e-05, 2.0774081349372864e-05, 2.159271389245987e-05, 2.2411346435546875e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 10.0, 13.0, 11.0, 24.0, 27.0, 45.0, 73.0, 92.0, 99.0, 171.0, 315.0, 482.0, 818.0, 1430.0, 2653.0, 5172.0, 11522.0, 29715.0, 129760.0, 769622.0, 60892.0, 19032.0, 7876.0, 3832.0, 1965.0, 1100.0, 635.0, 379.0, 271.0, 164.0, 103.0, 71.0, 48.0, 38.0, 19.0, 22.0, 9.0, 9.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0345458984375, -0.03344154357910156, -0.032337188720703125, -0.031232833862304688, -0.03012847900390625, -0.029024124145507812, -0.027919769287109375, -0.026815414428710938, -0.0257110595703125, -0.024606704711914062, -0.023502349853515625, -0.022397994995117188, -0.02129364013671875, -0.020189285278320312, -0.019084930419921875, -0.017980575561523438, -0.016876220703125, -0.015771865844726562, -0.014667510986328125, -0.013563156127929688, -0.01245880126953125, -0.011354446411132812, -0.010250091552734375, -0.009145736694335938, -0.0080413818359375, -0.0069370269775390625, -0.005832672119140625, -0.0047283172607421875, -0.00362396240234375, -0.0025196075439453125, -0.001415252685546875, -0.0003108978271484375, 0.00079345703125, 0.0018978118896484375, 0.003002166748046875, 0.0041065216064453125, 0.00521087646484375, 0.0063152313232421875, 0.007419586181640625, 0.008523941040039062, 0.0096282958984375, 0.010732650756835938, 0.011837005615234375, 0.012941360473632812, 0.01404571533203125, 0.015150070190429688, 0.016254425048828125, 0.017358779907226562, 0.018463134765625, 0.019567489624023438, 0.020671844482421875, 0.021776199340820312, 0.02288055419921875, 0.023984909057617188, 0.025089263916015625, 0.026193618774414062, 0.0272979736328125, 0.028402328491210938, 0.029506683349609375, 0.030611038208007812, 0.03171539306640625, 0.03281974792480469, 0.033924102783203125, 0.03502845764160156, 0.0361328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 6.0, 12.0, 12.0, 13.0, 18.0, 16.0, 31.0, 36.0, 49.0, 64.0, 78.0, 111.0, 127.0, 95.0, 63.0, 48.0, 27.0, 23.0, 26.0, 18.0, 17.0, 11.0, 10.0, 15.0, 9.0, 6.0, 2.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.06610107421875, -0.06426668167114258, -0.062432289123535156, -0.060597896575927734, -0.05876350402832031, -0.05692911148071289, -0.05509471893310547, -0.05326032638549805, -0.051425933837890625, -0.0495915412902832, -0.04775714874267578, -0.04592275619506836, -0.04408836364746094, -0.042253971099853516, -0.040419578552246094, -0.03858518600463867, -0.03675079345703125, -0.03491640090942383, -0.033082008361816406, -0.031247615814208984, -0.029413223266601562, -0.02757883071899414, -0.02574443817138672, -0.023910045623779297, -0.022075653076171875, -0.020241260528564453, -0.01840686798095703, -0.01657247543334961, -0.014738082885742188, -0.012903690338134766, -0.011069297790527344, -0.009234905242919922, -0.0074005126953125, -0.005566120147705078, -0.0037317276000976562, -0.0018973350524902344, -6.29425048828125e-05, 0.0017714500427246094, 0.0036058425903320312, 0.005440235137939453, 0.007274627685546875, 0.009109020233154297, 0.010943412780761719, 0.01277780532836914, 0.014612197875976562, 0.016446590423583984, 0.018280982971191406, 0.020115375518798828, 0.02194976806640625, 0.023784160614013672, 0.025618553161621094, 0.027452945709228516, 0.029287338256835938, 0.03112173080444336, 0.03295612335205078, 0.0347905158996582, 0.036624908447265625, 0.03845930099487305, 0.04029369354248047, 0.04212808609008789, 0.04396247863769531, 0.045796871185302734, 0.047631263732910156, 0.04946565628051758, 0.051300048828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 24.0, 27.0, 54.0, 146.0, 478.0, 98.0, 59.0, 30.0, 22.0, 13.0, 12.0, 6.0, 8.0, 6.0, 1.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4051713943481445, -1.3128323554992676, -1.2204933166503906, -1.1281542778015137, -1.0358152389526367, -0.9434762001037598, -0.8511371612548828, -0.7587981224060059, -0.6664590835571289, -0.574120044708252, -0.481781005859375, -0.38944196701049805, -0.2971029281616211, -0.20476388931274414, -0.11242485046386719, -0.020085811614990234, 0.07225322723388672, 0.16459226608276367, 0.2569313049316406, 0.3492703437805176, 0.44160938262939453, 0.5339484214782715, 0.6262874603271484, 0.7186264991760254, 0.8109655380249023, 0.9033045768737793, 0.9956436157226562, 1.0879826545715332, 1.1803216934204102, 1.272660732269287, 1.364999771118164, 1.457338809967041, 1.549677848815918, 1.642016887664795, 1.7343559265136719, 1.8266949653625488, 1.9190340042114258, 2.0113730430603027, 2.1037120819091797, 2.1960511207580566, 2.2883901596069336, 2.3807291984558105, 2.4730682373046875, 2.5654072761535645, 2.6577463150024414, 2.7500853538513184, 2.8424243927001953, 2.9347634315490723, 3.027102470397949, 3.119441509246826, 3.211780548095703, 3.30411958694458, 3.396458625793457, 3.488797664642334, 3.581136703491211, 3.673475742340088, 3.765814781188965, 3.858153820037842, 3.9504928588867188, 4.042831897735596, 4.135170936584473, 4.22750997543335, 4.319849014282227, 4.4121880531311035, 4.5045270919799805]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 8.0, 2.0, 6.0, 11.0, 8.0, 8.0, 15.0, 17.0, 17.0, 26.0, 25.0, 30.0, 39.0, 40.0, 168.0, 303.0, 46.0, 37.0, 33.0, 14.0, 28.0, 20.0, 11.0, 13.0, 19.0, 8.0, 5.0, 8.0, 7.0, 6.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.8578991889953613, -2.7718162536621094, -2.6857330799102783, -2.5996501445770264, -2.5135669708251953, -2.4274840354919434, -2.3414011001586914, -2.2553181648254395, -2.1692349910736084, -2.0831520557403564, -1.9970688819885254, -1.9109859466552734, -1.824902892112732, -1.7388198375701904, -1.6527369022369385, -1.566653847694397, -1.4805707931518555, -1.394487738609314, -1.3084046840667725, -1.2223217487335205, -1.136238694190979, -1.0501556396484375, -0.9640726447105408, -0.877989649772644, -0.7919065952301025, -0.705823540687561, -0.6197405457496643, -0.5336575508117676, -0.4475744962692261, -0.36149147152900696, -0.27540844678878784, -0.1893254518508911, -0.10324215888977051, -0.01715913414955139, 0.06892389059066772, 0.15500691533088684, 0.24108994007110596, 0.3271729648113251, 0.4132559895515442, 0.4993389844894409, 0.5854220390319824, 0.6715050935745239, 0.7575880885124207, 0.8436710834503174, 0.9297541379928589, 1.0158371925354004, 1.1019201278686523, 1.1880031824111938, 1.2740862369537354, 1.3601692914962769, 1.4462523460388184, 1.5323352813720703, 1.6184183359146118, 1.7045013904571533, 1.7905843257904053, 1.8766673803329468, 1.9627504348754883, 2.0488333702087402, 2.1349165439605713, 2.2209994792938232, 2.3070826530456543, 2.3931655883789062, 2.479248523712158, 2.56533145904541, 2.651414632797241]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 10.0, 10.0, 9.0, 9.0, 25.0, 23.0, 25.0, 26.0, 47.0, 47.0, 59.0, 261.0, 147.0, 55.0, 37.0, 34.0, 29.0, 26.0, 30.0, 25.0, 21.0, 10.0, 6.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296630859375, -0.2883739471435547, -0.2801170349121094, -0.27186012268066406, -0.26360321044921875, -0.25534629821777344, -0.24708938598632812, -0.2388324737548828, -0.2305755615234375, -0.2223186492919922, -0.21406173706054688, -0.20580482482910156, -0.19754791259765625, -0.18929100036621094, -0.18103408813476562, -0.1727771759033203, -0.164520263671875, -0.1562633514404297, -0.14800643920898438, -0.13974952697753906, -0.13149261474609375, -0.12323570251464844, -0.11497879028320312, -0.10672187805175781, -0.0984649658203125, -0.09020805358886719, -0.08195114135742188, -0.07369422912597656, -0.06543731689453125, -0.05718040466308594, -0.048923492431640625, -0.04066658020019531, -0.03240966796875, -0.024152755737304688, -0.015895843505859375, -0.0076389312744140625, 0.00061798095703125, 0.008874893188476562, 0.017131805419921875, 0.025388717651367188, 0.0336456298828125, 0.04190254211425781, 0.050159454345703125, 0.05841636657714844, 0.06667327880859375, 0.07493019104003906, 0.08318710327148438, 0.09144401550292969, 0.099700927734375, 0.10795783996582031, 0.11621475219726562, 0.12447166442871094, 0.13272857666015625, 0.14098548889160156, 0.14924240112304688, 0.1574993133544922, 0.1657562255859375, 0.1740131378173828, 0.18227005004882812, 0.19052696228027344, 0.19878387451171875, 0.20704078674316406, 0.21529769897460938, 0.2235546112060547, 0.2318115234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 8.0, 4.0, 0.0, 0.0, 11.0, 2.0, 1.0, 1.0, 5.0, 13.0, 11.0, 34.0, 40.0, 58.0, 121.0, 533.0, 7728.0, 8375851.0, 3450.0, 464.0, 106.0, 45.0, 23.0, 17.0, 24.0, 13.0, 3.0, 5.0, 12.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-4.04733943939209, -3.904789686203003, -3.762239933013916, -3.619690179824829, -3.477140426635742, -3.3345906734466553, -3.1920409202575684, -3.0494911670684814, -2.9069414138793945, -2.7643916606903076, -2.6218419075012207, -2.479292154312134, -2.336742401123047, -2.19419264793396, -2.051642894744873, -1.9090931415557861, -1.7665433883666992, -1.6239936351776123, -1.4814438819885254, -1.3388941287994385, -1.1963443756103516, -1.0537946224212646, -0.9112448692321777, -0.7686951160430908, -0.6261453628540039, -0.483595609664917, -0.3410458564758301, -0.19849610328674316, -0.05594635009765625, 0.08660340309143066, 0.22915315628051758, 0.3717029094696045, 0.5142531394958496, 0.6568028926849365, 0.7993526458740234, 0.9419023990631104, 1.0844521522521973, 1.2270019054412842, 1.369551658630371, 1.512101411819458, 1.654651165008545, 1.7972009181976318, 1.9397506713867188, 2.0823004245758057, 2.2248501777648926, 2.3673999309539795, 2.5099496841430664, 2.6524994373321533, 2.7950491905212402, 2.937598943710327, 3.080148696899414, 3.222698450088501, 3.365248203277588, 3.507797956466675, 3.6503477096557617, 3.7928974628448486, 3.9354472160339355, 4.077997207641602, 4.220546722412109, 4.363096237182617, 4.505646228790283, 4.648196220397949, 4.790745735168457, 4.933295249938965, 5.075845241546631]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 3.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.315582275390625, -2.2522382736206055, -2.188894033432007, -2.1255500316619873, -2.0622057914733887, -1.9988617897033691, -1.9355177879333496, -1.8721736669540405, -1.8088295459747314, -1.7454854249954224, -1.6821413040161133, -1.6187973022460938, -1.5554531812667847, -1.4921090602874756, -1.428765058517456, -1.365420937538147, -1.302076816558838, -1.2387326955795288, -1.1753885746002197, -1.1120445728302002, -1.0487004518508911, -0.985356330871582, -0.9220122694969177, -0.8586682081222534, -0.7953240871429443, -0.7319799661636353, -0.668635904788971, -0.6052918434143066, -0.5419477224349976, -0.47860363125801086, -0.41525954008102417, -0.3519154489040375, -0.2885715961456299, -0.2252275049686432, -0.1618834137916565, -0.0985393226146698, -0.035195231437683105, 0.02814885973930359, 0.09149295091629028, 0.15483704209327698, 0.21818113327026367, 0.28152522444725037, 0.34486931562423706, 0.40821340680122375, 0.47155749797821045, 0.5349016189575195, 0.5982456803321838, 0.6615897417068481, 0.7249338626861572, 0.7882779836654663, 0.8516220450401306, 0.9149661064147949, 0.978310227394104, 1.041654348373413, 1.1049983501434326, 1.1683424711227417, 1.2316865921020508, 1.2950307130813599, 1.358374834060669, 1.4217188358306885, 1.4850629568099976, 1.5484070777893066, 1.6117510795593262, 1.6750952005386353, 1.7384393215179443]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 4.0, 8.0, 4.0, 6.0, 12.0, 21.0, 31.0, 36.0, 49.0, 64.0, 101.0, 180.0, 290.0, 558.0, 1624.0, 6994.0, 43752.0, 289248.0, 154532.0, 20601.0, 3944.0, 1093.0, 465.0, 239.0, 142.0, 78.0, 55.0, 37.0, 24.0, 19.0, 15.0, 9.0, 3.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.40625, -2.328125, -2.25, -2.171875, -2.09375, -2.015625, -1.9375, -1.859375, -1.78125, -1.703125, -1.625, -1.546875, -1.46875, -1.390625, -1.3125, -1.234375, -1.15625, -1.078125, -1.0, -0.921875, -0.84375, -0.765625, -0.6875, -0.609375, -0.53125, -0.453125, -0.375, -0.296875, -0.21875, -0.140625, -0.0625, 0.015625, 0.09375, 0.171875, 0.25, 0.328125, 0.40625, 0.484375, 0.5625, 0.640625, 0.71875, 0.796875, 0.875, 0.953125, 1.03125, 1.109375, 1.1875, 1.265625, 1.34375, 1.421875, 1.5, 1.578125, 1.65625, 1.734375, 1.8125, 1.890625, 1.96875, 2.046875, 2.125, 2.203125, 2.28125, 2.359375, 2.4375, 2.515625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 18.0, 20.0, 28.0, 51.0, 75.0, 123.0, 159.0, 154.0, 127.0, 95.0, 55.0, 45.0, 25.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7945938110351562, -0.7752227783203125, -0.7558517456054688, -0.736480712890625, -0.7171096801757812, -0.6977386474609375, -0.6783676147460938, -0.65899658203125, -0.6396255493164062, -0.6202545166015625, -0.6008834838867188, -0.581512451171875, -0.5621414184570312, -0.5427703857421875, -0.5233993530273438, -0.5040283203125, -0.48465728759765625, -0.4652862548828125, -0.44591522216796875, -0.426544189453125, -0.40717315673828125, -0.3878021240234375, -0.36843109130859375, -0.34906005859375, -0.32968902587890625, -0.3103179931640625, -0.29094696044921875, -0.271575927734375, -0.25220489501953125, -0.2328338623046875, -0.21346282958984375, -0.194091796875, -0.17472076416015625, -0.1553497314453125, -0.13597869873046875, -0.116607666015625, -0.09723663330078125, -0.0778656005859375, -0.05849456787109375, -0.03912353515625, -0.01975250244140625, -0.0003814697265625, 0.01898956298828125, 0.038360595703125, 0.05773162841796875, 0.0771026611328125, 0.09647369384765625, 0.1158447265625, 0.13521575927734375, 0.1545867919921875, 0.17395782470703125, 0.193328857421875, 0.21269989013671875, 0.2320709228515625, 0.25144195556640625, 0.27081298828125, 0.29018402099609375, 0.3095550537109375, 0.32892608642578125, 0.348297119140625, 0.36766815185546875, 0.3870391845703125, 0.40641021728515625, 0.42578125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 2.0, 9.0, 8.0, 18.0, 27.0, 60.0, 80.0, 76.0, 71.0, 58.0, 22.0, 12.0, 11.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.408954620361328, -2.3510591983795166, -2.293164014816284, -2.2352685928344727, -2.177373170852661, -2.1194777488708496, -2.061582565307617, -2.0036871433258057, -1.9457917213439941, -1.8878964185714722, -1.8300009965896606, -1.7721056938171387, -1.7142102718353271, -1.6563149690628052, -1.5984196662902832, -1.5405242443084717, -1.4826289415359497, -1.4247336387634277, -1.3668382167816162, -1.3089429140090942, -1.2510474920272827, -1.1931521892547607, -1.1352567672729492, -1.0773614645004272, -1.0194661617279053, -0.9615707993507385, -0.9036754369735718, -0.8457801342010498, -0.7878847122192383, -0.7299894094467163, -0.6720940470695496, -0.6141986846923828, -0.5563031435012817, -0.498407781124115, -0.44051241874694824, -0.3826170861721039, -0.32472172379493713, -0.2668263614177704, -0.20893102884292603, -0.15103566646575928, -0.09314030408859253, -0.03524494916200638, 0.022650405764579773, 0.08054575324058533, 0.13844111561775208, 0.19633647799491882, 0.2542318105697632, 0.31212717294692993, 0.3700225353240967, 0.4279178977012634, 0.4858132600784302, 0.5437085628509521, 0.6016039848327637, 0.6594992876052856, 0.7173946499824524, 0.7752900123596191, 0.8331853747367859, 0.8910807371139526, 0.9489760994911194, 1.0068714618682861, 1.064766764640808, 1.1226621866226196, 1.1805574893951416, 1.2384529113769531, 1.296348214149475]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 9.0, 5.0, 33.0, 72.0, 124.0, 91.0, 62.0, 30.0, 14.0, 12.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.102263927459717, -2.031590700149536, -1.960917353630066, -1.8902440071105957, -1.819570779800415, -1.7488974332809448, -1.6782240867614746, -1.607550859451294, -1.5368775129318237, -1.4662041664123535, -1.3955309391021729, -1.3248575925827026, -1.2541842460632324, -1.1835110187530518, -1.1128376722335815, -1.0421643257141113, -0.9714910984039307, -0.9008178114891052, -0.8301445245742798, -0.7594711780548096, -0.6887978911399841, -0.6181246042251587, -0.5474512577056885, -0.47677797079086304, -0.4061046838760376, -0.33543139696121216, -0.26475808024406433, -0.1940847784280777, -0.12341147661209106, -0.052738189697265625, 0.017935127019882202, 0.08860844373703003, 0.15928173065185547, 0.2299550324678421, 0.30062833428382874, 0.37130165100097656, 0.441974937915802, 0.5126482248306274, 0.5833215713500977, 0.6539948582649231, 0.7246681451797485, 0.795341432094574, 0.8660147190093994, 0.9366880655288696, 1.0073614120483398, 1.0780346393585205, 1.1487079858779907, 1.219381332397461, 1.2900545597076416, 1.3607279062271118, 1.4314011335372925, 1.5020744800567627, 1.5727477073669434, 1.6434210538864136, 1.7140944004058838, 1.7847676277160645, 1.8554409742355347, 1.9261143207550049, 1.9967875480651855, 2.067460775375366, 2.138134241104126, 2.2088074684143066, 2.2794806957244873, 2.350154161453247, 2.4208273887634277]}, "eval/loss": 4.170833587646484, "eval/wer": 1.9509520031733438, "eval/runtime": 786.0537, "eval/samples_per_second": 3.361, "eval/steps_per_second": 0.281, "train/train_runtime": 5681.1629, "train/train_samples_per_second": 5.023, "train/train_steps_per_second": 0.105, "train/total_flos": 0.0, "train/train_loss": 4.265389429599749} \ No newline at end of file