diff --git "a/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" "b/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220301_103527-1wkgn37c/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3047, "train/learning_rate": 2.982e-05, "train/epoch": 0.84, "train/global_step": 500, "_runtime": 4780, "_timestamp": 1646135707, "_step": 500, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 10.0, 25.0, 89.0, 201.0, 274.0, 207.0, 129.0, 61.0, 14.0, 2.0, 3.0], "bins": [-159.7316436767578, -156.95663452148438, -154.181640625, -151.40663146972656, -148.63162231445312, -145.8566131591797, -143.0816192626953, -140.30661010742188, -137.53160095214844, -134.756591796875, -131.98159790039062, -129.2065887451172, -126.43157958984375, -123.65657806396484, -120.88157653808594, -118.1065673828125, -115.3315658569336, -112.55656433105469, -109.78155517578125, -107.00655364990234, -104.2315444946289, -101.45654296875, -98.68153381347656, -95.90653228759766, -93.13153076171875, -90.35652923583984, -87.5815200805664, -84.8065185546875, -82.03150939941406, -79.25650787353516, -76.48150634765625, -73.70649719238281, -70.93148803710938, -68.15648651123047, -65.38147735595703, -62.606475830078125, -59.83146667480469, -57.05646514892578, -54.28145980834961, -51.50645446777344, -48.731449127197266, -45.956443786621094, -43.18143844604492, -40.40643310546875, -37.631431579589844, -34.856422424316406, -32.0814208984375, -29.306415557861328, -26.531410217285156, -23.756404876708984, -20.981399536132812, -18.206396102905273, -15.431390762329102, -12.65638542175293, -9.88138198852539, -7.106376647949219, -4.331371307373047, -1.5563664436340332, 1.2186384201049805, 3.993642807006836, 6.768648147583008, 9.54365348815918, 12.318656921386719, 15.09366226196289, 17.868667602539062]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 3.0, 7.0, 11.0, 11.0, 13.0, 14.0, 12.0, 23.0, 21.0, 23.0, 42.0, 37.0, 53.0, 48.0, 58.0, 57.0, 72.0, 58.0, 64.0, 50.0, 41.0, 47.0, 42.0, 27.0, 30.0, 26.0, 21.0, 22.0, 19.0, 14.0, 6.0, 3.0, 13.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.47561645507812, -69.17546081542969, -66.87531280517578, -64.57515716552734, -62.275001525878906, -59.974849700927734, -57.67469787597656, -55.374542236328125, -53.07438659667969, -50.774234771728516, -48.47407913208008, -46.173927307128906, -43.87377166748047, -41.5736198425293, -39.273468017578125, -36.97331237792969, -34.673160552978516, -32.373008728027344, -30.072853088378906, -27.772701263427734, -25.472545623779297, -23.172393798828125, -20.87224006652832, -18.572086334228516, -16.27193260192871, -13.971778869628906, -11.671625137329102, -9.371472358703613, -7.071318626403809, -4.771164894104004, -2.4710121154785156, -0.17085838317871094, 2.1292953491210938, 4.429449081420898, 6.729602336883545, 9.029755592346191, 11.329909324645996, 13.6300630569458, 15.930215835571289, 18.230369567871094, 20.5305233001709, 22.830677032470703, 25.130830764770508, 27.430984497070312, 29.731136322021484, 32.03129196166992, 34.331443786621094, 36.63159942626953, 38.9317512512207, 41.231903076171875, 43.53205871582031, 45.832210540771484, 48.13236618041992, 50.432518005371094, 52.73267364501953, 55.0328254699707, 57.332977294921875, 59.63312911987305, 61.933284759521484, 64.23343658447266, 66.5335922241211, 68.83374786376953, 71.13389587402344, 73.43405151367188, 75.73420715332031]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 7.0, 11.0, 15.0, 13.0, 14.0, 25.0, 22.0, 24.0, 30.0, 37.0, 49.0, 57.0, 48.0, 48.0, 64.0, 60.0, 52.0, 51.0, 51.0, 52.0, 36.0, 28.0, 30.0, 21.0, 33.0, 10.0, 18.0, 12.0, 11.0, 16.0, 11.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.72955322265625, -3.5919189453125, -3.45428466796875, -3.316650390625, -3.17901611328125, -3.0413818359375, -2.90374755859375, -2.76611328125, -2.62847900390625, -2.4908447265625, -2.35321044921875, -2.215576171875, -2.07794189453125, -1.9403076171875, -1.80267333984375, -1.6650390625, -1.52740478515625, -1.3897705078125, -1.25213623046875, -1.114501953125, -0.97686767578125, -0.8392333984375, -0.70159912109375, -0.56396484375, -0.42633056640625, -0.2886962890625, -0.15106201171875, -0.013427734375, 0.12420654296875, 0.2618408203125, 0.39947509765625, 0.537109375, 0.67474365234375, 0.8123779296875, 0.95001220703125, 1.087646484375, 1.22528076171875, 1.3629150390625, 1.50054931640625, 1.63818359375, 1.77581787109375, 1.9134521484375, 2.05108642578125, 2.188720703125, 2.32635498046875, 2.4639892578125, 2.60162353515625, 2.7392578125, 2.87689208984375, 3.0145263671875, 3.15216064453125, 3.289794921875, 3.42742919921875, 3.5650634765625, 3.70269775390625, 3.84033203125, 3.97796630859375, 4.1156005859375, 4.25323486328125, 4.390869140625, 4.52850341796875, 4.6661376953125, 4.80377197265625, 4.94140625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 14.0, 13.0, 16.0, 23.0, 27.0, 43.0, 59.0, 83.0, 124.0, 207.0, 315.0, 496.0, 859.0, 1490.0, 2865.0, 6509.0, 18137.0, 74813.0, 592136.0, 2777785.0, 611157.0, 75542.0, 18610.0, 6385.0, 2814.0, 1469.0, 858.0, 482.0, 329.0, 198.0, 114.0, 81.0, 65.0, 56.0, 30.0, 19.0, 18.0, 15.0, 9.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.2989501953125, -10.902587890625, -10.5062255859375, -10.10986328125, -9.7135009765625, -9.317138671875, -8.9207763671875, -8.5244140625, -8.1280517578125, -7.731689453125, -7.3353271484375, -6.93896484375, -6.5426025390625, -6.146240234375, -5.7498779296875, -5.353515625, -4.9571533203125, -4.560791015625, -4.1644287109375, -3.76806640625, -3.3717041015625, -2.975341796875, -2.5789794921875, -2.1826171875, -1.7862548828125, -1.389892578125, -0.9935302734375, -0.59716796875, -0.2008056640625, 0.195556640625, 0.5919189453125, 0.98828125, 1.3846435546875, 1.781005859375, 2.1773681640625, 2.57373046875, 2.9700927734375, 3.366455078125, 3.7628173828125, 4.1591796875, 4.5555419921875, 4.951904296875, 5.3482666015625, 5.74462890625, 6.1409912109375, 6.537353515625, 6.9337158203125, 7.330078125, 7.7264404296875, 8.122802734375, 8.5191650390625, 8.91552734375, 9.3118896484375, 9.708251953125, 10.1046142578125, 10.5009765625, 10.8973388671875, 11.293701171875, 11.6900634765625, 12.08642578125, 12.4827880859375, 12.879150390625, 13.2755126953125, 13.671875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 11.0, 8.0, 16.0, 33.0, 30.0, 84.0, 112.0, 214.0, 400.0, 631.0, 878.0, 714.0, 427.0, 227.0, 132.0, 65.0, 44.0, 27.0, 11.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-37.90625, -37.126953125, -36.34765625, -35.568359375, -34.7890625, -34.009765625, -33.23046875, -32.451171875, -31.671875, -30.892578125, -30.11328125, -29.333984375, -28.5546875, -27.775390625, -26.99609375, -26.216796875, -25.4375, -24.658203125, -23.87890625, -23.099609375, -22.3203125, -21.541015625, -20.76171875, -19.982421875, -19.203125, -18.423828125, -17.64453125, -16.865234375, -16.0859375, -15.306640625, -14.52734375, -13.748046875, -12.96875, -12.189453125, -11.41015625, -10.630859375, -9.8515625, -9.072265625, -8.29296875, -7.513671875, -6.734375, -5.955078125, -5.17578125, -4.396484375, -3.6171875, -2.837890625, -2.05859375, -1.279296875, -0.5, 0.279296875, 1.05859375, 1.837890625, 2.6171875, 3.396484375, 4.17578125, 4.955078125, 5.734375, 6.513671875, 7.29296875, 8.072265625, 8.8515625, 9.630859375, 10.41015625, 11.189453125, 11.96875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 15.0, 47.0, 96.0, 204.0, 550.0, 1421.0, 15083.0, 4158904.0, 15713.0, 1382.0, 476.0, 230.0, 71.0, 46.0, 23.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.0625, -120.466796875, -116.87109375, -113.275390625, -109.6796875, -106.083984375, -102.48828125, -98.892578125, -95.296875, -91.701171875, -88.10546875, -84.509765625, -80.9140625, -77.318359375, -73.72265625, -70.126953125, -66.53125, -62.935546875, -59.33984375, -55.744140625, -52.1484375, -48.552734375, -44.95703125, -41.361328125, -37.765625, -34.169921875, -30.57421875, -26.978515625, -23.3828125, -19.787109375, -16.19140625, -12.595703125, -9.0, -5.404296875, -1.80859375, 1.787109375, 5.3828125, 8.978515625, 12.57421875, 16.169921875, 19.765625, 23.361328125, 26.95703125, 30.552734375, 34.1484375, 37.744140625, 41.33984375, 44.935546875, 48.53125, 52.126953125, 55.72265625, 59.318359375, 62.9140625, 66.509765625, 70.10546875, 73.701171875, 77.296875, 80.892578125, 84.48828125, 88.083984375, 91.6796875, 95.275390625, 98.87109375, 102.466796875, 106.0625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 74.0, 443.0, 436.0, 56.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.867191314697266, -27.192401885986328, -20.51761245727539, -13.842823028564453, -7.168033599853516, -0.4932441711425781, 6.181545257568359, 12.856334686279297, 19.531124114990234, 26.205913543701172, 32.88070297241211, 39.55549240112305, 46.230281829833984, 52.90507125854492, 59.57986068725586, 66.25465393066406, 72.929443359375, 79.60423278808594, 86.27902221679688, 92.95381164550781, 99.62860107421875, 106.30339050292969, 112.97817993164062, 119.65296936035156, 126.3277587890625, 133.00254821777344, 139.67733764648438, 146.3521270751953, 153.02691650390625, 159.7017059326172, 166.37649536132812, 173.05128479003906, 179.72607421875, 186.40086364746094, 193.07565307617188, 199.7504425048828, 206.42523193359375, 213.1000213623047, 219.77481079101562, 226.44960021972656, 233.1243896484375, 239.79917907714844, 246.47396850585938, 253.1487579345703, 259.82354736328125, 266.49835205078125, 273.1731262207031, 279.847900390625, 286.522705078125, 293.197509765625, 299.8722839355469, 306.54705810546875, 313.22186279296875, 319.89666748046875, 326.5714416503906, 333.2462158203125, 339.9210205078125, 346.5958251953125, 353.2705993652344, 359.94537353515625, 366.62017822265625, 373.29498291015625, 379.9697570800781, 386.64453125, 393.3193359375]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 11.0, 10.0, 10.0, 14.0, 12.0, 9.0, 18.0, 18.0, 15.0, 22.0, 27.0, 28.0, 25.0, 44.0, 38.0, 33.0, 38.0, 38.0, 28.0, 48.0, 46.0, 42.0, 44.0, 36.0, 37.0, 36.0, 34.0, 31.0, 27.0, 18.0, 21.0, 21.0, 15.0, 10.0, 18.0, 11.0, 9.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-45.879852294921875, -44.38687515258789, -42.893898010253906, -41.40092468261719, -39.9079475402832, -38.41497039794922, -36.921993255615234, -35.42901611328125, -33.93604278564453, -32.44306564331055, -30.950090408325195, -29.45711326599121, -27.96413803100586, -26.471160888671875, -24.97818374633789, -23.485206604003906, -21.992229461669922, -20.499252319335938, -19.006277084350586, -17.5132999420166, -16.02032470703125, -14.527347564697266, -13.034370422363281, -11.541394233703613, -10.048418045043945, -8.555441856384277, -7.062465190887451, -5.569488525390625, -4.076512336730957, -2.583536148071289, -1.0905590057373047, 0.4024171829223633, 1.8953933715820312, 3.3883697986602783, 4.881346225738525, 6.374322891235352, 7.8672990798950195, 9.360275268554688, 10.853252410888672, 12.34622859954834, 13.839204788208008, 15.332180976867676, 16.825157165527344, 18.318134307861328, 19.811111450195312, 21.304086685180664, 22.79706382751465, 24.2900390625, 25.783016204833984, 27.27599334716797, 28.76896858215332, 30.261945724487305, 31.754920959472656, 33.24789810180664, 34.740875244140625, 36.23385238647461, 37.726829528808594, 39.21980667114258, 40.71278381347656, 42.20575714111328, 43.698734283447266, 45.19171142578125, 46.684688568115234, 48.17766571044922, 49.67063903808594]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 10.0, 18.0, 13.0, 16.0, 20.0, 25.0, 24.0, 38.0, 34.0, 36.0, 62.0, 54.0, 55.0, 50.0, 47.0, 36.0, 59.0, 61.0, 44.0, 41.0, 42.0, 33.0, 33.0, 19.0, 21.0, 20.0, 20.0, 12.0, 7.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.03729248046875, -3.8792724609375, -3.72125244140625, -3.563232421875, -3.40521240234375, -3.2471923828125, -3.08917236328125, -2.93115234375, -2.77313232421875, -2.6151123046875, -2.45709228515625, -2.299072265625, -2.14105224609375, -1.9830322265625, -1.82501220703125, -1.6669921875, -1.50897216796875, -1.3509521484375, -1.19293212890625, -1.034912109375, -0.87689208984375, -0.7188720703125, -0.56085205078125, -0.40283203125, -0.24481201171875, -0.0867919921875, 0.07122802734375, 0.229248046875, 0.38726806640625, 0.5452880859375, 0.70330810546875, 0.861328125, 1.01934814453125, 1.1773681640625, 1.33538818359375, 1.493408203125, 1.65142822265625, 1.8094482421875, 1.96746826171875, 2.12548828125, 2.28350830078125, 2.4415283203125, 2.59954833984375, 2.757568359375, 2.91558837890625, 3.0736083984375, 3.23162841796875, 3.3896484375, 3.54766845703125, 3.7056884765625, 3.86370849609375, 4.021728515625, 4.17974853515625, 4.3377685546875, 4.49578857421875, 4.65380859375, 4.81182861328125, 4.9698486328125, 5.12786865234375, 5.285888671875, 5.44390869140625, 5.6019287109375, 5.75994873046875, 5.91796875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 2.0, 10.0, 16.0, 15.0, 23.0, 36.0, 57.0, 74.0, 105.0, 166.0, 245.0, 340.0, 484.0, 727.0, 1017.0, 1491.0, 2208.0, 3170.0, 4774.0, 7450.0, 10913.0, 16759.0, 26201.0, 41521.0, 68118.0, 115393.0, 197867.0, 217434.0, 127913.0, 75315.0, 45886.0, 28763.0, 18210.0, 11897.0, 7671.0, 5239.0, 3419.0, 2344.0, 1664.0, 1139.0, 742.0, 563.0, 393.0, 252.0, 175.0, 115.0, 71.0, 59.0, 36.0, 28.0, 14.0, 14.0, 11.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5127487182617188, -0.4957122802734375, -0.47867584228515625, -0.461639404296875, -0.44460296630859375, -0.4275665283203125, -0.41053009033203125, -0.39349365234375, -0.37645721435546875, -0.3594207763671875, -0.34238433837890625, -0.325347900390625, -0.30831146240234375, -0.2912750244140625, -0.27423858642578125, -0.2572021484375, -0.24016571044921875, -0.2231292724609375, -0.20609283447265625, -0.189056396484375, -0.17201995849609375, -0.1549835205078125, -0.13794708251953125, -0.12091064453125, -0.10387420654296875, -0.0868377685546875, -0.06980133056640625, -0.052764892578125, -0.03572845458984375, -0.0186920166015625, -0.00165557861328125, 0.015380859375, 0.03241729736328125, 0.0494537353515625, 0.06649017333984375, 0.083526611328125, 0.10056304931640625, 0.1175994873046875, 0.13463592529296875, 0.15167236328125, 0.16870880126953125, 0.1857452392578125, 0.20278167724609375, 0.219818115234375, 0.23685455322265625, 0.2538909912109375, 0.27092742919921875, 0.2879638671875, 0.30500030517578125, 0.3220367431640625, 0.33907318115234375, 0.356109619140625, 0.37314605712890625, 0.3901824951171875, 0.40721893310546875, 0.42425537109375, 0.44129180908203125, 0.4583282470703125, 0.47536468505859375, 0.492401123046875, 0.5094375610351562, 0.5264739990234375, 0.5435104370117188, 0.560546875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 4.0, 7.0, 11.0, 20.0, 11.0, 16.0, 19.0, 10.0, 20.0, 17.0, 20.0, 24.0, 30.0, 28.0, 37.0, 27.0, 24.0, 44.0, 35.0, 23.0, 1067.0, 41.0, 41.0, 41.0, 33.0, 19.0, 33.0, 34.0, 34.0, 24.0, 24.0, 22.0, 22.0, 24.0, 17.0, 18.0, 16.0, 10.0, 16.0, 8.0, 9.0, 12.0, 5.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0], "bins": [-2.318359375, -2.248077392578125, -2.17779541015625, -2.107513427734375, -2.0372314453125, -1.966949462890625, -1.89666748046875, -1.826385498046875, -1.756103515625, -1.685821533203125, -1.61553955078125, -1.545257568359375, -1.4749755859375, -1.404693603515625, -1.33441162109375, -1.264129638671875, -1.19384765625, -1.123565673828125, -1.05328369140625, -0.983001708984375, -0.9127197265625, -0.842437744140625, -0.77215576171875, -0.701873779296875, -0.631591796875, -0.561309814453125, -0.49102783203125, -0.420745849609375, -0.3504638671875, -0.280181884765625, -0.20989990234375, -0.139617919921875, -0.0693359375, 0.000946044921875, 0.07122802734375, 0.141510009765625, 0.2117919921875, 0.282073974609375, 0.35235595703125, 0.422637939453125, 0.492919921875, 0.563201904296875, 0.63348388671875, 0.703765869140625, 0.7740478515625, 0.844329833984375, 0.91461181640625, 0.984893798828125, 1.05517578125, 1.125457763671875, 1.19573974609375, 1.266021728515625, 1.3363037109375, 1.406585693359375, 1.47686767578125, 1.547149658203125, 1.617431640625, 1.687713623046875, 1.75799560546875, 1.828277587890625, 1.8985595703125, 1.968841552734375, 2.03912353515625, 2.109405517578125, 2.1796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 8.0, 15.0, 15.0, 32.0, 34.0, 58.0, 108.0, 123.0, 184.0, 297.0, 419.0, 654.0, 970.0, 1463.0, 2271.0, 3451.0, 5468.0, 8719.0, 14275.0, 23806.0, 40975.0, 73270.0, 139815.0, 1304336.0, 218335.0, 111604.0, 59760.0, 33617.0, 19958.0, 11942.0, 7446.0, 4740.0, 3014.0, 2027.0, 1307.0, 873.0, 583.0, 399.0, 244.0, 177.0, 120.0, 76.0, 50.0, 38.0, 22.0, 12.0, 10.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.55419921875, -0.5378189086914062, -0.5214385986328125, -0.5050582885742188, -0.488677978515625, -0.47229766845703125, -0.4559173583984375, -0.43953704833984375, -0.42315673828125, -0.40677642822265625, -0.3903961181640625, -0.37401580810546875, -0.357635498046875, -0.34125518798828125, -0.3248748779296875, -0.30849456787109375, -0.2921142578125, -0.27573394775390625, -0.2593536376953125, -0.24297332763671875, -0.226593017578125, -0.21021270751953125, -0.1938323974609375, -0.17745208740234375, -0.16107177734375, -0.14469146728515625, -0.1283111572265625, -0.11193084716796875, -0.095550537109375, -0.07917022705078125, -0.0627899169921875, -0.04640960693359375, -0.030029296875, -0.01364898681640625, 0.0027313232421875, 0.01911163330078125, 0.035491943359375, 0.05187225341796875, 0.0682525634765625, 0.08463287353515625, 0.10101318359375, 0.11739349365234375, 0.1337738037109375, 0.15015411376953125, 0.166534423828125, 0.18291473388671875, 0.1992950439453125, 0.21567535400390625, 0.2320556640625, 0.24843597412109375, 0.2648162841796875, 0.28119659423828125, 0.297576904296875, 0.31395721435546875, 0.3303375244140625, 0.34671783447265625, 0.36309814453125, 0.37947845458984375, 0.3958587646484375, 0.41223907470703125, 0.428619384765625, 0.44499969482421875, 0.4613800048828125, 0.47776031494140625, 0.494140625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 6.0, 13.0, 15.0, 21.0, 22.0, 25.0, 32.0, 45.0, 46.0, 60.0, 76.0, 76.0, 73.0, 65.0, 73.0, 59.0, 52.0, 38.0, 41.0, 27.0, 25.0, 18.0, 15.0, 14.0, 6.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015745162963867188, -0.0015187114477157593, -0.0014629065990447998, -0.0014071017503738403, -0.0013512969017028809, -0.0012954920530319214, -0.001239687204360962, -0.0011838823556900024, -0.001128077507019043, -0.0010722726583480835, -0.001016467809677124, -0.0009606629610061646, -0.0009048581123352051, -0.0008490532636642456, -0.0007932484149932861, -0.0007374435663223267, -0.0006816387176513672, -0.0006258338689804077, -0.0005700290203094482, -0.0005142241716384888, -0.0004584193229675293, -0.0004026144742965698, -0.00034680962562561035, -0.0002910047769546509, -0.0002351999282836914, -0.00017939507961273193, -0.00012359023094177246, -6.778538227081299e-05, -1.1980533599853516e-05, 4.382431507110596e-05, 9.962916374206543e-05, 0.0001554340124130249, 0.00021123886108398438, 0.00026704370975494385, 0.0003228485584259033, 0.0003786534070968628, 0.00043445825576782227, 0.0004902631044387817, 0.0005460679531097412, 0.0006018728017807007, 0.0006576776504516602, 0.0007134824991226196, 0.0007692873477935791, 0.0008250921964645386, 0.000880897045135498, 0.0009367018938064575, 0.000992506742477417, 0.0010483115911483765, 0.001104116439819336, 0.0011599212884902954, 0.0012157261371612549, 0.0012715309858322144, 0.0013273358345031738, 0.0013831406831741333, 0.0014389455318450928, 0.0014947503805160522, 0.0015505552291870117, 0.0016063600778579712, 0.0016621649265289307, 0.0017179697751998901, 0.0017737746238708496, 0.001829579472541809, 0.0018853843212127686, 0.001941189169883728, 0.0019969940185546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 7.0, 4.0, 12.0, 14.0, 13.0, 22.0, 28.0, 41.0, 42.0, 52.0, 84.0, 112.0, 161.0, 234.0, 353.0, 656.0, 25155.0, 1019249.0, 901.0, 418.0, 261.0, 206.0, 129.0, 113.0, 67.0, 62.0, 39.0, 30.0, 17.0, 14.0, 17.0, 10.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04010009765625, -0.03896045684814453, -0.03782081604003906, -0.036681175231933594, -0.035541534423828125, -0.034401893615722656, -0.03326225280761719, -0.03212261199951172, -0.03098297119140625, -0.02984333038330078, -0.028703689575195312, -0.027564048767089844, -0.026424407958984375, -0.025284767150878906, -0.024145126342773438, -0.02300548553466797, -0.0218658447265625, -0.02072620391845703, -0.019586563110351562, -0.018446922302246094, -0.017307281494140625, -0.016167640686035156, -0.015027999877929688, -0.013888359069824219, -0.01274871826171875, -0.011609077453613281, -0.010469436645507812, -0.009329795837402344, -0.008190155029296875, -0.007050514221191406, -0.0059108734130859375, -0.004771232604980469, -0.003631591796875, -0.0024919509887695312, -0.0013523101806640625, -0.00021266937255859375, 0.000926971435546875, 0.0020666122436523438, 0.0032062530517578125, 0.004345893859863281, 0.00548553466796875, 0.006625175476074219, 0.0077648162841796875, 0.008904457092285156, 0.010044097900390625, 0.011183738708496094, 0.012323379516601562, 0.013463020324707031, 0.0146026611328125, 0.01574230194091797, 0.016881942749023438, 0.018021583557128906, 0.019161224365234375, 0.020300865173339844, 0.021440505981445312, 0.02258014678955078, 0.02371978759765625, 0.02485942840576172, 0.025999069213867188, 0.027138710021972656, 0.028278350830078125, 0.029417991638183594, 0.030557632446289062, 0.03169727325439453, 0.0328369140625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 18.0, 610.0, 383.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008214879781007767, -0.008067880757153034, -0.007920882664620876, -0.007773883640766144, -0.007626885082572699, -0.007479886524379253, -0.007332887966185808, -0.007185889407992363, -0.0070388903841376305, -0.006891891825944185, -0.00674489326775074, -0.0065978942438960075, -0.006450895685702562, -0.006303897127509117, -0.006156898569315672, -0.006009900011122227, -0.0058629014529287815, -0.005715902894735336, -0.005568904336541891, -0.005421905312687159, -0.005274906754493713, -0.005127908196300268, -0.004980909638106823, -0.004833911079913378, -0.0046869125217199326, -0.004539913963526487, -0.004392915405333042, -0.00424591638147831, -0.004098917823284864, -0.003951919265091419, -0.003804920706897974, -0.003657922148704529, -0.0035109235905110836, -0.0033639250323176384, -0.0032169262412935495, -0.0030699276831001043, -0.0029229288920760155, -0.0027759303338825703, -0.002628931775689125, -0.00248193321749568, -0.0023349341936409473, -0.002187935635447502, -0.0020409368444234133, -0.001893938286229968, -0.001746939611621201, -0.001599940937012434, -0.0014529423788189888, -0.0013059437042102218, -0.0011589451460167766, -0.0010119464714080095, -0.0008649478550069034, -0.0007179492386057973, -0.0005709505639970303, -0.0004239518893882632, -0.0002769532729871571, -0.000129954656586051, 1.7044018022716045e-05, 0.00016404266352765262, 0.0003110413090325892, 0.0004580399545375258, 0.0006050386000424623, 0.0007520372746512294, 0.0008990358910523355, 0.0010460345074534416, 0.0011930331820622087]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 15.0, 6.0, 13.0, 14.0, 12.0, 9.0, 22.0, 23.0, 24.0, 26.0, 34.0, 37.0, 35.0, 45.0, 38.0, 35.0, 34.0, 39.0, 44.0, 37.0, 39.0, 39.0, 36.0, 33.0, 34.0, 36.0, 33.0, 22.0, 19.0, 18.0, 17.0, 15.0, 16.0, 12.0, 13.0, 16.0, 7.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007455945014953613, -0.0007216371595859528, -0.0006976798176765442, -0.0006737224757671356, -0.000649765133857727, -0.0006258077919483185, -0.0006018504500389099, -0.0005778931081295013, -0.0005539357662200928, -0.0005299784243106842, -0.0005060210824012756, -0.00048206374049186707, -0.0004581063985824585, -0.0004341490566730499, -0.00041019171476364136, -0.0003862343728542328, -0.0003622770309448242, -0.00033831968903541565, -0.0003143623471260071, -0.0002904050052165985, -0.00026644766330718994, -0.00024249032139778137, -0.0002185329794883728, -0.00019457563757896423, -0.00017061829566955566, -0.0001466609537601471, -0.00012270361185073853, -9.874626994132996e-05, -7.478892803192139e-05, -5.083158612251282e-05, -2.6874244213104248e-05, -2.9169023036956787e-06, 2.104043960571289e-05, 4.499778151512146e-05, 6.895512342453003e-05, 9.29124653339386e-05, 0.00011686980724334717, 0.00014082714915275574, 0.0001647844910621643, 0.00018874183297157288, 0.00021269917488098145, 0.00023665651679039001, 0.0002606138586997986, 0.00028457120060920715, 0.0003085285425186157, 0.0003324858844280243, 0.00035644322633743286, 0.00038040056824684143, 0.00040435791015625, 0.00042831525206565857, 0.00045227259397506714, 0.0004762299358844757, 0.0005001872777938843, 0.0005241446197032928, 0.0005481019616127014, 0.00057205930352211, 0.0005960166454315186, 0.0006199739873409271, 0.0006439313292503357, 0.0006678886711597443, 0.0006918460130691528, 0.0007158033549785614, 0.00073976069688797, 0.0007637180387973785, 0.0007876753807067871]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 10.0, 18.0, 13.0, 16.0, 20.0, 25.0, 24.0, 38.0, 34.0, 36.0, 62.0, 54.0, 55.0, 50.0, 47.0, 36.0, 59.0, 61.0, 44.0, 41.0, 42.0, 33.0, 33.0, 19.0, 21.0, 20.0, 20.0, 12.0, 7.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.03729248046875, -3.8792724609375, -3.72125244140625, -3.563232421875, -3.40521240234375, -3.2471923828125, -3.08917236328125, -2.93115234375, -2.77313232421875, -2.6151123046875, -2.45709228515625, -2.299072265625, -2.14105224609375, -1.9830322265625, -1.82501220703125, -1.6669921875, -1.50897216796875, -1.3509521484375, -1.19293212890625, -1.034912109375, -0.87689208984375, -0.7188720703125, -0.56085205078125, -0.40283203125, -0.24481201171875, -0.0867919921875, 0.07122802734375, 0.229248046875, 0.38726806640625, 0.5452880859375, 0.70330810546875, 0.861328125, 1.01934814453125, 1.1773681640625, 1.33538818359375, 1.493408203125, 1.65142822265625, 1.8094482421875, 1.96746826171875, 2.12548828125, 2.28350830078125, 2.4415283203125, 2.59954833984375, 2.757568359375, 2.91558837890625, 3.0736083984375, 3.23162841796875, 3.3896484375, 3.54766845703125, 3.7056884765625, 3.86370849609375, 4.021728515625, 4.17974853515625, 4.3377685546875, 4.49578857421875, 4.65380859375, 4.81182861328125, 4.9698486328125, 5.12786865234375, 5.285888671875, 5.44390869140625, 5.6019287109375, 5.75994873046875, 5.91796875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 6.0, 3.0, 7.0, 12.0, 4.0, 10.0, 16.0, 23.0, 31.0, 30.0, 47.0, 69.0, 113.0, 120.0, 165.0, 243.0, 294.0, 445.0, 604.0, 901.0, 1186.0, 1815.0, 2793.0, 4624.0, 8302.0, 18227.0, 81378.0, 784044.0, 100324.0, 19676.0, 8918.0, 4844.0, 2862.0, 1878.0, 1328.0, 895.0, 638.0, 453.0, 318.0, 219.0, 190.0, 128.0, 108.0, 73.0, 49.0, 42.0, 24.0, 24.0, 16.0, 9.0, 7.0, 9.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-20.515625, -19.865234375, -19.21484375, -18.564453125, -17.9140625, -17.263671875, -16.61328125, -15.962890625, -15.3125, -14.662109375, -14.01171875, -13.361328125, -12.7109375, -12.060546875, -11.41015625, -10.759765625, -10.109375, -9.458984375, -8.80859375, -8.158203125, -7.5078125, -6.857421875, -6.20703125, -5.556640625, -4.90625, -4.255859375, -3.60546875, -2.955078125, -2.3046875, -1.654296875, -1.00390625, -0.353515625, 0.296875, 0.947265625, 1.59765625, 2.248046875, 2.8984375, 3.548828125, 4.19921875, 4.849609375, 5.5, 6.150390625, 6.80078125, 7.451171875, 8.1015625, 8.751953125, 9.40234375, 10.052734375, 10.703125, 11.353515625, 12.00390625, 12.654296875, 13.3046875, 13.955078125, 14.60546875, 15.255859375, 15.90625, 16.556640625, 17.20703125, 17.857421875, 18.5078125, 19.158203125, 19.80859375, 20.458984375, 21.109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 8.0, 10.0, 10.0, 11.0, 16.0, 18.0, 17.0, 17.0, 26.0, 31.0, 36.0, 45.0, 30.0, 32.0, 41.0, 53.0, 91.0, 343.0, 1636.0, 163.0, 68.0, 49.0, 41.0, 33.0, 37.0, 37.0, 28.0, 21.0, 19.0, 23.0, 18.0, 9.0, 12.0, 11.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6796875, -15.221923828125, -14.76416015625, -14.306396484375, -13.8486328125, -13.390869140625, -12.93310546875, -12.475341796875, -12.017578125, -11.559814453125, -11.10205078125, -10.644287109375, -10.1865234375, -9.728759765625, -9.27099609375, -8.813232421875, -8.35546875, -7.897705078125, -7.43994140625, -6.982177734375, -6.5244140625, -6.066650390625, -5.60888671875, -5.151123046875, -4.693359375, -4.235595703125, -3.77783203125, -3.320068359375, -2.8623046875, -2.404541015625, -1.94677734375, -1.489013671875, -1.03125, -0.573486328125, -0.11572265625, 0.342041015625, 0.7998046875, 1.257568359375, 1.71533203125, 2.173095703125, 2.630859375, 3.088623046875, 3.54638671875, 4.004150390625, 4.4619140625, 4.919677734375, 5.37744140625, 5.835205078125, 6.29296875, 6.750732421875, 7.20849609375, 7.666259765625, 8.1240234375, 8.581787109375, 9.03955078125, 9.497314453125, 9.955078125, 10.412841796875, 10.87060546875, 11.328369140625, 11.7861328125, 12.243896484375, 12.70166015625, 13.159423828125, 13.6171875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 7.0, 11.0, 10.0, 15.0, 14.0, 19.0, 22.0, 21.0, 35.0, 47.0, 47.0, 49.0, 114.0, 233.0, 1158.0, 2380208.0, 761988.0, 999.0, 261.0, 109.0, 60.0, 39.0, 44.0, 34.0, 34.0, 21.0, 20.0, 12.0, 17.0, 15.0, 13.0, 12.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.15625, -61.04931640625, -58.9423828125, -56.83544921875, -54.728515625, -52.62158203125, -50.5146484375, -48.40771484375, -46.30078125, -44.19384765625, -42.0869140625, -39.97998046875, -37.873046875, -35.76611328125, -33.6591796875, -31.55224609375, -29.4453125, -27.33837890625, -25.2314453125, -23.12451171875, -21.017578125, -18.91064453125, -16.8037109375, -14.69677734375, -12.58984375, -10.48291015625, -8.3759765625, -6.26904296875, -4.162109375, -2.05517578125, 0.0517578125, 2.15869140625, 4.265625, 6.37255859375, 8.4794921875, 10.58642578125, 12.693359375, 14.80029296875, 16.9072265625, 19.01416015625, 21.12109375, 23.22802734375, 25.3349609375, 27.44189453125, 29.548828125, 31.65576171875, 33.7626953125, 35.86962890625, 37.9765625, 40.08349609375, 42.1904296875, 44.29736328125, 46.404296875, 48.51123046875, 50.6181640625, 52.72509765625, 54.83203125, 56.93896484375, 59.0458984375, 61.15283203125, 63.259765625, 65.36669921875, 67.4736328125, 69.58056640625, 71.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 360.0, 648.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-225.95680236816406, -221.44615173339844, -216.93551635742188, -212.42486572265625, -207.9142303466797, -203.40357971191406, -198.8929443359375, -194.38229370117188, -189.87164306640625, -185.36099243164062, -180.85035705566406, -176.33970642089844, -171.82907104492188, -167.31842041015625, -162.8077850341797, -158.29713439941406, -153.7864990234375, -149.27584838867188, -144.7652130126953, -140.2545623779297, -135.74392700195312, -131.2332763671875, -126.7226333618164, -122.21199035644531, -117.70134735107422, -113.19070434570312, -108.68006134033203, -104.16941833496094, -99.65876770019531, -95.14813232421875, -90.63748168945312, -86.12683868408203, -81.61618041992188, -77.10553741455078, -72.59489440917969, -68.0842514038086, -63.573604583740234, -59.06296157836914, -54.55231475830078, -50.04167175292969, -45.531028747558594, -41.0203857421875, -36.509742736816406, -31.999095916748047, -27.488452911376953, -22.97780990600586, -18.467164993286133, -13.956520080566406, -9.445877075195312, -4.935233116149902, -0.4245891571044922, 4.086054801940918, 8.596698760986328, 13.107341766357422, 17.61798667907715, 22.128631591796875, 26.63927459716797, 31.149917602539062, 35.660560607910156, 40.171207427978516, 44.68185043334961, 49.1924934387207, 53.70314025878906, 58.213783264160156, 62.72442626953125]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 5.0, 6.0, 3.0, 7.0, 5.0, 3.0, 12.0, 8.0, 19.0, 19.0, 27.0, 29.0, 30.0, 32.0, 36.0, 26.0, 35.0, 27.0, 46.0, 39.0, 40.0, 36.0, 49.0, 39.0, 36.0, 39.0, 38.0, 40.0, 28.0, 41.0, 26.0, 26.0, 17.0, 22.0, 20.0, 15.0, 12.0, 10.0, 7.0, 11.0, 11.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.54457092285156, -41.331809997558594, -40.11905288696289, -38.90629196166992, -37.69353103637695, -36.48077392578125, -35.26801300048828, -34.05525207519531, -32.842491149902344, -31.629732131958008, -30.41697120666504, -29.204212188720703, -27.991451263427734, -26.7786922454834, -25.565933227539062, -24.353172302246094, -23.14041519165039, -21.927656173706055, -20.714895248413086, -19.50213623046875, -18.28937530517578, -17.076616287231445, -15.86385726928711, -14.651097297668457, -13.438337326049805, -12.225577354431152, -11.0128173828125, -9.800058364868164, -8.587298393249512, -7.374538421630859, -6.161778926849365, -4.949019432067871, -3.736255645751953, -2.52349591255188, -1.3107361793518066, -0.0979764461517334, 1.1147832870483398, 2.327543258666992, 3.5403027534484863, 4.7530622482299805, 5.965822219848633, 7.178582191467285, 8.391342163085938, 9.604101181030273, 10.816861152648926, 12.029621124267578, 13.242380142211914, 14.455140113830566, 15.667900085449219, 16.880659103393555, 18.093420028686523, 19.30617904663086, 20.518939971923828, 21.731698989868164, 22.9444580078125, 24.15721893310547, 25.369977951049805, 26.58273696899414, 27.79549789428711, 29.008256912231445, 30.22101593017578, 31.43377685546875, 32.64653778076172, 33.85929489135742, 35.07205581665039]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 8.0, 13.0, 8.0, 14.0, 12.0, 16.0, 15.0, 29.0, 25.0, 33.0, 35.0, 37.0, 40.0, 65.0, 42.0, 45.0, 49.0, 57.0, 52.0, 42.0, 50.0, 47.0, 43.0, 34.0, 23.0, 37.0, 24.0, 23.0, 14.0, 19.0, 11.0, 8.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.2213134765625, -4.059814453125, -3.8983154296875, -3.73681640625, -3.5753173828125, -3.413818359375, -3.2523193359375, -3.0908203125, -2.9293212890625, -2.767822265625, -2.6063232421875, -2.44482421875, -2.2833251953125, -2.121826171875, -1.9603271484375, -1.798828125, -1.6373291015625, -1.475830078125, -1.3143310546875, -1.15283203125, -0.9913330078125, -0.829833984375, -0.6683349609375, -0.5068359375, -0.3453369140625, -0.183837890625, -0.0223388671875, 0.13916015625, 0.3006591796875, 0.462158203125, 0.6236572265625, 0.78515625, 0.9466552734375, 1.108154296875, 1.2696533203125, 1.43115234375, 1.5926513671875, 1.754150390625, 1.9156494140625, 2.0771484375, 2.2386474609375, 2.400146484375, 2.5616455078125, 2.72314453125, 2.8846435546875, 3.046142578125, 3.2076416015625, 3.369140625, 3.5306396484375, 3.692138671875, 3.8536376953125, 4.01513671875, 4.1766357421875, 4.338134765625, 4.4996337890625, 4.6611328125, 4.8226318359375, 4.984130859375, 5.1456298828125, 5.30712890625, 5.4686279296875, 5.630126953125, 5.7916259765625, 5.953125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 7.0, 9.0, 18.0, 16.0, 16.0, 35.0, 64.0, 62.0, 85.0, 103.0, 158.0, 276.0, 446.0, 760.0, 1307.0, 2500.0, 5521.0, 14235.0, 51918.0, 532794.0, 3236930.0, 287815.0, 37828.0, 11430.0, 4666.0, 2235.0, 1148.0, 649.0, 395.0, 258.0, 158.0, 122.0, 82.0, 58.0, 39.0, 39.0, 21.0, 22.0, 11.0, 9.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.421875, -20.7607421875, -20.099609375, -19.4384765625, -18.77734375, -18.1162109375, -17.455078125, -16.7939453125, -16.1328125, -15.4716796875, -14.810546875, -14.1494140625, -13.48828125, -12.8271484375, -12.166015625, -11.5048828125, -10.84375, -10.1826171875, -9.521484375, -8.8603515625, -8.19921875, -7.5380859375, -6.876953125, -6.2158203125, -5.5546875, -4.8935546875, -4.232421875, -3.5712890625, -2.91015625, -2.2490234375, -1.587890625, -0.9267578125, -0.265625, 0.3955078125, 1.056640625, 1.7177734375, 2.37890625, 3.0400390625, 3.701171875, 4.3623046875, 5.0234375, 5.6845703125, 6.345703125, 7.0068359375, 7.66796875, 8.3291015625, 8.990234375, 9.6513671875, 10.3125, 10.9736328125, 11.634765625, 12.2958984375, 12.95703125, 13.6181640625, 14.279296875, 14.9404296875, 15.6015625, 16.2626953125, 16.923828125, 17.5849609375, 18.24609375, 18.9072265625, 19.568359375, 20.2294921875, 20.890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 6.0, 15.0, 15.0, 25.0, 32.0, 45.0, 76.0, 115.0, 160.0, 229.0, 327.0, 466.0, 593.0, 601.0, 455.0, 289.0, 192.0, 148.0, 78.0, 61.0, 36.0, 32.0, 20.0, 17.0, 11.0, 15.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65625, -25.97021484375, -25.2841796875, -24.59814453125, -23.912109375, -23.22607421875, -22.5400390625, -21.85400390625, -21.16796875, -20.48193359375, -19.7958984375, -19.10986328125, -18.423828125, -17.73779296875, -17.0517578125, -16.36572265625, -15.6796875, -14.99365234375, -14.3076171875, -13.62158203125, -12.935546875, -12.24951171875, -11.5634765625, -10.87744140625, -10.19140625, -9.50537109375, -8.8193359375, -8.13330078125, -7.447265625, -6.76123046875, -6.0751953125, -5.38916015625, -4.703125, -4.01708984375, -3.3310546875, -2.64501953125, -1.958984375, -1.27294921875, -0.5869140625, 0.09912109375, 0.78515625, 1.47119140625, 2.1572265625, 2.84326171875, 3.529296875, 4.21533203125, 4.9013671875, 5.58740234375, 6.2734375, 6.95947265625, 7.6455078125, 8.33154296875, 9.017578125, 9.70361328125, 10.3896484375, 11.07568359375, 11.76171875, 12.44775390625, 13.1337890625, 13.81982421875, 14.505859375, 15.19189453125, 15.8779296875, 16.56396484375, 17.25]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 19.0, 32.0, 26.0, 59.0, 67.0, 107.0, 196.0, 440.0, 1759.0, 221504.0, 3961356.0, 7254.0, 685.0, 286.0, 162.0, 97.0, 85.0, 34.0, 31.0, 16.0, 17.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -62.2353515625, -59.158203125, -56.0810546875, -53.00390625, -49.9267578125, -46.849609375, -43.7724609375, -40.6953125, -37.6181640625, -34.541015625, -31.4638671875, -28.38671875, -25.3095703125, -22.232421875, -19.1552734375, -16.078125, -13.0009765625, -9.923828125, -6.8466796875, -3.76953125, -0.6923828125, 2.384765625, 5.4619140625, 8.5390625, 11.6162109375, 14.693359375, 17.7705078125, 20.84765625, 23.9248046875, 27.001953125, 30.0791015625, 33.15625, 36.2333984375, 39.310546875, 42.3876953125, 45.46484375, 48.5419921875, 51.619140625, 54.6962890625, 57.7734375, 60.8505859375, 63.927734375, 67.0048828125, 70.08203125, 73.1591796875, 76.236328125, 79.3134765625, 82.390625, 85.4677734375, 88.544921875, 91.6220703125, 94.69921875, 97.7763671875, 100.853515625, 103.9306640625, 107.0078125, 110.0849609375, 113.162109375, 116.2392578125, 119.31640625, 122.3935546875, 125.470703125, 128.5478515625, 131.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 31.0, 36.0, 69.0, 150.0, 188.0, 188.0, 161.0, 98.0, 46.0, 27.0, 9.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-108.53904724121094, -106.02537536621094, -103.5116958618164, -100.9980239868164, -98.48434448242188, -95.97067260742188, -93.45699310302734, -90.94332122802734, -88.42964172363281, -85.91596984863281, -83.40229034423828, -80.88861846923828, -78.37493896484375, -75.86126708984375, -73.34758758544922, -70.83391571044922, -68.32024383544922, -65.80657196044922, -63.29289245605469, -60.77921676635742, -58.265541076660156, -55.751869201660156, -53.23819351196289, -50.724517822265625, -48.21084213256836, -45.697166442871094, -43.18349075317383, -40.66981506347656, -38.15614318847656, -35.64246368408203, -33.12879180908203, -30.615116119384766, -28.10143280029297, -25.587757110595703, -23.074081420898438, -20.560407638549805, -18.04673194885254, -15.533056259155273, -13.019381523132324, -10.505706787109375, -7.992031097412109, -5.478355884552002, -2.9646806716918945, -0.4510054588317871, 2.0626697540283203, 4.576345443725586, 7.090020179748535, 9.603694915771484, 12.11737060546875, 14.631046295166016, 17.14472198486328, 19.658395767211914, 22.17207145690918, 24.685747146606445, 27.199420928955078, 29.713096618652344, 32.22677230834961, 34.740447998046875, 37.25412368774414, 39.767799377441406, 42.281471252441406, 44.79515075683594, 47.30882263183594, 49.8224983215332, 52.33617401123047]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 14.0, 9.0, 22.0, 16.0, 10.0, 25.0, 27.0, 23.0, 36.0, 29.0, 43.0, 36.0, 42.0, 45.0, 34.0, 45.0, 41.0, 44.0, 37.0, 45.0, 36.0, 46.0, 31.0, 35.0, 31.0, 31.0, 22.0, 19.0, 15.0, 15.0, 20.0, 10.0, 10.0, 5.0, 4.0, 9.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-61.119720458984375, -59.25748825073242, -57.395259857177734, -55.53302764892578, -53.670799255371094, -51.80856704711914, -49.94633483886719, -48.0841064453125, -46.22187805175781, -44.35964584350586, -42.49741744995117, -40.63518524169922, -38.77295684814453, -36.91072463989258, -35.048492431640625, -33.18626403808594, -31.324031829833984, -29.461801528930664, -27.599571228027344, -25.73733901977539, -23.875110626220703, -22.01287841796875, -20.15064811706543, -18.28841781616211, -16.42618751525879, -14.563957214355469, -12.701726913452148, -10.839495658874512, -8.977265357971191, -7.115035057067871, -5.252803802490234, -3.390573501586914, -1.5283432006835938, 0.33388733863830566, 2.196117877960205, 4.058348655700684, 5.920578956604004, 7.782809257507324, 9.645040512084961, 11.507270812988281, 13.369501113891602, 15.231731414794922, 17.093961715698242, 18.956192016601562, 20.818424224853516, 22.680652618408203, 24.542884826660156, 26.405115127563477, 28.267345428466797, 30.129575729370117, 31.991806030273438, 33.85403823852539, 35.71626663208008, 37.57849884033203, 39.44072723388672, 41.30295944213867, 43.165191650390625, 45.02742385864258, 46.889652252197266, 48.75188446044922, 50.614112854003906, 52.47634506225586, 54.33857727050781, 56.2008056640625, 58.06303405761719]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 17.0, 10.0, 15.0, 20.0, 28.0, 30.0, 27.0, 27.0, 46.0, 46.0, 49.0, 49.0, 47.0, 52.0, 64.0, 44.0, 50.0, 59.0, 44.0, 43.0, 35.0, 32.0, 33.0, 28.0, 21.0, 17.0, 15.0, 15.0, 6.0, 5.0, 11.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.3717041015625, -4.192626953125, -4.0135498046875, -3.83447265625, -3.6553955078125, -3.476318359375, -3.2972412109375, -3.1181640625, -2.9390869140625, -2.760009765625, -2.5809326171875, -2.40185546875, -2.2227783203125, -2.043701171875, -1.8646240234375, -1.685546875, -1.5064697265625, -1.327392578125, -1.1483154296875, -0.96923828125, -0.7901611328125, -0.611083984375, -0.4320068359375, -0.2529296875, -0.0738525390625, 0.105224609375, 0.2843017578125, 0.46337890625, 0.6424560546875, 0.821533203125, 1.0006103515625, 1.1796875, 1.3587646484375, 1.537841796875, 1.7169189453125, 1.89599609375, 2.0750732421875, 2.254150390625, 2.4332275390625, 2.6123046875, 2.7913818359375, 2.970458984375, 3.1495361328125, 3.32861328125, 3.5076904296875, 3.686767578125, 3.8658447265625, 4.044921875, 4.2239990234375, 4.403076171875, 4.5821533203125, 4.76123046875, 4.9403076171875, 5.119384765625, 5.2984619140625, 5.4775390625, 5.6566162109375, 5.835693359375, 6.0147705078125, 6.19384765625, 6.3729248046875, 6.552001953125, 6.7310791015625, 6.91015625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 12.0, 19.0, 25.0, 40.0, 53.0, 92.0, 123.0, 197.0, 291.0, 404.0, 611.0, 1005.0, 1421.0, 2100.0, 3203.0, 4584.0, 7100.0, 10726.0, 16314.0, 24382.0, 37641.0, 59341.0, 99184.0, 189008.0, 244981.0, 134869.0, 74973.0, 46511.0, 30332.0, 19974.0, 13270.0, 8488.0, 5606.0, 3793.0, 2575.0, 1769.0, 1150.0, 805.0, 510.0, 369.0, 230.0, 180.0, 104.0, 66.0, 47.0, 23.0, 15.0, 12.0, 11.0, 9.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6250152587890625, -0.605010986328125, -0.5850067138671875, -0.56500244140625, -0.5449981689453125, -0.524993896484375, -0.5049896240234375, -0.4849853515625, -0.4649810791015625, -0.444976806640625, -0.4249725341796875, -0.40496826171875, -0.3849639892578125, -0.364959716796875, -0.3449554443359375, -0.324951171875, -0.3049468994140625, -0.284942626953125, -0.2649383544921875, -0.24493408203125, -0.2249298095703125, -0.204925537109375, -0.1849212646484375, -0.1649169921875, -0.1449127197265625, -0.124908447265625, -0.1049041748046875, -0.08489990234375, -0.0648956298828125, -0.044891357421875, -0.0248870849609375, -0.0048828125, 0.0151214599609375, 0.035125732421875, 0.0551300048828125, 0.07513427734375, 0.0951385498046875, 0.115142822265625, 0.1351470947265625, 0.1551513671875, 0.1751556396484375, 0.195159912109375, 0.2151641845703125, 0.23516845703125, 0.2551727294921875, 0.275177001953125, 0.2951812744140625, 0.315185546875, 0.3351898193359375, 0.355194091796875, 0.3751983642578125, 0.39520263671875, 0.4152069091796875, 0.435211181640625, 0.4552154541015625, 0.4752197265625, 0.4952239990234375, 0.515228271484375, 0.5352325439453125, 0.55523681640625, 0.5752410888671875, 0.595245361328125, 0.6152496337890625, 0.63525390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 2.0, 6.0, 11.0, 14.0, 7.0, 13.0, 23.0, 25.0, 12.0, 27.0, 25.0, 28.0, 35.0, 30.0, 35.0, 47.0, 49.0, 44.0, 1071.0, 38.0, 42.0, 41.0, 38.0, 37.0, 48.0, 45.0, 36.0, 29.0, 22.0, 24.0, 24.0, 16.0, 13.0, 17.0, 15.0, 9.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.7645263671875, -2.665771484375, -2.5670166015625, -2.46826171875, -2.3695068359375, -2.270751953125, -2.1719970703125, -2.0732421875, -1.9744873046875, -1.875732421875, -1.7769775390625, -1.67822265625, -1.5794677734375, -1.480712890625, -1.3819580078125, -1.283203125, -1.1844482421875, -1.085693359375, -0.9869384765625, -0.88818359375, -0.7894287109375, -0.690673828125, -0.5919189453125, -0.4931640625, -0.3944091796875, -0.295654296875, -0.1968994140625, -0.09814453125, 0.0006103515625, 0.099365234375, 0.1981201171875, 0.296875, 0.3956298828125, 0.494384765625, 0.5931396484375, 0.69189453125, 0.7906494140625, 0.889404296875, 0.9881591796875, 1.0869140625, 1.1856689453125, 1.284423828125, 1.3831787109375, 1.48193359375, 1.5806884765625, 1.679443359375, 1.7781982421875, 1.876953125, 1.9757080078125, 2.074462890625, 2.1732177734375, 2.27197265625, 2.3707275390625, 2.469482421875, 2.5682373046875, 2.6669921875, 2.7657470703125, 2.864501953125, 2.9632568359375, 3.06201171875, 3.1607666015625, 3.259521484375, 3.3582763671875, 3.45703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 10.0, 12.0, 22.0, 25.0, 57.0, 75.0, 83.0, 173.0, 218.0, 320.0, 497.0, 742.0, 1057.0, 1553.0, 2387.0, 3498.0, 5372.0, 8524.0, 13331.0, 21903.0, 35762.0, 60741.0, 109742.0, 204946.0, 1291006.0, 142387.0, 75721.0, 44189.0, 26412.0, 16570.0, 10269.0, 6639.0, 4273.0, 2852.0, 1882.0, 1217.0, 847.0, 590.0, 404.0, 255.0, 189.0, 118.0, 82.0, 64.0, 42.0, 16.0, 16.0, 12.0, 4.0, 12.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-0.52978515625, -0.5128097534179688, -0.4958343505859375, -0.47885894775390625, -0.461883544921875, -0.44490814208984375, -0.4279327392578125, -0.41095733642578125, -0.39398193359375, -0.37700653076171875, -0.3600311279296875, -0.34305572509765625, -0.326080322265625, -0.30910491943359375, -0.2921295166015625, -0.27515411376953125, -0.2581787109375, -0.24120330810546875, -0.2242279052734375, -0.20725250244140625, -0.190277099609375, -0.17330169677734375, -0.1563262939453125, -0.13935089111328125, -0.12237548828125, -0.10540008544921875, -0.0884246826171875, -0.07144927978515625, -0.054473876953125, -0.03749847412109375, -0.0205230712890625, -0.00354766845703125, 0.013427734375, 0.03040313720703125, 0.0473785400390625, 0.06435394287109375, 0.081329345703125, 0.09830474853515625, 0.1152801513671875, 0.13225555419921875, 0.14923095703125, 0.16620635986328125, 0.1831817626953125, 0.20015716552734375, 0.217132568359375, 0.23410797119140625, 0.2510833740234375, 0.26805877685546875, 0.2850341796875, 0.30200958251953125, 0.3189849853515625, 0.33596038818359375, 0.352935791015625, 0.36991119384765625, 0.3868865966796875, 0.40386199951171875, 0.42083740234375, 0.43781280517578125, 0.4547882080078125, 0.47176361083984375, 0.488739013671875, 0.5057144165039062, 0.5226898193359375, 0.5396652221679688, 0.556640625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 8.0, 12.0, 19.0, 20.0, 24.0, 29.0, 40.0, 63.0, 85.0, 107.0, 98.0, 100.0, 78.0, 78.0, 54.0, 45.0, 34.0, 24.0, 20.0, 9.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0031032562255859375, -0.003019392490386963, -0.0029355287551879883, -0.0028516650199890137, -0.002767801284790039, -0.0026839375495910645, -0.00260007381439209, -0.0025162100791931152, -0.0024323463439941406, -0.002348482608795166, -0.0022646188735961914, -0.002180755138397217, -0.002096891403198242, -0.0020130276679992676, -0.001929163932800293, -0.0018453001976013184, -0.0017614364624023438, -0.0016775727272033691, -0.0015937089920043945, -0.00150984525680542, -0.0014259815216064453, -0.0013421177864074707, -0.001258254051208496, -0.0011743903160095215, -0.0010905265808105469, -0.0010066628456115723, -0.0009227991104125977, -0.000838935375213623, -0.0007550716400146484, -0.0006712079048156738, -0.0005873441696166992, -0.0005034804344177246, -0.00041961669921875, -0.0003357529640197754, -0.0002518892288208008, -0.00016802549362182617, -8.416175842285156e-05, -2.980232238769531e-07, 8.356571197509766e-05, 0.00016742944717407227, 0.0002512931823730469, 0.0003351569175720215, 0.0004190206527709961, 0.0005028843879699707, 0.0005867481231689453, 0.0006706118583679199, 0.0007544755935668945, 0.0008383393287658691, 0.0009222030639648438, 0.0010060667991638184, 0.001089930534362793, 0.0011737942695617676, 0.0012576580047607422, 0.0013415217399597168, 0.0014253854751586914, 0.001509249210357666, 0.0015931129455566406, 0.0016769766807556152, 0.0017608404159545898, 0.0018447041511535645, 0.001928567886352539, 0.0020124316215515137, 0.0020962953567504883, 0.002180159091949463, 0.0022640228271484375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 6.0, 10.0, 18.0, 14.0, 36.0, 92.0, 122.0, 222.0, 515.0, 14835.0, 1031260.0, 748.0, 269.0, 159.0, 85.0, 52.0, 25.0, 25.0, 11.0, 11.0, 10.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0589599609375, -0.05679035186767578, -0.05462074279785156, -0.052451133728027344, -0.050281524658203125, -0.048111915588378906, -0.04594230651855469, -0.04377269744873047, -0.04160308837890625, -0.03943347930908203, -0.03726387023925781, -0.035094261169433594, -0.032924652099609375, -0.030755043029785156, -0.028585433959960938, -0.02641582489013672, -0.0242462158203125, -0.02207660675048828, -0.019906997680664062, -0.017737388610839844, -0.015567779541015625, -0.013398170471191406, -0.011228561401367188, -0.009058952331542969, -0.00688934326171875, -0.004719734191894531, -0.0025501251220703125, -0.00038051605224609375, 0.001789093017578125, 0.003958702087402344, 0.0061283111572265625, 0.008297920227050781, 0.010467529296875, 0.012637138366699219, 0.014806747436523438, 0.016976356506347656, 0.019145965576171875, 0.021315574645996094, 0.023485183715820312, 0.02565479278564453, 0.02782440185546875, 0.02999401092529297, 0.03216361999511719, 0.034333229064941406, 0.036502838134765625, 0.038672447204589844, 0.04084205627441406, 0.04301166534423828, 0.0451812744140625, 0.04735088348388672, 0.04952049255371094, 0.051690101623535156, 0.053859710693359375, 0.056029319763183594, 0.05819892883300781, 0.06036853790283203, 0.06253814697265625, 0.06470775604248047, 0.06687736511230469, 0.0690469741821289, 0.07121658325195312, 0.07338619232177734, 0.07555580139160156, 0.07772541046142578, 0.07989501953125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 751.0, 259.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004929606337100267, -0.004597438033670187, -0.004265269264578819, -0.003933100961148739, -0.0036009326577186584, -0.003268764354288578, -0.002936595818027854, -0.00260442728176713, -0.0022722589783370495, -0.0019400905584916472, -0.001607922138646245, -0.0012757537188008428, -0.0009435852989554405, -0.0006114168791100383, -0.00027924845926463604, 5.292007699608803e-05, 0.00038508838042616844, 0.0007172568002715707, 0.001049425220116973, 0.0013815936399623752, 0.0017137620598077774, 0.002045930363237858, 0.002378098899498582, 0.002710267435759306, 0.0030424357391893864, 0.0033746040426194668, 0.003706772578880191, 0.004038941115140915, 0.004371109418570995, 0.004703277722001076, 0.005035446025431156, 0.005367614794522524, 0.005699783563613892, 0.006031951867043972, 0.006364120170474052, 0.00669628893956542, 0.0070284572429955006, 0.007360625546425581, 0.007692794315516949, 0.008024962618947029, 0.00835713092237711, 0.00868929922580719, 0.00902146752923727, 0.00935363583266735, 0.009685805067420006, 0.010017973370850086, 0.010350141674280167, 0.010682309977710247, 0.011014478281140327, 0.011346646584570408, 0.011678814888000488, 0.012010983191430569, 0.012343151494860649, 0.012675320729613304, 0.013007489033043385, 0.013339657336473465, 0.013671825639903545, 0.014003993943333626, 0.014336162246763706, 0.014668330550193787, 0.015000499784946442, 0.015332668088376522, 0.015664836391806602, 0.01599700376391411, 0.016329172998666763]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 13.0, 22.0, 16.0, 14.0, 32.0, 23.0, 34.0, 20.0, 36.0, 34.0, 43.0, 27.0, 38.0, 48.0, 37.0, 33.0, 37.0, 41.0, 48.0, 39.0, 47.0, 38.0, 33.0, 32.0, 22.0, 18.0, 24.0, 15.0, 21.0, 15.0, 11.0, 9.0, 11.0, 8.0, 6.0, 8.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008952021598815918, -0.000864262692630291, -0.0008333232253789902, -0.0008023837581276894, -0.0007714442908763885, -0.0007405048236250877, -0.0007095653563737869, -0.0006786258891224861, -0.0006476864218711853, -0.0006167469546198845, -0.0005858074873685837, -0.0005548680201172829, -0.0005239285528659821, -0.0004929890856146812, -0.00046204961836338043, -0.0004311101511120796, -0.0004001706838607788, -0.000369231216609478, -0.0003382917493581772, -0.0003073522821068764, -0.00027641281485557556, -0.00024547334760427475, -0.00021453388035297394, -0.00018359441310167313, -0.00015265494585037231, -0.0001217154785990715, -9.077601134777069e-05, -5.983654409646988e-05, -2.8897076845169067e-05, 2.0423904061317444e-06, 3.2981857657432556e-05, 6.392132490873337e-05, 9.486079216003418e-05, 0.000125800259411335, 0.0001567397266626358, 0.00018767919391393661, 0.00021861866116523743, 0.00024955812841653824, 0.00028049759566783905, 0.00031143706291913986, 0.0003423765301704407, 0.0003733159974217415, 0.0004042554646730423, 0.0004351949319243431, 0.0004661343991756439, 0.0004970738664269447, 0.0005280133336782455, 0.0005589528009295464, 0.0005898922681808472, 0.000620831735432148, 0.0006517712026834488, 0.0006827106699347496, 0.0007136501371860504, 0.0007445896044373512, 0.000775529071688652, 0.0008064685389399529, 0.0008374080061912537, 0.0008683474734425545, 0.0008992869406938553, 0.0009302264079451561, 0.0009611658751964569, 0.0009921053424477577, 0.0010230448096990585, 0.0010539842769503593, 0.0010849237442016602]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 17.0, 10.0, 15.0, 20.0, 28.0, 30.0, 27.0, 27.0, 46.0, 46.0, 49.0, 49.0, 47.0, 52.0, 64.0, 44.0, 50.0, 59.0, 44.0, 43.0, 35.0, 33.0, 32.0, 28.0, 21.0, 17.0, 15.0, 15.0, 6.0, 5.0, 11.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.3717041015625, -4.192626953125, -4.0135498046875, -3.83447265625, -3.6553955078125, -3.476318359375, -3.2972412109375, -3.1181640625, -2.9390869140625, -2.760009765625, -2.5809326171875, -2.40185546875, -2.2227783203125, -2.043701171875, -1.8646240234375, -1.685546875, -1.5064697265625, -1.327392578125, -1.1483154296875, -0.96923828125, -0.7901611328125, -0.611083984375, -0.4320068359375, -0.2529296875, -0.0738525390625, 0.105224609375, 0.2843017578125, 0.46337890625, 0.6424560546875, 0.821533203125, 1.0006103515625, 1.1796875, 1.3587646484375, 1.537841796875, 1.7169189453125, 1.89599609375, 2.0750732421875, 2.254150390625, 2.4332275390625, 2.6123046875, 2.7913818359375, 2.970458984375, 3.1495361328125, 3.32861328125, 3.5076904296875, 3.686767578125, 3.8658447265625, 4.044921875, 4.2239990234375, 4.403076171875, 4.5821533203125, 4.76123046875, 4.9403076171875, 5.119384765625, 5.2984619140625, 5.4775390625, 5.6566162109375, 5.835693359375, 6.0147705078125, 6.19384765625, 6.3729248046875, 6.552001953125, 6.7310791015625, 6.91015625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 10.0, 13.0, 42.0, 37.0, 58.0, 90.0, 142.0, 240.0, 341.0, 618.0, 1182.0, 2902.0, 9064.0, 38158.0, 227534.0, 616703.0, 118428.0, 22690.0, 6034.0, 2024.0, 918.0, 499.0, 281.0, 186.0, 122.0, 70.0, 70.0, 29.0, 19.0, 21.0, 7.0, 8.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.6246337890625, -5.432861328125, -5.2410888671875, -5.04931640625, -4.8575439453125, -4.665771484375, -4.4739990234375, -4.2822265625, -4.0904541015625, -3.898681640625, -3.7069091796875, -3.51513671875, -3.3233642578125, -3.131591796875, -2.9398193359375, -2.748046875, -2.5562744140625, -2.364501953125, -2.1727294921875, -1.98095703125, -1.7891845703125, -1.597412109375, -1.4056396484375, -1.2138671875, -1.0220947265625, -0.830322265625, -0.6385498046875, -0.44677734375, -0.2550048828125, -0.063232421875, 0.1285400390625, 0.3203125, 0.5120849609375, 0.703857421875, 0.8956298828125, 1.08740234375, 1.2791748046875, 1.470947265625, 1.6627197265625, 1.8544921875, 2.0462646484375, 2.238037109375, 2.4298095703125, 2.62158203125, 2.8133544921875, 3.005126953125, 3.1968994140625, 3.388671875, 3.5804443359375, 3.772216796875, 3.9639892578125, 4.15576171875, 4.3475341796875, 4.539306640625, 4.7310791015625, 4.9228515625, 5.1146240234375, 5.306396484375, 5.4981689453125, 5.68994140625, 5.8817138671875, 6.073486328125, 6.2652587890625, 6.45703125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 4.0, 14.0, 9.0, 15.0, 20.0, 24.0, 22.0, 26.0, 29.0, 43.0, 43.0, 47.0, 45.0, 50.0, 76.0, 1677.0, 452.0, 62.0, 52.0, 50.0, 36.0, 47.0, 33.0, 33.0, 30.0, 25.0, 18.0, 20.0, 20.0, 8.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.359375, -17.745849609375, -17.13232421875, -16.518798828125, -15.9052734375, -15.291748046875, -14.67822265625, -14.064697265625, -13.451171875, -12.837646484375, -12.22412109375, -11.610595703125, -10.9970703125, -10.383544921875, -9.77001953125, -9.156494140625, -8.54296875, -7.929443359375, -7.31591796875, -6.702392578125, -6.0888671875, -5.475341796875, -4.86181640625, -4.248291015625, -3.634765625, -3.021240234375, -2.40771484375, -1.794189453125, -1.1806640625, -0.567138671875, 0.04638671875, 0.659912109375, 1.2734375, 1.886962890625, 2.50048828125, 3.114013671875, 3.7275390625, 4.341064453125, 4.95458984375, 5.568115234375, 6.181640625, 6.795166015625, 7.40869140625, 8.022216796875, 8.6357421875, 9.249267578125, 9.86279296875, 10.476318359375, 11.08984375, 11.703369140625, 12.31689453125, 12.930419921875, 13.5439453125, 14.157470703125, 14.77099609375, 15.384521484375, 15.998046875, 16.611572265625, 17.22509765625, 17.838623046875, 18.4521484375, 19.065673828125, 19.67919921875, 20.292724609375, 20.90625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 6.0, 24.0, 18.0, 14.0, 24.0, 21.0, 41.0, 38.0, 56.0, 86.0, 111.0, 233.0, 756.0, 24542.0, 3116530.0, 2161.0, 443.0, 164.0, 120.0, 71.0, 44.0, 43.0, 24.0, 32.0, 17.0, 27.0, 12.0, 12.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.84375, -47.4189453125, -45.994140625, -44.5693359375, -43.14453125, -41.7197265625, -40.294921875, -38.8701171875, -37.4453125, -36.0205078125, -34.595703125, -33.1708984375, -31.74609375, -30.3212890625, -28.896484375, -27.4716796875, -26.046875, -24.6220703125, -23.197265625, -21.7724609375, -20.34765625, -18.9228515625, -17.498046875, -16.0732421875, -14.6484375, -13.2236328125, -11.798828125, -10.3740234375, -8.94921875, -7.5244140625, -6.099609375, -4.6748046875, -3.25, -1.8251953125, -0.400390625, 1.0244140625, 2.44921875, 3.8740234375, 5.298828125, 6.7236328125, 8.1484375, 9.5732421875, 10.998046875, 12.4228515625, 13.84765625, 15.2724609375, 16.697265625, 18.1220703125, 19.546875, 20.9716796875, 22.396484375, 23.8212890625, 25.24609375, 26.6708984375, 28.095703125, 29.5205078125, 30.9453125, 32.3701171875, 33.794921875, 35.2197265625, 36.64453125, 38.0693359375, 39.494140625, 40.9189453125, 42.34375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 10.0, 34.0, 140.0, 359.0, 319.0, 129.0, 20.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.795841217041016, -43.94947052001953, -43.10310363769531, -42.25673294067383, -41.41036605834961, -40.563995361328125, -39.717628479003906, -38.87125778198242, -38.02488708496094, -37.17851638793945, -36.332149505615234, -35.48577880859375, -34.63941192626953, -33.79304122924805, -32.94667053222656, -32.100303649902344, -31.253936767578125, -30.407567977905273, -29.561199188232422, -28.714828491210938, -27.868459701538086, -27.022090911865234, -26.175722122192383, -25.32935333251953, -24.482982635498047, -23.636613845825195, -22.790245056152344, -21.94387435913086, -21.097505569458008, -20.251136779785156, -19.404767990112305, -18.558399200439453, -17.7120304107666, -16.86566162109375, -16.0192928314209, -15.17292308807373, -14.326554298400879, -13.480184555053711, -12.63381576538086, -11.787446975708008, -10.941078186035156, -10.094709396362305, -9.248339653015137, -8.401970863342285, -7.555602073669434, -6.709232807159424, -5.862863540649414, -5.0164947509765625, -4.1701250076293945, -3.323755979537964, -2.477386951446533, -1.6310176849365234, -0.7846486568450928, 0.06172037124633789, 0.9080896377563477, 1.7544584274291992, 2.600827693939209, 3.4471967220306396, 4.29356575012207, 5.13993501663208, 5.98630428314209, 6.832673072814941, 7.679042339324951, 8.525411605834961, 9.371780395507812]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 10.0, 10.0, 13.0, 15.0, 18.0, 25.0, 29.0, 20.0, 23.0, 28.0, 20.0, 22.0, 40.0, 43.0, 39.0, 41.0, 49.0, 34.0, 31.0, 40.0, 47.0, 36.0, 38.0, 31.0, 28.0, 31.0, 34.0, 24.0, 29.0, 25.0, 19.0, 19.0, 15.0, 17.0, 5.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.77581024169922, -46.37089920043945, -44.96598815917969, -43.561073303222656, -42.15616226196289, -40.751251220703125, -39.34634017944336, -37.941429138183594, -36.53651809692383, -35.13160705566406, -33.7266960144043, -32.32178497314453, -30.916872024536133, -29.511959075927734, -28.10704803466797, -26.702136993408203, -25.297224044799805, -23.89231300354004, -22.48740005493164, -21.082489013671875, -19.67757797241211, -18.272666931152344, -16.867753982543945, -15.46284294128418, -14.057930946350098, -12.653018951416016, -11.24810791015625, -9.843195915222168, -8.438283920288086, -7.03337287902832, -5.628460884094238, -4.223549842834473, -2.8186378479003906, -1.4137262105941772, -0.008814573287963867, 1.396097183227539, 2.801008701324463, 4.205920219421387, 5.610832214355469, 7.015743255615234, 8.420655250549316, 9.825567245483398, 11.230478286743164, 12.635390281677246, 14.040302276611328, 15.445213317871094, 16.85012435913086, 18.255035400390625, 19.659948348999023, 21.06485939025879, 22.469772338867188, 23.874683380126953, 25.27959442138672, 26.684505462646484, 28.089418411254883, 29.49432945251465, 30.899242401123047, 32.30415344238281, 33.70906448364258, 35.113975524902344, 36.518890380859375, 37.92380142211914, 39.328712463378906, 40.73362350463867, 42.13853454589844]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 18.0, 13.0, 16.0, 24.0, 34.0, 24.0, 34.0, 29.0, 42.0, 53.0, 52.0, 50.0, 57.0, 55.0, 52.0, 50.0, 52.0, 56.0, 46.0, 42.0, 20.0, 35.0, 29.0, 25.0, 17.0, 15.0, 15.0, 7.0, 7.0, 13.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.5914306640625, -4.405517578125, -4.2196044921875, -4.03369140625, -3.8477783203125, -3.661865234375, -3.4759521484375, -3.2900390625, -3.1041259765625, -2.918212890625, -2.7322998046875, -2.54638671875, -2.3604736328125, -2.174560546875, -1.9886474609375, -1.802734375, -1.6168212890625, -1.430908203125, -1.2449951171875, -1.05908203125, -0.8731689453125, -0.687255859375, -0.5013427734375, -0.3154296875, -0.1295166015625, 0.056396484375, 0.2423095703125, 0.42822265625, 0.6141357421875, 0.800048828125, 0.9859619140625, 1.171875, 1.3577880859375, 1.543701171875, 1.7296142578125, 1.91552734375, 2.1014404296875, 2.287353515625, 2.4732666015625, 2.6591796875, 2.8450927734375, 3.031005859375, 3.2169189453125, 3.40283203125, 3.5887451171875, 3.774658203125, 3.9605712890625, 4.146484375, 4.3323974609375, 4.518310546875, 4.7042236328125, 4.89013671875, 5.0760498046875, 5.261962890625, 5.4478759765625, 5.6337890625, 5.8197021484375, 6.005615234375, 6.1915283203125, 6.37744140625, 6.5633544921875, 6.749267578125, 6.9351806640625, 7.12109375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 10.0, 8.0, 15.0, 16.0, 16.0, 37.0, 41.0, 54.0, 60.0, 86.0, 134.0, 187.0, 391.0, 1109.0, 5878.0, 49594.0, 983174.0, 2953329.0, 180793.0, 15546.0, 2336.0, 601.0, 281.0, 151.0, 88.0, 66.0, 61.0, 43.0, 41.0, 29.0, 24.0, 25.0, 14.0, 8.0, 4.0, 9.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.307373046875, -14.72412109375, -14.140869140625, -13.5576171875, -12.974365234375, -12.39111328125, -11.807861328125, -11.224609375, -10.641357421875, -10.05810546875, -9.474853515625, -8.8916015625, -8.308349609375, -7.72509765625, -7.141845703125, -6.55859375, -5.975341796875, -5.39208984375, -4.808837890625, -4.2255859375, -3.642333984375, -3.05908203125, -2.475830078125, -1.892578125, -1.309326171875, -0.72607421875, -0.142822265625, 0.4404296875, 1.023681640625, 1.60693359375, 2.190185546875, 2.7734375, 3.356689453125, 3.93994140625, 4.523193359375, 5.1064453125, 5.689697265625, 6.27294921875, 6.856201171875, 7.439453125, 8.022705078125, 8.60595703125, 9.189208984375, 9.7724609375, 10.355712890625, 10.93896484375, 11.522216796875, 12.10546875, 12.688720703125, 13.27197265625, 13.855224609375, 14.4384765625, 15.021728515625, 15.60498046875, 16.188232421875, 16.771484375, 17.354736328125, 17.93798828125, 18.521240234375, 19.1044921875, 19.687744140625, 20.27099609375, 20.854248046875, 21.4375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 18.0, 16.0, 49.0, 51.0, 81.0, 99.0, 140.0, 238.0, 338.0, 456.0, 582.0, 571.0, 428.0, 314.0, 215.0, 141.0, 119.0, 64.0, 43.0, 27.0, 25.0, 17.0, 8.0, 10.0, 1.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.740966796875, -19.12255859375, -18.504150390625, -17.8857421875, -17.267333984375, -16.64892578125, -16.030517578125, -15.412109375, -14.793701171875, -14.17529296875, -13.556884765625, -12.9384765625, -12.320068359375, -11.70166015625, -11.083251953125, -10.46484375, -9.846435546875, -9.22802734375, -8.609619140625, -7.9912109375, -7.372802734375, -6.75439453125, -6.135986328125, -5.517578125, -4.899169921875, -4.28076171875, -3.662353515625, -3.0439453125, -2.425537109375, -1.80712890625, -1.188720703125, -0.5703125, 0.048095703125, 0.66650390625, 1.284912109375, 1.9033203125, 2.521728515625, 3.14013671875, 3.758544921875, 4.376953125, 4.995361328125, 5.61376953125, 6.232177734375, 6.8505859375, 7.468994140625, 8.08740234375, 8.705810546875, 9.32421875, 9.942626953125, 10.56103515625, 11.179443359375, 11.7978515625, 12.416259765625, 13.03466796875, 13.653076171875, 14.271484375, 14.889892578125, 15.50830078125, 16.126708984375, 16.7451171875, 17.363525390625, 17.98193359375, 18.600341796875, 19.21875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 9.0, 3.0, 11.0, 17.0, 28.0, 33.0, 60.0, 93.0, 99.0, 198.0, 386.0, 1267.0, 19728.0, 2883027.0, 1276009.0, 11421.0, 1047.0, 349.0, 179.0, 115.0, 57.0, 48.0, 23.0, 31.0, 14.0, 4.0, 9.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.25, -42.400390625, -40.55078125, -38.701171875, -36.8515625, -35.001953125, -33.15234375, -31.302734375, -29.453125, -27.603515625, -25.75390625, -23.904296875, -22.0546875, -20.205078125, -18.35546875, -16.505859375, -14.65625, -12.806640625, -10.95703125, -9.107421875, -7.2578125, -5.408203125, -3.55859375, -1.708984375, 0.140625, 1.990234375, 3.83984375, 5.689453125, 7.5390625, 9.388671875, 11.23828125, 13.087890625, 14.9375, 16.787109375, 18.63671875, 20.486328125, 22.3359375, 24.185546875, 26.03515625, 27.884765625, 29.734375, 31.583984375, 33.43359375, 35.283203125, 37.1328125, 38.982421875, 40.83203125, 42.681640625, 44.53125, 46.380859375, 48.23046875, 50.080078125, 51.9296875, 53.779296875, 55.62890625, 57.478515625, 59.328125, 61.177734375, 63.02734375, 64.876953125, 66.7265625, 68.576171875, 70.42578125, 72.275390625, 74.125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 12.0, 20.0, 62.0, 131.0, 261.0, 267.0, 170.0, 65.0, 22.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.441036224365234, -42.25052261352539, -38.06000900268555, -33.86949157714844, -29.678979873657227, -25.488466262817383, -21.297950744628906, -17.107437133789062, -12.916923522949219, -8.726409912109375, -4.535895347595215, -0.3453807830810547, 3.845132827758789, 8.035646438598633, 12.22616195678711, 16.416675567626953, 20.607189178466797, 24.79770278930664, 28.988216400146484, 33.178733825683594, 37.36924743652344, 41.55976104736328, 45.750274658203125, 49.94078826904297, 54.13130187988281, 58.321815490722656, 62.5123291015625, 66.70284271240234, 70.89335632324219, 75.08386993408203, 79.27438354492188, 83.46490478515625, 87.65541076660156, 91.8459243774414, 96.03643798828125, 100.2269515991211, 104.41746520996094, 108.60797882080078, 112.79849243164062, 116.989013671875, 121.17951965332031, 125.37003326416016, 129.560546875, 133.75106811523438, 137.9415740966797, 142.13209533691406, 146.32260131835938, 150.51312255859375, 154.70364379882812, 158.8941650390625, 163.0846710205078, 167.2751922607422, 171.4656982421875, 175.65621948242188, 179.8467254638672, 184.03724670410156, 188.22775268554688, 192.41827392578125, 196.60877990722656, 200.79930114746094, 204.98980712890625, 209.18032836914062, 213.37083435058594, 217.5613555908203, 221.75186157226562]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 10.0, 4.0, 10.0, 4.0, 8.0, 6.0, 12.0, 15.0, 11.0, 21.0, 23.0, 23.0, 37.0, 35.0, 27.0, 31.0, 41.0, 42.0, 43.0, 42.0, 40.0, 46.0, 29.0, 42.0, 50.0, 36.0, 50.0, 31.0, 37.0, 26.0, 33.0, 27.0, 14.0, 14.0, 18.0, 16.0, 18.0, 7.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.21797180175781, -48.60258102416992, -46.9871940612793, -45.371803283691406, -43.75641632080078, -42.14102554321289, -40.525638580322266, -38.910247802734375, -37.29486083984375, -35.67947006225586, -34.064083099365234, -32.448692321777344, -30.83330535888672, -29.217914581298828, -27.602527618408203, -25.987136840820312, -24.371747970581055, -22.756359100341797, -21.14097023010254, -19.52558135986328, -17.910192489624023, -16.294803619384766, -14.679413795471191, -13.064024925231934, -11.448636054992676, -9.833247184753418, -8.21785831451416, -6.602468967437744, -4.987080097198486, -3.3716907501220703, -1.7563018798828125, -0.1409130096435547, 1.4744758605957031, 3.089864730834961, 4.705253601074219, 6.320642948150635, 7.936031818389893, 9.551421165466309, 11.166810035705566, 12.782198905944824, 14.397587776184082, 16.012977600097656, 17.628366470336914, 19.243755340576172, 20.85914421081543, 22.474533081054688, 24.089921951293945, 25.705310821533203, 27.32069969177246, 28.93608856201172, 30.551477432250977, 32.166866302490234, 33.782257080078125, 35.39764404296875, 37.01303482055664, 38.628421783447266, 40.243812561035156, 41.85920333862305, 43.47459030151367, 45.08998107910156, 46.70536804199219, 48.32075881958008, 49.9361457824707, 51.551536560058594, 53.16692352294922]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 14.0, 19.0, 16.0, 25.0, 38.0, 29.0, 42.0, 34.0, 43.0, 35.0, 52.0, 46.0, 82.0, 62.0, 54.0, 52.0, 41.0, 39.0, 52.0, 30.0, 28.0, 27.0, 30.0, 26.0, 24.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.76910400390625, -4.5733642578125, -4.37762451171875, -4.181884765625, -3.98614501953125, -3.7904052734375, -3.59466552734375, -3.39892578125, -3.20318603515625, -3.0074462890625, -2.81170654296875, -2.615966796875, -2.42022705078125, -2.2244873046875, -2.02874755859375, -1.8330078125, -1.63726806640625, -1.4415283203125, -1.24578857421875, -1.050048828125, -0.85430908203125, -0.6585693359375, -0.46282958984375, -0.26708984375, -0.07135009765625, 0.1243896484375, 0.32012939453125, 0.515869140625, 0.71160888671875, 0.9073486328125, 1.10308837890625, 1.298828125, 1.49456787109375, 1.6903076171875, 1.88604736328125, 2.081787109375, 2.27752685546875, 2.4732666015625, 2.66900634765625, 2.86474609375, 3.06048583984375, 3.2562255859375, 3.45196533203125, 3.647705078125, 3.84344482421875, 4.0391845703125, 4.23492431640625, 4.4306640625, 4.62640380859375, 4.8221435546875, 5.01788330078125, 5.213623046875, 5.40936279296875, 5.6051025390625, 5.80084228515625, 5.99658203125, 6.19232177734375, 6.3880615234375, 6.58380126953125, 6.779541015625, 6.97528076171875, 7.1710205078125, 7.36676025390625, 7.5625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 4.0, 12.0, 8.0, 19.0, 35.0, 36.0, 62.0, 109.0, 149.0, 245.0, 324.0, 516.0, 770.0, 1203.0, 1898.0, 2879.0, 4353.0, 7006.0, 10990.0, 18114.0, 30249.0, 52365.0, 95024.0, 186375.0, 275900.0, 159569.0, 83228.0, 46020.0, 27136.0, 16240.0, 10057.0, 6240.0, 3919.0, 2587.0, 1661.0, 1133.0, 766.0, 461.0, 302.0, 203.0, 152.0, 95.0, 56.0, 29.0, 13.0, 21.0, 16.0, 2.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7273178100585938, -0.7041473388671875, -0.6809768676757812, -0.657806396484375, -0.6346359252929688, -0.6114654541015625, -0.5882949829101562, -0.56512451171875, -0.5419540405273438, -0.5187835693359375, -0.49561309814453125, -0.472442626953125, -0.44927215576171875, -0.4261016845703125, -0.40293121337890625, -0.3797607421875, -0.35659027099609375, -0.3334197998046875, -0.31024932861328125, -0.287078857421875, -0.26390838623046875, -0.2407379150390625, -0.21756744384765625, -0.19439697265625, -0.17122650146484375, -0.1480560302734375, -0.12488555908203125, -0.101715087890625, -0.07854461669921875, -0.0553741455078125, -0.03220367431640625, -0.009033203125, 0.01413726806640625, 0.0373077392578125, 0.06047821044921875, 0.083648681640625, 0.10681915283203125, 0.1299896240234375, 0.15316009521484375, 0.17633056640625, 0.19950103759765625, 0.2226715087890625, 0.24584197998046875, 0.269012451171875, 0.29218292236328125, 0.3153533935546875, 0.33852386474609375, 0.3616943359375, 0.38486480712890625, 0.4080352783203125, 0.43120574951171875, 0.454376220703125, 0.47754669189453125, 0.5007171630859375, 0.5238876342773438, 0.54705810546875, 0.5702285766601562, 0.5933990478515625, 0.6165695190429688, 0.639739990234375, 0.6629104614257812, 0.6860809326171875, 0.7092514038085938, 0.732421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 10.0, 4.0, 5.0, 9.0, 14.0, 11.0, 11.0, 21.0, 18.0, 30.0, 21.0, 32.0, 36.0, 30.0, 47.0, 50.0, 32.0, 52.0, 50.0, 1072.0, 60.0, 44.0, 37.0, 23.0, 29.0, 47.0, 26.0, 26.0, 21.0, 15.0, 11.0, 23.0, 20.0, 15.0, 12.0, 7.0, 12.0, 4.0, 7.0, 4.0, 11.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.091796875, -2.996337890625, -2.90087890625, -2.805419921875, -2.7099609375, -2.614501953125, -2.51904296875, -2.423583984375, -2.328125, -2.232666015625, -2.13720703125, -2.041748046875, -1.9462890625, -1.850830078125, -1.75537109375, -1.659912109375, -1.564453125, -1.468994140625, -1.37353515625, -1.278076171875, -1.1826171875, -1.087158203125, -0.99169921875, -0.896240234375, -0.80078125, -0.705322265625, -0.60986328125, -0.514404296875, -0.4189453125, -0.323486328125, -0.22802734375, -0.132568359375, -0.037109375, 0.058349609375, 0.15380859375, 0.249267578125, 0.3447265625, 0.440185546875, 0.53564453125, 0.631103515625, 0.7265625, 0.822021484375, 0.91748046875, 1.012939453125, 1.1083984375, 1.203857421875, 1.29931640625, 1.394775390625, 1.490234375, 1.585693359375, 1.68115234375, 1.776611328125, 1.8720703125, 1.967529296875, 2.06298828125, 2.158447265625, 2.25390625, 2.349365234375, 2.44482421875, 2.540283203125, 2.6357421875, 2.731201171875, 2.82666015625, 2.922119140625, 3.017578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 6.0, 8.0, 8.0, 14.0, 11.0, 26.0, 28.0, 29.0, 51.0, 87.0, 115.0, 149.0, 214.0, 326.0, 468.0, 691.0, 1031.0, 1421.0, 2158.0, 3080.0, 4880.0, 7158.0, 11244.0, 17447.0, 27868.0, 45717.0, 78739.0, 146662.0, 1297425.0, 195314.0, 102404.0, 57229.0, 34061.0, 21028.0, 13575.0, 8690.0, 5768.0, 3704.0, 2588.0, 1783.0, 1208.0, 844.0, 575.0, 417.0, 261.0, 193.0, 126.0, 94.0, 69.0, 41.0, 32.0, 30.0, 21.0, 7.0, 5.0, 6.0, 5.0, 5.0, 2.0, 1.0], "bins": [-0.57763671875, -0.5599822998046875, -0.542327880859375, -0.5246734619140625, -0.50701904296875, -0.4893646240234375, -0.471710205078125, -0.4540557861328125, -0.4364013671875, -0.4187469482421875, -0.401092529296875, -0.3834381103515625, -0.36578369140625, -0.3481292724609375, -0.330474853515625, -0.3128204345703125, -0.295166015625, -0.2775115966796875, -0.259857177734375, -0.2422027587890625, -0.22454833984375, -0.2068939208984375, -0.189239501953125, -0.1715850830078125, -0.1539306640625, -0.1362762451171875, -0.118621826171875, -0.1009674072265625, -0.08331298828125, -0.0656585693359375, -0.048004150390625, -0.0303497314453125, -0.0126953125, 0.0049591064453125, 0.022613525390625, 0.0402679443359375, 0.05792236328125, 0.0755767822265625, 0.093231201171875, 0.1108856201171875, 0.1285400390625, 0.1461944580078125, 0.163848876953125, 0.1815032958984375, 0.19915771484375, 0.2168121337890625, 0.234466552734375, 0.2521209716796875, 0.269775390625, 0.2874298095703125, 0.305084228515625, 0.3227386474609375, 0.34039306640625, 0.3580474853515625, 0.375701904296875, 0.3933563232421875, 0.4110107421875, 0.4286651611328125, 0.446319580078125, 0.4639739990234375, 0.48162841796875, 0.4992828369140625, 0.516937255859375, 0.5345916748046875, 0.55224609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 6.0, 4.0, 8.0, 11.0, 17.0, 18.0, 28.0, 32.0, 24.0, 35.0, 45.0, 55.0, 67.0, 83.0, 99.0, 62.0, 75.0, 62.0, 56.0, 42.0, 35.0, 31.0, 14.0, 16.0, 15.0, 11.0, 11.0, 9.0, 4.0, 0.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0019378662109375, -0.0018814951181411743, -0.0018251240253448486, -0.001768752932548523, -0.0017123818397521973, -0.0016560107469558716, -0.001599639654159546, -0.0015432685613632202, -0.0014868974685668945, -0.0014305263757705688, -0.0013741552829742432, -0.0013177841901779175, -0.0012614130973815918, -0.0012050420045852661, -0.0011486709117889404, -0.0010922998189926147, -0.001035928726196289, -0.0009795576333999634, -0.0009231865406036377, -0.000866815447807312, -0.0008104443550109863, -0.0007540732622146606, -0.000697702169418335, -0.0006413310766220093, -0.0005849599838256836, -0.0005285888910293579, -0.0004722177982330322, -0.00041584670543670654, -0.00035947561264038086, -0.0003031045198440552, -0.0002467334270477295, -0.0001903623342514038, -0.00013399124145507812, -7.762014865875244e-05, -2.1249055862426758e-05, 3.5122036933898926e-05, 9.149312973022461e-05, 0.0001478642225265503, 0.00020423531532287598, 0.00026060640811920166, 0.00031697750091552734, 0.00037334859371185303, 0.0004297196865081787, 0.0004860907793045044, 0.0005424618721008301, 0.0005988329648971558, 0.0006552040576934814, 0.0007115751504898071, 0.0007679462432861328, 0.0008243173360824585, 0.0008806884288787842, 0.0009370595216751099, 0.0009934306144714355, 0.0010498017072677612, 0.001106172800064087, 0.0011625438928604126, 0.0012189149856567383, 0.001275286078453064, 0.0013316571712493896, 0.0013880282640457153, 0.001444399356842041, 0.0015007704496383667, 0.0015571415424346924, 0.001613512635231018, 0.0016698837280273438]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 7.0, 16.0, 14.0, 26.0, 26.0, 32.0, 46.0, 87.0, 128.0, 149.0, 251.0, 446.0, 1738.0, 1023206.0, 20807.0, 665.0, 304.0, 170.0, 114.0, 82.0, 68.0, 41.0, 30.0, 22.0, 14.0, 8.0, 8.0, 6.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0341796875, -0.032946109771728516, -0.03171253204345703, -0.030478954315185547, -0.029245376586914062, -0.028011798858642578, -0.026778221130371094, -0.02554464340209961, -0.024311065673828125, -0.02307748794555664, -0.021843910217285156, -0.020610332489013672, -0.019376754760742188, -0.018143177032470703, -0.01690959930419922, -0.015676021575927734, -0.01444244384765625, -0.013208866119384766, -0.011975288391113281, -0.010741710662841797, -0.009508132934570312, -0.008274555206298828, -0.007040977478027344, -0.005807399749755859, -0.004573822021484375, -0.0033402442932128906, -0.0021066665649414062, -0.0008730888366699219, 0.0003604888916015625, 0.0015940666198730469, 0.0028276443481445312, 0.004061222076416016, 0.0052947998046875, 0.006528377532958984, 0.007761955261230469, 0.008995532989501953, 0.010229110717773438, 0.011462688446044922, 0.012696266174316406, 0.01392984390258789, 0.015163421630859375, 0.01639699935913086, 0.017630577087402344, 0.018864154815673828, 0.020097732543945312, 0.021331310272216797, 0.02256488800048828, 0.023798465728759766, 0.02503204345703125, 0.026265621185302734, 0.02749919891357422, 0.028732776641845703, 0.029966354370117188, 0.031199932098388672, 0.032433509826660156, 0.03366708755493164, 0.034900665283203125, 0.03613424301147461, 0.037367820739746094, 0.03860139846801758, 0.03983497619628906, 0.04106855392456055, 0.04230213165283203, 0.043535709381103516, 0.044769287109375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 26.0, 620.0, 364.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008985470049083233, -0.008765552192926407, -0.00854563433676958, -0.008325716480612755, -0.008105798624455929, -0.007885880768299103, -0.007665962912142277, -0.007446045055985451, -0.007226127199828625, -0.007006209343671799, -0.006786291487514973, -0.006566373631358147, -0.006346455775201321, -0.006126537919044495, -0.005906620062887669, -0.005686702206730843, -0.005466783884912729, -0.005246866028755903, -0.005026948172599077, -0.004807030316442251, -0.004587112460285425, -0.004367194604128599, -0.004147276282310486, -0.00392735842615366, -0.0037074408028274775, -0.0034875229466706514, -0.0032676050905138254, -0.0030476870015263557, -0.0028277691453695297, -0.0026078512892127037, -0.0023879334330558777, -0.0021680155768990517, -0.0019480977207422256, -0.0017281798645853996, -0.0015082620084285736, -0.0012883440358564258, -0.0010684261796995997, -0.0008485083235427737, -0.0006285903509706259, -0.00040867249481379986, -0.00018875463865697384, 3.116324660368264e-05, 0.0002510811318643391, 0.00047099904622882605, 0.0006909169023856521, 0.0009108347585424781, 0.001130752731114626, 0.001350670587271452, 0.001570588443428278, 0.001790506299585104, 0.00201042415574193, 0.002230342011898756, 0.002450259868055582, 0.002670177724212408, 0.0028900958131998777, 0.0031100136693567038, 0.0033299315255135298, 0.003549849381670356, 0.003769767237827182, 0.0039896853268146515, 0.0042096031829714775, 0.0044295210391283035, 0.0046494388952851295, 0.004869356751441956, 0.005089274607598782]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 14.0, 9.0, 13.0, 11.0, 14.0, 16.0, 12.0, 14.0, 26.0, 12.0, 24.0, 31.0, 33.0, 39.0, 40.0, 41.0, 45.0, 39.0, 39.0, 30.0, 43.0, 30.0, 43.0, 35.0, 34.0, 30.0, 36.0, 34.0, 30.0, 22.0, 20.0, 20.0, 21.0, 17.0, 13.0, 16.0, 11.0, 8.0, 10.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000735938549041748, -0.0007114782929420471, -0.0006870180368423462, -0.0006625577807426453, -0.0006380975246429443, -0.0006136372685432434, -0.0005891770124435425, -0.0005647167563438416, -0.0005402565002441406, -0.0005157962441444397, -0.0004913359880447388, -0.00046687573194503784, -0.0004424154758453369, -0.000417955219745636, -0.00039349496364593506, -0.00036903470754623413, -0.0003445744514465332, -0.0003201141953468323, -0.00029565393924713135, -0.0002711936831474304, -0.0002467334270477295, -0.00022227317094802856, -0.00019781291484832764, -0.0001733526587486267, -0.00014889240264892578, -0.00012443214654922485, -9.997189044952393e-05, -7.5511634349823e-05, -5.105137825012207e-05, -2.6591122150421143e-05, -2.130866050720215e-06, 2.2329390048980713e-05, 4.678964614868164e-05, 7.124990224838257e-05, 9.57101583480835e-05, 0.00012017041444778442, 0.00014463067054748535, 0.00016909092664718628, 0.0001935511827468872, 0.00021801143884658813, 0.00024247169494628906, 0.00026693195104599, 0.0002913922071456909, 0.00031585246324539185, 0.0003403127193450928, 0.0003647729754447937, 0.00038923323154449463, 0.00041369348764419556, 0.0004381537437438965, 0.0004626139998435974, 0.00048707425594329834, 0.0005115345120429993, 0.0005359947681427002, 0.0005604550242424011, 0.000584915280342102, 0.000609375536441803, 0.0006338357925415039, 0.0006582960486412048, 0.0006827563047409058, 0.0007072165608406067, 0.0007316768169403076, 0.0007561370730400085, 0.0007805973291397095, 0.0008050575852394104, 0.0008295178413391113]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 11.0, 14.0, 19.0, 16.0, 25.0, 38.0, 29.0, 42.0, 34.0, 43.0, 35.0, 52.0, 46.0, 82.0, 62.0, 54.0, 52.0, 41.0, 39.0, 52.0, 30.0, 28.0, 27.0, 30.0, 26.0, 24.0, 8.0, 12.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.76910400390625, -4.5733642578125, -4.37762451171875, -4.181884765625, -3.98614501953125, -3.7904052734375, -3.59466552734375, -3.39892578125, -3.20318603515625, -3.0074462890625, -2.81170654296875, -2.615966796875, -2.42022705078125, -2.2244873046875, -2.02874755859375, -1.8330078125, -1.63726806640625, -1.4415283203125, -1.24578857421875, -1.050048828125, -0.85430908203125, -0.6585693359375, -0.46282958984375, -0.26708984375, -0.07135009765625, 0.1243896484375, 0.32012939453125, 0.515869140625, 0.71160888671875, 0.9073486328125, 1.10308837890625, 1.298828125, 1.49456787109375, 1.6903076171875, 1.88604736328125, 2.081787109375, 2.27752685546875, 2.4732666015625, 2.66900634765625, 2.86474609375, 3.06048583984375, 3.2562255859375, 3.45196533203125, 3.647705078125, 3.84344482421875, 4.0391845703125, 4.23492431640625, 4.4306640625, 4.62640380859375, 4.8221435546875, 5.01788330078125, 5.213623046875, 5.40936279296875, 5.6051025390625, 5.80084228515625, 5.99658203125, 6.19232177734375, 6.3880615234375, 6.58380126953125, 6.779541015625, 6.97528076171875, 7.1710205078125, 7.36676025390625, 7.5625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 11.0, 16.0, 26.0, 34.0, 52.0, 95.0, 113.0, 193.0, 320.0, 500.0, 829.0, 1452.0, 2397.0, 4298.0, 8166.0, 17234.0, 43438.0, 138707.0, 481179.0, 234452.0, 66866.0, 24641.0, 10686.0, 5473.0, 2954.0, 1744.0, 995.0, 612.0, 396.0, 258.0, 144.0, 91.0, 62.0, 41.0, 24.0, 15.0, 13.0, 7.0, 10.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.96209716796875, -2.8421630859375, -2.72222900390625, -2.602294921875, -2.48236083984375, -2.3624267578125, -2.24249267578125, -2.12255859375, -2.00262451171875, -1.8826904296875, -1.76275634765625, -1.642822265625, -1.52288818359375, -1.4029541015625, -1.28302001953125, -1.1630859375, -1.04315185546875, -0.9232177734375, -0.80328369140625, -0.683349609375, -0.56341552734375, -0.4434814453125, -0.32354736328125, -0.20361328125, -0.08367919921875, 0.0362548828125, 0.15618896484375, 0.276123046875, 0.39605712890625, 0.5159912109375, 0.63592529296875, 0.755859375, 0.87579345703125, 0.9957275390625, 1.11566162109375, 1.235595703125, 1.35552978515625, 1.4754638671875, 1.59539794921875, 1.71533203125, 1.83526611328125, 1.9552001953125, 2.07513427734375, 2.195068359375, 2.31500244140625, 2.4349365234375, 2.55487060546875, 2.6748046875, 2.79473876953125, 2.9146728515625, 3.03460693359375, 3.154541015625, 3.27447509765625, 3.3944091796875, 3.51434326171875, 3.63427734375, 3.75421142578125, 3.8741455078125, 3.99407958984375, 4.114013671875, 4.23394775390625, 4.3538818359375, 4.47381591796875, 4.59375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 8.0, 9.0, 13.0, 11.0, 9.0, 15.0, 25.0, 19.0, 27.0, 16.0, 34.0, 35.0, 47.0, 44.0, 52.0, 69.0, 56.0, 168.0, 1830.0, 123.0, 53.0, 54.0, 43.0, 39.0, 44.0, 32.0, 27.0, 23.0, 20.0, 19.0, 17.0, 17.0, 11.0, 9.0, 8.0, 4.0, 4.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.640625, -22.051513671875, -21.46240234375, -20.873291015625, -20.2841796875, -19.695068359375, -19.10595703125, -18.516845703125, -17.927734375, -17.338623046875, -16.74951171875, -16.160400390625, -15.5712890625, -14.982177734375, -14.39306640625, -13.803955078125, -13.21484375, -12.625732421875, -12.03662109375, -11.447509765625, -10.8583984375, -10.269287109375, -9.68017578125, -9.091064453125, -8.501953125, -7.912841796875, -7.32373046875, -6.734619140625, -6.1455078125, -5.556396484375, -4.96728515625, -4.378173828125, -3.7890625, -3.199951171875, -2.61083984375, -2.021728515625, -1.4326171875, -0.843505859375, -0.25439453125, 0.334716796875, 0.923828125, 1.512939453125, 2.10205078125, 2.691162109375, 3.2802734375, 3.869384765625, 4.45849609375, 5.047607421875, 5.63671875, 6.225830078125, 6.81494140625, 7.404052734375, 7.9931640625, 8.582275390625, 9.17138671875, 9.760498046875, 10.349609375, 10.938720703125, 11.52783203125, 12.116943359375, 12.7060546875, 13.295166015625, 13.88427734375, 14.473388671875, 15.0625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 3.0, 3.0, 8.0, 7.0, 14.0, 18.0, 15.0, 21.0, 18.0, 33.0, 19.0, 55.0, 67.0, 87.0, 165.0, 307.0, 775.0, 5448.0, 2483315.0, 649781.0, 3920.0, 729.0, 283.0, 180.0, 105.0, 77.0, 39.0, 37.0, 36.0, 21.0, 17.0, 21.0, 14.0, 14.0, 11.0, 11.0, 7.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.859375, -24.899658203125, -23.93994140625, -22.980224609375, -22.0205078125, -21.060791015625, -20.10107421875, -19.141357421875, -18.181640625, -17.221923828125, -16.26220703125, -15.302490234375, -14.3427734375, -13.383056640625, -12.42333984375, -11.463623046875, -10.50390625, -9.544189453125, -8.58447265625, -7.624755859375, -6.6650390625, -5.705322265625, -4.74560546875, -3.785888671875, -2.826171875, -1.866455078125, -0.90673828125, 0.052978515625, 1.0126953125, 1.972412109375, 2.93212890625, 3.891845703125, 4.8515625, 5.811279296875, 6.77099609375, 7.730712890625, 8.6904296875, 9.650146484375, 10.60986328125, 11.569580078125, 12.529296875, 13.489013671875, 14.44873046875, 15.408447265625, 16.3681640625, 17.327880859375, 18.28759765625, 19.247314453125, 20.20703125, 21.166748046875, 22.12646484375, 23.086181640625, 24.0458984375, 25.005615234375, 25.96533203125, 26.925048828125, 27.884765625, 28.844482421875, 29.80419921875, 30.763916015625, 31.7236328125, 32.683349609375, 33.64306640625, 34.602783203125, 35.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 312.0, 675.0, 26.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.09268188476562, -233.99868774414062, -229.90469360351562, -225.81068420410156, -221.71669006347656, -217.62269592285156, -213.5286865234375, -209.4346923828125, -205.3406982421875, -201.2467041015625, -197.1527099609375, -193.05870056152344, -188.96470642089844, -184.87071228027344, -180.77670288085938, -176.68270874023438, -172.58871459960938, -168.49472045898438, -164.40072631835938, -160.3067169189453, -156.2127227783203, -152.1187286376953, -148.02471923828125, -143.93072509765625, -139.83673095703125, -135.74273681640625, -131.64874267578125, -127.55473327636719, -123.46073913574219, -119.36674499511719, -115.27274322509766, -111.17874145507812, -107.08473205566406, -102.99073791503906, -98.89673614501953, -94.802734375, -90.708740234375, -86.61474609375, -82.52074432373047, -78.42674255371094, -74.33274841308594, -70.23875427246094, -66.1447525024414, -62.05075454711914, -57.956756591796875, -53.86275863647461, -49.768760681152344, -45.67476272583008, -41.58076858520508, -37.48677062988281, -33.39277267456055, -29.29877471923828, -25.204776763916016, -21.11077880859375, -17.016780853271484, -12.922782897949219, -8.828784942626953, -4.7347869873046875, -0.6407890319824219, 3.4532089233398438, 7.547206878662109, 11.641204833984375, 15.73520278930664, 19.829200744628906, 23.923198699951172]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 3.0, 9.0, 11.0, 12.0, 21.0, 23.0, 28.0, 32.0, 26.0, 26.0, 27.0, 28.0, 34.0, 37.0, 29.0, 35.0, 49.0, 48.0, 59.0, 43.0, 36.0, 39.0, 39.0, 35.0, 26.0, 24.0, 34.0, 25.0, 22.0, 17.0, 18.0, 13.0, 11.0, 10.0, 14.0, 3.0, 13.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-58.52305221557617, -56.78562545776367, -55.04820251464844, -53.31077575683594, -51.5733528137207, -49.8359260559082, -48.09850311279297, -46.36107635498047, -44.62364959716797, -42.88622283935547, -41.148799896240234, -39.411373138427734, -37.6739501953125, -35.9365234375, -34.1990966796875, -32.461673736572266, -30.7242488861084, -28.98682403564453, -27.249399185180664, -25.511974334716797, -23.774547576904297, -22.03712272644043, -20.299697875976562, -18.562271118164062, -16.824848175048828, -15.087423324584961, -13.349997520446777, -11.61257266998291, -9.875146865844727, -8.13772201538086, -6.400297164916992, -4.662871360778809, -2.925445556640625, -1.1880203485488892, 0.5494048595428467, 2.286829948425293, 4.024255275726318, 5.761680603027344, 7.499105453491211, 9.236531257629395, 10.973956108093262, 12.711380958557129, 14.448806762695312, 16.18623161315918, 17.923656463623047, 19.661083221435547, 21.39850616455078, 23.13593292236328, 24.87335777282715, 26.610782623291016, 28.348207473754883, 30.08563232421875, 31.82305908203125, 33.56048583984375, 35.297908782958984, 37.035335540771484, 38.77275848388672, 40.51018524169922, 42.24760818481445, 43.98503494262695, 45.72245788574219, 47.45988464355469, 49.19731140136719, 50.93473434448242, 52.67216110229492]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 5.0, 3.0, 12.0, 13.0, 17.0, 15.0, 23.0, 28.0, 44.0, 31.0, 41.0, 38.0, 39.0, 42.0, 57.0, 64.0, 62.0, 62.0, 51.0, 34.0, 43.0, 49.0, 37.0, 28.0, 25.0, 27.0, 24.0, 29.0, 17.0, 13.0, 14.0, 4.0, 9.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.6964111328125, -4.498291015625, -4.3001708984375, -4.10205078125, -3.9039306640625, -3.705810546875, -3.5076904296875, -3.3095703125, -3.1114501953125, -2.913330078125, -2.7152099609375, -2.51708984375, -2.3189697265625, -2.120849609375, -1.9227294921875, -1.724609375, -1.5264892578125, -1.328369140625, -1.1302490234375, -0.93212890625, -0.7340087890625, -0.535888671875, -0.3377685546875, -0.1396484375, 0.0584716796875, 0.256591796875, 0.4547119140625, 0.65283203125, 0.8509521484375, 1.049072265625, 1.2471923828125, 1.4453125, 1.6434326171875, 1.841552734375, 2.0396728515625, 2.23779296875, 2.4359130859375, 2.634033203125, 2.8321533203125, 3.0302734375, 3.2283935546875, 3.426513671875, 3.6246337890625, 3.82275390625, 4.0208740234375, 4.218994140625, 4.4171142578125, 4.615234375, 4.8133544921875, 5.011474609375, 5.2095947265625, 5.40771484375, 5.6058349609375, 5.803955078125, 6.0020751953125, 6.2001953125, 6.3983154296875, 6.596435546875, 6.7945556640625, 6.99267578125, 7.1907958984375, 7.388916015625, 7.5870361328125, 7.78515625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 11.0, 20.0, 17.0, 15.0, 22.0, 29.0, 31.0, 36.0, 43.0, 43.0, 74.0, 208.0, 1589.0, 46972.0, 3794128.0, 345340.0, 4921.0, 371.0, 110.0, 53.0, 50.0, 33.0, 30.0, 22.0, 28.0, 17.0, 20.0, 11.0, 10.0, 14.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.28125, -27.1806640625, -26.080078125, -24.9794921875, -23.87890625, -22.7783203125, -21.677734375, -20.5771484375, -19.4765625, -18.3759765625, -17.275390625, -16.1748046875, -15.07421875, -13.9736328125, -12.873046875, -11.7724609375, -10.671875, -9.5712890625, -8.470703125, -7.3701171875, -6.26953125, -5.1689453125, -4.068359375, -2.9677734375, -1.8671875, -0.7666015625, 0.333984375, 1.4345703125, 2.53515625, 3.6357421875, 4.736328125, 5.8369140625, 6.9375, 8.0380859375, 9.138671875, 10.2392578125, 11.33984375, 12.4404296875, 13.541015625, 14.6416015625, 15.7421875, 16.8427734375, 17.943359375, 19.0439453125, 20.14453125, 21.2451171875, 22.345703125, 23.4462890625, 24.546875, 25.6474609375, 26.748046875, 27.8486328125, 28.94921875, 30.0498046875, 31.150390625, 32.2509765625, 33.3515625, 34.4521484375, 35.552734375, 36.6533203125, 37.75390625, 38.8544921875, 39.955078125, 41.0556640625, 42.15625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 10.0, 8.0, 23.0, 35.0, 58.0, 84.0, 125.0, 183.0, 262.0, 440.0, 635.0, 672.0, 559.0, 351.0, 237.0, 158.0, 97.0, 55.0, 37.0, 12.0, 9.0, 9.0, 6.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-28.125, -27.4727783203125, -26.820556640625, -26.1683349609375, -25.51611328125, -24.8638916015625, -24.211669921875, -23.5594482421875, -22.9072265625, -22.2550048828125, -21.602783203125, -20.9505615234375, -20.29833984375, -19.6461181640625, -18.993896484375, -18.3416748046875, -17.689453125, -17.0372314453125, -16.385009765625, -15.7327880859375, -15.08056640625, -14.4283447265625, -13.776123046875, -13.1239013671875, -12.4716796875, -11.8194580078125, -11.167236328125, -10.5150146484375, -9.86279296875, -9.2105712890625, -8.558349609375, -7.9061279296875, -7.25390625, -6.6016845703125, -5.949462890625, -5.2972412109375, -4.64501953125, -3.9927978515625, -3.340576171875, -2.6883544921875, -2.0361328125, -1.3839111328125, -0.731689453125, -0.0794677734375, 0.57275390625, 1.2249755859375, 1.877197265625, 2.5294189453125, 3.181640625, 3.8338623046875, 4.486083984375, 5.1383056640625, 5.79052734375, 6.4427490234375, 7.094970703125, 7.7471923828125, 8.3994140625, 9.0516357421875, 9.703857421875, 10.3560791015625, 11.00830078125, 11.6605224609375, 12.312744140625, 12.9649658203125, 13.6171875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 14.0, 38.0, 60.0, 66.0, 100.0, 165.0, 241.0, 535.0, 1951.0, 33829.0, 3722275.0, 426683.0, 6500.0, 902.0, 334.0, 174.0, 144.0, 92.0, 37.0, 26.0, 31.0, 23.0, 15.0, 10.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.31982421875, -39.4208984375, -37.52197265625, -35.623046875, -33.72412109375, -31.8251953125, -29.92626953125, -28.02734375, -26.12841796875, -24.2294921875, -22.33056640625, -20.431640625, -18.53271484375, -16.6337890625, -14.73486328125, -12.8359375, -10.93701171875, -9.0380859375, -7.13916015625, -5.240234375, -3.34130859375, -1.4423828125, 0.45654296875, 2.35546875, 4.25439453125, 6.1533203125, 8.05224609375, 9.951171875, 11.85009765625, 13.7490234375, 15.64794921875, 17.546875, 19.44580078125, 21.3447265625, 23.24365234375, 25.142578125, 27.04150390625, 28.9404296875, 30.83935546875, 32.73828125, 34.63720703125, 36.5361328125, 38.43505859375, 40.333984375, 42.23291015625, 44.1318359375, 46.03076171875, 47.9296875, 49.82861328125, 51.7275390625, 53.62646484375, 55.525390625, 57.42431640625, 59.3232421875, 61.22216796875, 63.12109375, 65.02001953125, 66.9189453125, 68.81787109375, 70.716796875, 72.61572265625, 74.5146484375, 76.41357421875, 78.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 21.0, 42.0, 95.0, 191.0, 224.0, 183.0, 163.0, 61.0, 20.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.32640075683594, -131.41815185546875, -127.50990295410156, -123.60165405273438, -119.69340515136719, -115.78515625, -111.87689971923828, -107.9686508178711, -104.0604019165039, -100.15215301513672, -96.24390411376953, -92.33565521240234, -88.42739868164062, -84.51914978027344, -80.61090087890625, -76.70265197753906, -72.79440307617188, -68.88615417480469, -64.9779052734375, -61.06965255737305, -57.16140365600586, -53.25315475463867, -49.34490203857422, -45.43665313720703, -41.528404235839844, -37.620155334472656, -33.71190643310547, -29.803653717041016, -25.895404815673828, -21.98715591430664, -18.07890510559082, -14.170654296875, -10.262405395507812, -6.354155540466309, -2.4459056854248047, 1.4623441696166992, 5.370594024658203, 9.27884292602539, 13.187093734741211, 17.09534454345703, 21.00359344482422, 24.911842346191406, 28.820093154907227, 32.72834396362305, 36.636592864990234, 40.54484176635742, 44.453094482421875, 48.36134338378906, 52.26959228515625, 56.17784118652344, 60.086090087890625, 63.99434280395508, 67.902587890625, 71.81083679199219, 75.7190933227539, 79.6273422241211, 83.53559112548828, 87.44384002685547, 91.35208892822266, 95.26033782958984, 99.16859436035156, 103.07684326171875, 106.98509216308594, 110.89334106445312, 114.80158996582031]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 10.0, 12.0, 11.0, 15.0, 21.0, 23.0, 21.0, 27.0, 20.0, 22.0, 26.0, 36.0, 44.0, 48.0, 44.0, 34.0, 39.0, 32.0, 43.0, 35.0, 42.0, 45.0, 45.0, 33.0, 27.0, 25.0, 28.0, 30.0, 25.0, 19.0, 18.0, 12.0, 18.0, 13.0, 6.0, 8.0, 10.0, 7.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.94775390625, -48.38202667236328, -46.81629943847656, -45.250572204589844, -43.684844970703125, -42.119117736816406, -40.55339050292969, -38.987667083740234, -37.421939849853516, -35.8562126159668, -34.29048538208008, -32.72475814819336, -31.159032821655273, -29.593305587768555, -28.027578353881836, -26.46185302734375, -24.8961238861084, -23.33039665222168, -21.76466941833496, -20.198944091796875, -18.633216857910156, -17.067489624023438, -15.501762390136719, -13.936036109924316, -12.370308876037598, -10.804581642150879, -9.238855361938477, -7.673128128051758, -6.107401371002197, -4.541674613952637, -2.975947380065918, -1.4102210998535156, 0.15550613403320312, 1.7212330102920532, 3.2869598865509033, 4.852686882019043, 6.4184136390686035, 7.984140396118164, 9.549867630004883, 11.115593910217285, 12.681321144104004, 14.247048377990723, 15.812774658203125, 17.378501892089844, 18.944229125976562, 20.50995635986328, 22.07568359375, 23.641408920288086, 25.207136154174805, 26.772863388061523, 28.338590621948242, 29.904315948486328, 31.470043182373047, 33.035770416259766, 34.601497650146484, 36.1672248840332, 37.73295211791992, 39.29867935180664, 40.86440658569336, 42.43013381958008, 43.9958610534668, 45.56158447265625, 47.12731170654297, 48.69303894042969, 50.258766174316406]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 10.0, 11.0, 16.0, 19.0, 29.0, 26.0, 36.0, 36.0, 32.0, 47.0, 49.0, 49.0, 53.0, 58.0, 52.0, 50.0, 47.0, 48.0, 47.0, 42.0, 36.0, 35.0, 31.0, 30.0, 24.0, 22.0, 21.0, 9.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.398681640625, -5.19580078125, -4.992919921875, -4.7900390625, -4.587158203125, -4.38427734375, -4.181396484375, -3.978515625, -3.775634765625, -3.57275390625, -3.369873046875, -3.1669921875, -2.964111328125, -2.76123046875, -2.558349609375, -2.35546875, -2.152587890625, -1.94970703125, -1.746826171875, -1.5439453125, -1.341064453125, -1.13818359375, -0.935302734375, -0.732421875, -0.529541015625, -0.32666015625, -0.123779296875, 0.0791015625, 0.281982421875, 0.48486328125, 0.687744140625, 0.890625, 1.093505859375, 1.29638671875, 1.499267578125, 1.7021484375, 1.905029296875, 2.10791015625, 2.310791015625, 2.513671875, 2.716552734375, 2.91943359375, 3.122314453125, 3.3251953125, 3.528076171875, 3.73095703125, 3.933837890625, 4.13671875, 4.339599609375, 4.54248046875, 4.745361328125, 4.9482421875, 5.151123046875, 5.35400390625, 5.556884765625, 5.759765625, 5.962646484375, 6.16552734375, 6.368408203125, 6.5712890625, 6.774169921875, 6.97705078125, 7.179931640625, 7.3828125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 16.0, 18.0, 27.0, 35.0, 70.0, 95.0, 117.0, 210.0, 281.0, 431.0, 632.0, 861.0, 1244.0, 1826.0, 2584.0, 3694.0, 5313.0, 7710.0, 11284.0, 16473.0, 24970.0, 38245.0, 61931.0, 105045.0, 193042.0, 230087.0, 131638.0, 74678.0, 45339.0, 29054.0, 19337.0, 13075.0, 9039.0, 6240.0, 4252.0, 2962.0, 2053.0, 1427.0, 1028.0, 661.0, 463.0, 347.0, 220.0, 174.0, 126.0, 56.0, 46.0, 38.0, 19.0, 15.0, 11.0, 9.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66748046875, -0.6467437744140625, -0.626007080078125, -0.6052703857421875, -0.58453369140625, -0.5637969970703125, -0.543060302734375, -0.5223236083984375, -0.5015869140625, -0.4808502197265625, -0.460113525390625, -0.4393768310546875, -0.41864013671875, -0.3979034423828125, -0.377166748046875, -0.3564300537109375, -0.335693359375, -0.3149566650390625, -0.294219970703125, -0.2734832763671875, -0.25274658203125, -0.2320098876953125, -0.211273193359375, -0.1905364990234375, -0.1697998046875, -0.1490631103515625, -0.128326416015625, -0.1075897216796875, -0.08685302734375, -0.0661163330078125, -0.045379638671875, -0.0246429443359375, -0.00390625, 0.0168304443359375, 0.037567138671875, 0.0583038330078125, 0.07904052734375, 0.0997772216796875, 0.120513916015625, 0.1412506103515625, 0.1619873046875, 0.1827239990234375, 0.203460693359375, 0.2241973876953125, 0.24493408203125, 0.2656707763671875, 0.286407470703125, 0.3071441650390625, 0.327880859375, 0.3486175537109375, 0.369354248046875, 0.3900909423828125, 0.41082763671875, 0.4315643310546875, 0.452301025390625, 0.4730377197265625, 0.4937744140625, 0.5145111083984375, 0.535247802734375, 0.5559844970703125, 0.57672119140625, 0.5974578857421875, 0.618194580078125, 0.6389312744140625, 0.65966796875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 7.0, 8.0, 11.0, 9.0, 24.0, 20.0, 21.0, 29.0, 36.0, 27.0, 35.0, 37.0, 41.0, 43.0, 33.0, 48.0, 39.0, 1069.0, 46.0, 45.0, 44.0, 42.0, 36.0, 35.0, 33.0, 30.0, 21.0, 34.0, 22.0, 12.0, 5.0, 15.0, 15.0, 7.0, 11.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.703125, -3.5986328125, -3.494140625, -3.3896484375, -3.28515625, -3.1806640625, -3.076171875, -2.9716796875, -2.8671875, -2.7626953125, -2.658203125, -2.5537109375, -2.44921875, -2.3447265625, -2.240234375, -2.1357421875, -2.03125, -1.9267578125, -1.822265625, -1.7177734375, -1.61328125, -1.5087890625, -1.404296875, -1.2998046875, -1.1953125, -1.0908203125, -0.986328125, -0.8818359375, -0.77734375, -0.6728515625, -0.568359375, -0.4638671875, -0.359375, -0.2548828125, -0.150390625, -0.0458984375, 0.05859375, 0.1630859375, 0.267578125, 0.3720703125, 0.4765625, 0.5810546875, 0.685546875, 0.7900390625, 0.89453125, 0.9990234375, 1.103515625, 1.2080078125, 1.3125, 1.4169921875, 1.521484375, 1.6259765625, 1.73046875, 1.8349609375, 1.939453125, 2.0439453125, 2.1484375, 2.2529296875, 2.357421875, 2.4619140625, 2.56640625, 2.6708984375, 2.775390625, 2.8798828125, 2.984375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 5.0, 13.0, 15.0, 19.0, 19.0, 43.0, 63.0, 87.0, 111.0, 159.0, 224.0, 279.0, 461.0, 591.0, 858.0, 1192.0, 1709.0, 2434.0, 3497.0, 5213.0, 7864.0, 12040.0, 18247.0, 28876.0, 46007.0, 78072.0, 139917.0, 1277014.0, 194291.0, 108090.0, 61731.0, 37869.0, 23532.0, 15545.0, 10085.0, 6460.0, 4392.0, 3056.0, 2060.0, 1494.0, 1060.0, 702.0, 481.0, 397.0, 222.0, 203.0, 137.0, 86.0, 78.0, 49.0, 29.0, 22.0, 20.0, 6.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.54443359375, -0.5267486572265625, -0.509063720703125, -0.4913787841796875, -0.47369384765625, -0.4560089111328125, -0.438323974609375, -0.4206390380859375, -0.4029541015625, -0.3852691650390625, -0.367584228515625, -0.3498992919921875, -0.33221435546875, -0.3145294189453125, -0.296844482421875, -0.2791595458984375, -0.261474609375, -0.2437896728515625, -0.226104736328125, -0.2084197998046875, -0.19073486328125, -0.1730499267578125, -0.155364990234375, -0.1376800537109375, -0.1199951171875, -0.1023101806640625, -0.084625244140625, -0.0669403076171875, -0.04925537109375, -0.0315704345703125, -0.013885498046875, 0.0037994384765625, 0.021484375, 0.0391693115234375, 0.056854248046875, 0.0745391845703125, 0.09222412109375, 0.1099090576171875, 0.127593994140625, 0.1452789306640625, 0.1629638671875, 0.1806488037109375, 0.198333740234375, 0.2160186767578125, 0.23370361328125, 0.2513885498046875, 0.269073486328125, 0.2867584228515625, 0.304443359375, 0.3221282958984375, 0.339813232421875, 0.3574981689453125, 0.37518310546875, 0.3928680419921875, 0.410552978515625, 0.4282379150390625, 0.4459228515625, 0.4636077880859375, 0.481292724609375, 0.4989776611328125, 0.51666259765625, 0.5343475341796875, 0.552032470703125, 0.5697174072265625, 0.58740234375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 4.0, 20.0, 17.0, 10.0, 22.0, 26.0, 48.0, 34.0, 54.0, 65.0, 58.0, 55.0, 76.0, 77.0, 72.0, 66.0, 55.0, 44.0, 41.0, 28.0, 26.0, 17.0, 21.0, 13.0, 12.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021991729736328125, -0.002132803201675415, -0.0020664334297180176, -0.00200006365776062, -0.0019336938858032227, -0.0018673241138458252, -0.0018009543418884277, -0.0017345845699310303, -0.0016682147979736328, -0.0016018450260162354, -0.0015354752540588379, -0.0014691054821014404, -0.001402735710144043, -0.0013363659381866455, -0.001269996166229248, -0.0012036263942718506, -0.0011372566223144531, -0.0010708868503570557, -0.0010045170783996582, -0.0009381473064422607, -0.0008717775344848633, -0.0008054077625274658, -0.0007390379905700684, -0.0006726682186126709, -0.0006062984466552734, -0.000539928674697876, -0.0004735589027404785, -0.00040718913078308105, -0.0003408193588256836, -0.00027444958686828613, -0.00020807981491088867, -0.0001417100429534912, -7.534027099609375e-05, -8.970499038696289e-06, 5.739927291870117e-05, 0.00012376904487609863, 0.0001901388168334961, 0.00025650858879089355, 0.000322878360748291, 0.0003892481327056885, 0.00045561790466308594, 0.0005219876766204834, 0.0005883574485778809, 0.0006547272205352783, 0.0007210969924926758, 0.0007874667644500732, 0.0008538365364074707, 0.0009202063083648682, 0.0009865760803222656, 0.001052945852279663, 0.0011193156242370605, 0.001185685396194458, 0.0012520551681518555, 0.001318424940109253, 0.0013847947120666504, 0.0014511644840240479, 0.0015175342559814453, 0.0015839040279388428, 0.0016502737998962402, 0.0017166435718536377, 0.0017830133438110352, 0.0018493831157684326, 0.00191575288772583, 0.0019821226596832275, 0.002048492431640625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 12.0, 23.0, 30.0, 42.0, 47.0, 75.0, 104.0, 176.0, 278.0, 559.0, 6904.0, 1037004.0, 2080.0, 475.0, 244.0, 145.0, 83.0, 69.0, 50.0, 39.0, 33.0, 22.0, 12.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04803466796875, -0.04655170440673828, -0.04506874084472656, -0.043585777282714844, -0.042102813720703125, -0.040619850158691406, -0.03913688659667969, -0.03765392303466797, -0.03617095947265625, -0.03468799591064453, -0.03320503234863281, -0.031722068786621094, -0.030239105224609375, -0.028756141662597656, -0.027273178100585938, -0.02579021453857422, -0.0243072509765625, -0.02282428741455078, -0.021341323852539062, -0.019858360290527344, -0.018375396728515625, -0.016892433166503906, -0.015409469604492188, -0.013926506042480469, -0.01244354248046875, -0.010960578918457031, -0.009477615356445312, -0.007994651794433594, -0.006511688232421875, -0.005028724670410156, -0.0035457611083984375, -0.0020627975463867188, -0.000579833984375, 0.0009031295776367188, 0.0023860931396484375, 0.0038690567016601562, 0.005352020263671875, 0.006834983825683594, 0.008317947387695312, 0.009800910949707031, 0.01128387451171875, 0.012766838073730469, 0.014249801635742188, 0.015732765197753906, 0.017215728759765625, 0.018698692321777344, 0.020181655883789062, 0.02166461944580078, 0.0231475830078125, 0.02463054656982422, 0.026113510131835938, 0.027596473693847656, 0.029079437255859375, 0.030562400817871094, 0.03204536437988281, 0.03352832794189453, 0.03501129150390625, 0.03649425506591797, 0.03797721862792969, 0.039460182189941406, 0.040943145751953125, 0.042426109313964844, 0.04390907287597656, 0.04539203643798828, 0.046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 54.0, 275.0, 412.0, 216.0, 32.0, 12.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0056892018765211105, -0.005578573327511549, -0.0054679447785019875, -0.005357316695153713, -0.005246688146144152, -0.00513605959713459, -0.005025431048125029, -0.004914802499115467, -0.004804174415767193, -0.004693545866757631, -0.00458291731774807, -0.0044722892343997955, -0.004361660685390234, -0.0042510321363806725, -0.004140403587371111, -0.004029775038361549, -0.003919146955013275, -0.0038085184060037136, -0.0036978900898247957, -0.003587261540815234, -0.0034766332246363163, -0.0033660046756267548, -0.0032553761266171932, -0.0031447478104382753, -0.00303411902859807, -0.0029234904795885086, -0.0028128621634095907, -0.002702233614400029, -0.0025916052982211113, -0.0024809767492115498, -0.0023703482002019882, -0.0022597198840230703, -0.0021490915678441525, -0.002038463018834591, -0.001927834702655673, -0.0018172061536461115, -0.0017065778374671936, -0.001595949288457632, -0.0014853208558633924, -0.0013746924232691526, -0.001264063874259591, -0.0011534354416653514, -0.0010428070090711117, -0.000932178518269211, -0.0008215500856749713, -0.0007109216530807316, -0.000600293162278831, -0.0004896647296845913, -0.0003790362970903516, -0.00026840786449611187, -0.0001577794027980417, -4.715094109997153e-05, 6.347749149426818e-05, 0.0001741059240885079, 0.0002847344148904085, 0.00039536284748464823, 0.0005059912800788879, 0.0006166197126731277, 0.0007272481452673674, 0.000837876636069268, 0.0009485050686635077, 0.0010591335594654083, 0.001169761992059648, 0.0012803904246538877, 0.0013910188572481275]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 3.0, 4.0, 8.0, 4.0, 7.0, 6.0, 12.0, 16.0, 18.0, 9.0, 15.0, 14.0, 17.0, 15.0, 23.0, 21.0, 24.0, 30.0, 28.0, 20.0, 32.0, 40.0, 40.0, 29.0, 40.0, 43.0, 46.0, 44.0, 39.0, 36.0, 29.0, 40.0, 21.0, 32.0, 35.0, 25.0, 21.0, 14.0, 21.0, 13.0, 9.0, 13.0, 6.0, 6.0, 8.0, 8.0, 1.0, 4.0, 4.0, 9.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.0008816123008728027, -0.0008549988269805908, -0.0008283853530883789, -0.000801771879196167, -0.0007751584053039551, -0.0007485449314117432, -0.0007219314575195312, -0.0006953179836273193, -0.0006687045097351074, -0.0006420910358428955, -0.0006154775619506836, -0.0005888640880584717, -0.0005622506141662598, -0.0005356371402740479, -0.0005090236663818359, -0.000482410192489624, -0.0004557967185974121, -0.0004291832447052002, -0.0004025697708129883, -0.00037595629692077637, -0.00034934282302856445, -0.00032272934913635254, -0.0002961158752441406, -0.0002695024013519287, -0.0002428889274597168, -0.00021627545356750488, -0.00018966197967529297, -0.00016304850578308105, -0.00013643503189086914, -0.00010982155799865723, -8.320808410644531e-05, -5.65946102142334e-05, -2.9981136322021484e-05, -3.3676624298095703e-06, 2.3245811462402344e-05, 4.985928535461426e-05, 7.647275924682617e-05, 0.00010308623313903809, 0.00012969970703125, 0.00015631318092346191, 0.00018292665481567383, 0.00020954012870788574, 0.00023615360260009766, 0.00026276707649230957, 0.0002893805503845215, 0.0003159940242767334, 0.0003426074981689453, 0.0003692209720611572, 0.00039583444595336914, 0.00042244791984558105, 0.00044906139373779297, 0.0004756748676300049, 0.0005022883415222168, 0.0005289018154144287, 0.0005555152893066406, 0.0005821287631988525, 0.0006087422370910645, 0.0006353557109832764, 0.0006619691848754883, 0.0006885826587677002, 0.0007151961326599121, 0.000741809606552124, 0.0007684230804443359, 0.0007950365543365479, 0.0008216500282287598]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 0.0, 6.0, 4.0, 10.0, 11.0, 16.0, 19.0, 29.0, 26.0, 36.0, 36.0, 32.0, 47.0, 49.0, 49.0, 53.0, 58.0, 52.0, 50.0, 47.0, 48.0, 47.0, 42.0, 36.0, 35.0, 31.0, 30.0, 24.0, 22.0, 21.0, 9.0, 10.0, 6.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.398681640625, -5.19580078125, -4.992919921875, -4.7900390625, -4.587158203125, -4.38427734375, -4.181396484375, -3.978515625, -3.775634765625, -3.57275390625, -3.369873046875, -3.1669921875, -2.964111328125, -2.76123046875, -2.558349609375, -2.35546875, -2.152587890625, -1.94970703125, -1.746826171875, -1.5439453125, -1.341064453125, -1.13818359375, -0.935302734375, -0.732421875, -0.529541015625, -0.32666015625, -0.123779296875, 0.0791015625, 0.281982421875, 0.48486328125, 0.687744140625, 0.890625, 1.093505859375, 1.29638671875, 1.499267578125, 1.7021484375, 1.905029296875, 2.10791015625, 2.310791015625, 2.513671875, 2.716552734375, 2.91943359375, 3.122314453125, 3.3251953125, 3.528076171875, 3.73095703125, 3.933837890625, 4.13671875, 4.339599609375, 4.54248046875, 4.745361328125, 4.9482421875, 5.151123046875, 5.35400390625, 5.556884765625, 5.759765625, 5.962646484375, 6.16552734375, 6.368408203125, 6.5712890625, 6.774169921875, 6.97705078125, 7.179931640625, 7.3828125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 11.0, 4.0, 15.0, 26.0, 24.0, 34.0, 56.0, 75.0, 135.0, 175.0, 298.0, 464.0, 668.0, 1178.0, 2165.0, 4293.0, 9651.0, 27111.0, 109613.0, 533540.0, 274326.0, 54937.0, 16114.0, 6384.0, 3109.0, 1641.0, 927.0, 553.0, 357.0, 204.0, 143.0, 108.0, 68.0, 42.0, 32.0, 22.0, 17.0, 11.0, 9.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.708984375, -3.575408935546875, -3.44183349609375, -3.308258056640625, -3.1746826171875, -3.041107177734375, -2.90753173828125, -2.773956298828125, -2.640380859375, -2.506805419921875, -2.37322998046875, -2.239654541015625, -2.1060791015625, -1.972503662109375, -1.83892822265625, -1.705352783203125, -1.57177734375, -1.438201904296875, -1.30462646484375, -1.171051025390625, -1.0374755859375, -0.903900146484375, -0.77032470703125, -0.636749267578125, -0.503173828125, -0.369598388671875, -0.23602294921875, -0.102447509765625, 0.0311279296875, 0.164703369140625, 0.29827880859375, 0.431854248046875, 0.5654296875, 0.699005126953125, 0.83258056640625, 0.966156005859375, 1.0997314453125, 1.233306884765625, 1.36688232421875, 1.500457763671875, 1.634033203125, 1.767608642578125, 1.90118408203125, 2.034759521484375, 2.1683349609375, 2.301910400390625, 2.43548583984375, 2.569061279296875, 2.70263671875, 2.836212158203125, 2.96978759765625, 3.103363037109375, 3.2369384765625, 3.370513916015625, 3.50408935546875, 3.637664794921875, 3.771240234375, 3.904815673828125, 4.03839111328125, 4.171966552734375, 4.3055419921875, 4.439117431640625, 4.57269287109375, 4.706268310546875, 4.83984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 9.0, 8.0, 8.0, 10.0, 10.0, 13.0, 17.0, 18.0, 20.0, 22.0, 32.0, 31.0, 24.0, 31.0, 30.0, 39.0, 40.0, 36.0, 54.0, 328.0, 1726.0, 86.0, 54.0, 34.0, 45.0, 36.0, 40.0, 18.0, 26.0, 19.0, 25.0, 20.0, 22.0, 13.0, 19.0, 8.0, 13.0, 16.0, 12.0, 10.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7734375, -14.2667236328125, -13.760009765625, -13.2532958984375, -12.74658203125, -12.2398681640625, -11.733154296875, -11.2264404296875, -10.7197265625, -10.2130126953125, -9.706298828125, -9.1995849609375, -8.69287109375, -8.1861572265625, -7.679443359375, -7.1727294921875, -6.666015625, -6.1593017578125, -5.652587890625, -5.1458740234375, -4.63916015625, -4.1324462890625, -3.625732421875, -3.1190185546875, -2.6123046875, -2.1055908203125, -1.598876953125, -1.0921630859375, -0.58544921875, -0.0787353515625, 0.427978515625, 0.9346923828125, 1.44140625, 1.9481201171875, 2.454833984375, 2.9615478515625, 3.46826171875, 3.9749755859375, 4.481689453125, 4.9884033203125, 5.4951171875, 6.0018310546875, 6.508544921875, 7.0152587890625, 7.52197265625, 8.0286865234375, 8.535400390625, 9.0421142578125, 9.548828125, 10.0555419921875, 10.562255859375, 11.0689697265625, 11.57568359375, 12.0823974609375, 12.589111328125, 13.0958251953125, 13.6025390625, 14.1092529296875, 14.615966796875, 15.1226806640625, 15.62939453125, 16.1361083984375, 16.642822265625, 17.1495361328125, 17.65625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 3.0, 14.0, 6.0, 13.0, 17.0, 12.0, 10.0, 15.0, 15.0, 28.0, 20.0, 24.0, 31.0, 37.0, 66.0, 107.0, 154.0, 234.0, 353.0, 990.0, 9216.0, 3054018.0, 76953.0, 1926.0, 558.0, 256.0, 161.0, 108.0, 88.0, 41.0, 36.0, 42.0, 27.0, 21.0, 20.0, 17.0, 9.0, 12.0, 10.0, 5.0, 8.0, 9.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-29.171875, -28.33154296875, -27.4912109375, -26.65087890625, -25.810546875, -24.97021484375, -24.1298828125, -23.28955078125, -22.44921875, -21.60888671875, -20.7685546875, -19.92822265625, -19.087890625, -18.24755859375, -17.4072265625, -16.56689453125, -15.7265625, -14.88623046875, -14.0458984375, -13.20556640625, -12.365234375, -11.52490234375, -10.6845703125, -9.84423828125, -9.00390625, -8.16357421875, -7.3232421875, -6.48291015625, -5.642578125, -4.80224609375, -3.9619140625, -3.12158203125, -2.28125, -1.44091796875, -0.6005859375, 0.23974609375, 1.080078125, 1.92041015625, 2.7607421875, 3.60107421875, 4.44140625, 5.28173828125, 6.1220703125, 6.96240234375, 7.802734375, 8.64306640625, 9.4833984375, 10.32373046875, 11.1640625, 12.00439453125, 12.8447265625, 13.68505859375, 14.525390625, 15.36572265625, 16.2060546875, 17.04638671875, 17.88671875, 18.72705078125, 19.5673828125, 20.40771484375, 21.248046875, 22.08837890625, 22.9287109375, 23.76904296875, 24.609375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 11.0, 200.0, 581.0, 209.0, 17.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.26148986816406, -94.39361572265625, -92.5257339477539, -90.6578598022461, -88.78998565673828, -86.92210388183594, -85.05422973632812, -83.18635559082031, -81.3184814453125, -79.45060729980469, -77.58272552490234, -75.71485137939453, -73.84697723388672, -71.97909545898438, -70.11122131347656, -68.24334716796875, -66.3754653930664, -64.5075912475586, -62.639713287353516, -60.77183532714844, -58.903961181640625, -57.03608322143555, -55.16820526123047, -53.300331115722656, -51.43245315551758, -49.5645751953125, -47.69670104980469, -45.82882308959961, -43.96094512939453, -42.09307098388672, -40.22519302368164, -38.35731506347656, -36.489437103271484, -34.621559143066406, -32.753684997558594, -30.885807037353516, -29.01793098449707, -27.150054931640625, -25.282176971435547, -23.4143009185791, -21.546424865722656, -19.67854881286621, -17.810672760009766, -15.942794799804688, -14.074918746948242, -12.207042694091797, -10.339165687561035, -8.471288681030273, -6.603412628173828, -4.735536098480225, -2.867659568786621, -0.9997830390930176, 0.8680934906005859, 2.7359695434570312, 4.603846549987793, 6.471723556518555, 8.339599609375, 10.207475662231445, 12.075352668762207, 13.943229675292969, 15.811105728149414, 17.67898178100586, 19.546859741210938, 21.414735794067383, 23.282611846923828]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 9.0, 4.0, 7.0, 10.0, 12.0, 10.0, 6.0, 24.0, 12.0, 22.0, 21.0, 25.0, 28.0, 33.0, 39.0, 37.0, 31.0, 44.0, 38.0, 45.0, 44.0, 47.0, 33.0, 42.0, 32.0, 38.0, 34.0, 38.0, 29.0, 30.0, 17.0, 25.0, 19.0, 29.0, 18.0, 8.0, 8.0, 9.0, 10.0, 4.0, 11.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.57497787475586, -45.91034698486328, -44.24571990966797, -42.58108901977539, -40.91645812988281, -39.2518310546875, -37.58720016479492, -35.922569274902344, -34.25794219970703, -32.59331130981445, -30.928682327270508, -29.264053344726562, -27.599422454833984, -25.93479347229004, -24.270164489746094, -22.605533599853516, -20.940902709960938, -19.276273727416992, -17.611642837524414, -15.947013854980469, -14.282383918762207, -12.617753982543945, -10.953125, -9.288495063781738, -7.623865127563477, -5.959235191345215, -4.294605731964111, -2.629976272583008, -0.9653463363647461, 0.6992835998535156, 2.363912582397461, 4.028542518615723, 5.693168640136719, 7.3577985763549805, 9.022428512573242, 10.687057495117188, 12.35168743133545, 14.016317367553711, 15.680946350097656, 17.345577239990234, 19.01020622253418, 20.674835205078125, 22.339466094970703, 24.00409507751465, 25.668724060058594, 27.333354949951172, 28.997983932495117, 30.662612915039062, 32.32724380493164, 33.99187469482422, 35.65650177001953, 37.32113265991211, 38.98576354980469, 40.650390625, 42.31502151489258, 43.979652404785156, 45.64427947998047, 47.30891036987305, 48.97353744506836, 50.63816833496094, 52.302799224853516, 53.967430114746094, 55.632057189941406, 57.296688079833984, 58.96131896972656]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 5.0, 9.0, 17.0, 13.0, 26.0, 25.0, 33.0, 37.0, 34.0, 35.0, 52.0, 43.0, 51.0, 63.0, 47.0, 55.0, 53.0, 33.0, 45.0, 62.0, 37.0, 27.0, 35.0, 31.0, 31.0, 25.0, 17.0, 20.0, 9.0, 7.0, 6.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.53131103515625, -5.3282470703125, -5.12518310546875, -4.922119140625, -4.71905517578125, -4.5159912109375, -4.31292724609375, -4.10986328125, -3.90679931640625, -3.7037353515625, -3.50067138671875, -3.297607421875, -3.09454345703125, -2.8914794921875, -2.68841552734375, -2.4853515625, -2.28228759765625, -2.0792236328125, -1.87615966796875, -1.673095703125, -1.47003173828125, -1.2669677734375, -1.06390380859375, -0.86083984375, -0.65777587890625, -0.4547119140625, -0.25164794921875, -0.048583984375, 0.15447998046875, 0.3575439453125, 0.56060791015625, 0.763671875, 0.96673583984375, 1.1697998046875, 1.37286376953125, 1.575927734375, 1.77899169921875, 1.9820556640625, 2.18511962890625, 2.38818359375, 2.59124755859375, 2.7943115234375, 2.99737548828125, 3.200439453125, 3.40350341796875, 3.6065673828125, 3.80963134765625, 4.0126953125, 4.21575927734375, 4.4188232421875, 4.62188720703125, 4.824951171875, 5.02801513671875, 5.2310791015625, 5.43414306640625, 5.63720703125, 5.84027099609375, 6.0433349609375, 6.24639892578125, 6.449462890625, 6.65252685546875, 6.8555908203125, 7.05865478515625, 7.26171875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 6.0, 7.0, 5.0, 7.0, 24.0, 16.0, 31.0, 45.0, 68.0, 101.0, 209.0, 449.0, 1090.0, 3314.0, 11765.0, 52944.0, 373463.0, 2314531.0, 1259168.0, 141137.0, 25830.0, 6537.0, 2049.0, 742.0, 300.0, 160.0, 86.0, 52.0, 33.0, 25.0, 16.0, 20.0, 8.0, 6.0, 6.0, 8.0, 6.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7384033203125, -10.351806640625, -9.9652099609375, -9.57861328125, -9.1920166015625, -8.805419921875, -8.4188232421875, -8.0322265625, -7.6456298828125, -7.259033203125, -6.8724365234375, -6.48583984375, -6.0992431640625, -5.712646484375, -5.3260498046875, -4.939453125, -4.5528564453125, -4.166259765625, -3.7796630859375, -3.39306640625, -3.0064697265625, -2.619873046875, -2.2332763671875, -1.8466796875, -1.4600830078125, -1.073486328125, -0.6868896484375, -0.30029296875, 0.0863037109375, 0.472900390625, 0.8594970703125, 1.24609375, 1.6326904296875, 2.019287109375, 2.4058837890625, 2.79248046875, 3.1790771484375, 3.565673828125, 3.9522705078125, 4.3388671875, 4.7254638671875, 5.112060546875, 5.4986572265625, 5.88525390625, 6.2718505859375, 6.658447265625, 7.0450439453125, 7.431640625, 7.8182373046875, 8.204833984375, 8.5914306640625, 8.97802734375, 9.3646240234375, 9.751220703125, 10.1378173828125, 10.5244140625, 10.9110107421875, 11.297607421875, 11.6842041015625, 12.07080078125, 12.4573974609375, 12.843994140625, 13.2305908203125, 13.6171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 7.0, 7.0, 16.0, 17.0, 14.0, 23.0, 21.0, 37.0, 42.0, 70.0, 72.0, 103.0, 114.0, 140.0, 193.0, 220.0, 300.0, 358.0, 384.0, 342.0, 305.0, 252.0, 214.0, 160.0, 152.0, 116.0, 85.0, 63.0, 54.0, 29.0, 30.0, 29.0, 21.0, 10.0, 14.0, 14.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.21875, -10.8651123046875, -10.511474609375, -10.1578369140625, -9.80419921875, -9.4505615234375, -9.096923828125, -8.7432861328125, -8.3896484375, -8.0360107421875, -7.682373046875, -7.3287353515625, -6.97509765625, -6.6214599609375, -6.267822265625, -5.9141845703125, -5.560546875, -5.2069091796875, -4.853271484375, -4.4996337890625, -4.14599609375, -3.7923583984375, -3.438720703125, -3.0850830078125, -2.7314453125, -2.3778076171875, -2.024169921875, -1.6705322265625, -1.31689453125, -0.9632568359375, -0.609619140625, -0.2559814453125, 0.09765625, 0.4512939453125, 0.804931640625, 1.1585693359375, 1.51220703125, 1.8658447265625, 2.219482421875, 2.5731201171875, 2.9267578125, 3.2803955078125, 3.634033203125, 3.9876708984375, 4.34130859375, 4.6949462890625, 5.048583984375, 5.4022216796875, 5.755859375, 6.1094970703125, 6.463134765625, 6.8167724609375, 7.17041015625, 7.5240478515625, 7.877685546875, 8.2313232421875, 8.5849609375, 8.9385986328125, 9.292236328125, 9.6458740234375, 9.99951171875, 10.3531494140625, 10.706787109375, 11.0604248046875, 11.4140625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 6.0, 7.0, 11.0, 12.0, 19.0, 29.0, 45.0, 57.0, 69.0, 101.0, 164.0, 281.0, 711.0, 3474.0, 80223.0, 3784969.0, 314229.0, 7927.0, 1038.0, 327.0, 176.0, 110.0, 72.0, 52.0, 39.0, 35.0, 17.0, 21.0, 18.0, 10.0, 6.0, 7.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.96875, -42.37890625, -40.7890625, -39.19921875, -37.609375, -36.01953125, -34.4296875, -32.83984375, -31.25, -29.66015625, -28.0703125, -26.48046875, -24.890625, -23.30078125, -21.7109375, -20.12109375, -18.53125, -16.94140625, -15.3515625, -13.76171875, -12.171875, -10.58203125, -8.9921875, -7.40234375, -5.8125, -4.22265625, -2.6328125, -1.04296875, 0.546875, 2.13671875, 3.7265625, 5.31640625, 6.90625, 8.49609375, 10.0859375, 11.67578125, 13.265625, 14.85546875, 16.4453125, 18.03515625, 19.625, 21.21484375, 22.8046875, 24.39453125, 25.984375, 27.57421875, 29.1640625, 30.75390625, 32.34375, 33.93359375, 35.5234375, 37.11328125, 38.703125, 40.29296875, 41.8828125, 43.47265625, 45.0625, 46.65234375, 48.2421875, 49.83203125, 51.421875, 53.01171875, 54.6015625, 56.19140625, 57.78125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [25.0, 103.0, 294.0, 350.0, 188.0, 50.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.158655166625977, -13.8875093460083, -7.616363525390625, -1.3452167510986328, 4.925928115844727, 11.197072982788086, 17.46822166442871, 23.73936653137207, 30.01051139831543, 36.28165817260742, 42.55280303955078, 48.823951721191406, 55.0950927734375, 61.366241455078125, 67.63739013671875, 73.90853118896484, 80.17967987060547, 86.4508285522461, 92.72196960449219, 98.99311828613281, 105.26426696777344, 111.53540802001953, 117.80655670166016, 124.07769775390625, 130.34884643554688, 136.6199951171875, 142.89114379882812, 149.16229248046875, 155.4334259033203, 161.70457458496094, 167.97572326660156, 174.2468719482422, 180.51800537109375, 186.78915405273438, 193.060302734375, 199.33145141601562, 205.6025848388672, 211.8737335205078, 218.14488220214844, 224.41603088378906, 230.68716430664062, 236.95831298828125, 243.22946166992188, 249.5006103515625, 255.77174377441406, 262.04290771484375, 268.31402587890625, 274.5851745605469, 280.8563232421875, 287.1274719238281, 293.39862060546875, 299.6697692871094, 305.94091796875, 312.2120361328125, 318.48321533203125, 324.75433349609375, 331.0255126953125, 337.2966613769531, 343.56781005859375, 349.8389587402344, 356.110107421875, 362.3812255859375, 368.65240478515625, 374.92352294921875, 381.1946716308594]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 6.0, 7.0, 9.0, 12.0, 14.0, 15.0, 12.0, 18.0, 26.0, 25.0, 26.0, 25.0, 21.0, 26.0, 32.0, 34.0, 35.0, 35.0, 38.0, 36.0, 36.0, 23.0, 34.0, 42.0, 41.0, 40.0, 28.0, 36.0, 28.0, 27.0, 17.0, 22.0, 22.0, 15.0, 18.0, 17.0, 18.0, 20.0, 12.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.127525329589844, -39.811710357666016, -38.49589538574219, -37.18008041381836, -35.86426544189453, -34.54844665527344, -33.232635498046875, -31.91681671142578, -30.601001739501953, -29.285186767578125, -27.969371795654297, -26.65355682373047, -25.337739944458008, -24.02192497253418, -22.70611000061035, -21.39029312133789, -20.074480056762695, -18.758665084838867, -17.44285011291504, -16.127033233642578, -14.81121826171875, -13.495403289794922, -12.179588317871094, -10.86377239227295, -9.547957420349121, -8.232142448425293, -6.916326522827148, -5.60051155090332, -4.284696102142334, -2.9688806533813477, -1.6530656814575195, -0.337249755859375, 0.9785652160644531, 2.2943806648254395, 3.6101958751678467, 4.926011085510254, 6.24182653427124, 7.557641983032227, 8.873456954956055, 10.1892728805542, 11.505087852478027, 12.820902824401855, 14.13671875, 15.452533721923828, 16.768348693847656, 18.084163665771484, 19.399978637695312, 20.715795516967773, 22.0316104888916, 23.34742546081543, 24.663240432739258, 25.97905731201172, 27.294872283935547, 28.610687255859375, 29.926502227783203, 31.24231719970703, 32.55813217163086, 33.87394714355469, 35.189762115478516, 36.505577087402344, 37.82139205932617, 39.13720703125, 40.453025817871094, 41.76884078979492, 43.08465576171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 13.0, 11.0, 23.0, 27.0, 33.0, 39.0, 46.0, 35.0, 46.0, 45.0, 50.0, 46.0, 54.0, 48.0, 52.0, 58.0, 42.0, 39.0, 40.0, 40.0, 29.0, 35.0, 28.0, 21.0, 15.0, 10.0, 20.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.72491455078125, -5.5201416015625, -5.31536865234375, -5.110595703125, -4.90582275390625, -4.7010498046875, -4.49627685546875, -4.29150390625, -4.08673095703125, -3.8819580078125, -3.67718505859375, -3.472412109375, -3.26763916015625, -3.0628662109375, -2.85809326171875, -2.6533203125, -2.44854736328125, -2.2437744140625, -2.03900146484375, -1.834228515625, -1.62945556640625, -1.4246826171875, -1.21990966796875, -1.01513671875, -0.81036376953125, -0.6055908203125, -0.40081787109375, -0.196044921875, 0.00872802734375, 0.2135009765625, 0.41827392578125, 0.623046875, 0.82781982421875, 1.0325927734375, 1.23736572265625, 1.442138671875, 1.64691162109375, 1.8516845703125, 2.05645751953125, 2.26123046875, 2.46600341796875, 2.6707763671875, 2.87554931640625, 3.080322265625, 3.28509521484375, 3.4898681640625, 3.69464111328125, 3.8994140625, 4.10418701171875, 4.3089599609375, 4.51373291015625, 4.718505859375, 4.92327880859375, 5.1280517578125, 5.33282470703125, 5.53759765625, 5.74237060546875, 5.9471435546875, 6.15191650390625, 6.356689453125, 6.56146240234375, 6.7662353515625, 6.97100830078125, 7.17578125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 12.0, 17.0, 18.0, 29.0, 45.0, 89.0, 95.0, 176.0, 237.0, 319.0, 457.0, 672.0, 962.0, 1387.0, 1962.0, 2792.0, 4023.0, 5742.0, 8281.0, 11973.0, 17406.0, 26136.0, 40403.0, 64095.0, 109601.0, 197621.0, 220800.0, 125596.0, 72522.0, 44546.0, 28792.0, 19338.0, 12896.0, 8879.0, 6196.0, 4345.0, 3045.0, 2126.0, 1524.0, 1027.0, 747.0, 507.0, 352.0, 254.0, 157.0, 123.0, 80.0, 47.0, 36.0, 18.0, 25.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.68701171875, -0.665618896484375, -0.64422607421875, -0.622833251953125, -0.6014404296875, -0.580047607421875, -0.55865478515625, -0.537261962890625, -0.515869140625, -0.494476318359375, -0.47308349609375, -0.451690673828125, -0.4302978515625, -0.408905029296875, -0.38751220703125, -0.366119384765625, -0.3447265625, -0.323333740234375, -0.30194091796875, -0.280548095703125, -0.2591552734375, -0.237762451171875, -0.21636962890625, -0.194976806640625, -0.173583984375, -0.152191162109375, -0.13079833984375, -0.109405517578125, -0.0880126953125, -0.066619873046875, -0.04522705078125, -0.023834228515625, -0.00244140625, 0.018951416015625, 0.04034423828125, 0.061737060546875, 0.0831298828125, 0.104522705078125, 0.12591552734375, 0.147308349609375, 0.168701171875, 0.190093994140625, 0.21148681640625, 0.232879638671875, 0.2542724609375, 0.275665283203125, 0.29705810546875, 0.318450927734375, 0.33984375, 0.361236572265625, 0.38262939453125, 0.404022216796875, 0.4254150390625, 0.446807861328125, 0.46820068359375, 0.489593505859375, 0.510986328125, 0.532379150390625, 0.55377197265625, 0.575164794921875, 0.5965576171875, 0.617950439453125, 0.63934326171875, 0.660736083984375, 0.68212890625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 12.0, 14.0, 15.0, 19.0, 17.0, 26.0, 29.0, 28.0, 28.0, 29.0, 38.0, 49.0, 48.0, 39.0, 48.0, 37.0, 1055.0, 30.0, 43.0, 28.0, 32.0, 32.0, 27.0, 31.0, 27.0, 24.0, 24.0, 35.0, 14.0, 16.0, 15.0, 12.0, 13.0, 13.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.45703125, -3.353363037109375, -3.24969482421875, -3.146026611328125, -3.0423583984375, -2.938690185546875, -2.83502197265625, -2.731353759765625, -2.627685546875, -2.524017333984375, -2.42034912109375, -2.316680908203125, -2.2130126953125, -2.109344482421875, -2.00567626953125, -1.902008056640625, -1.79833984375, -1.694671630859375, -1.59100341796875, -1.487335205078125, -1.3836669921875, -1.279998779296875, -1.17633056640625, -1.072662353515625, -0.968994140625, -0.865325927734375, -0.76165771484375, -0.657989501953125, -0.5543212890625, -0.450653076171875, -0.34698486328125, -0.243316650390625, -0.1396484375, -0.035980224609375, 0.06768798828125, 0.171356201171875, 0.2750244140625, 0.378692626953125, 0.48236083984375, 0.586029052734375, 0.689697265625, 0.793365478515625, 0.89703369140625, 1.000701904296875, 1.1043701171875, 1.208038330078125, 1.31170654296875, 1.415374755859375, 1.51904296875, 1.622711181640625, 1.72637939453125, 1.830047607421875, 1.9337158203125, 2.037384033203125, 2.14105224609375, 2.244720458984375, 2.348388671875, 2.452056884765625, 2.55572509765625, 2.659393310546875, 2.7630615234375, 2.866729736328125, 2.97039794921875, 3.074066162109375, 3.177734375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 13.0, 14.0, 23.0, 39.0, 62.0, 94.0, 130.0, 194.0, 260.0, 390.0, 491.0, 707.0, 1014.0, 1453.0, 2035.0, 2900.0, 4345.0, 6385.0, 9559.0, 14029.0, 21573.0, 33255.0, 53647.0, 90944.0, 167073.0, 1289496.0, 161436.0, 88231.0, 51760.0, 32190.0, 20419.0, 13651.0, 9057.0, 6153.0, 4246.0, 2898.0, 2003.0, 1419.0, 1036.0, 712.0, 528.0, 407.0, 248.0, 190.0, 137.0, 101.0, 64.0, 43.0, 26.0, 17.0, 12.0, 10.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59375, -0.5748825073242188, -0.5560150146484375, -0.5371475219726562, -0.518280029296875, -0.49941253662109375, -0.4805450439453125, -0.46167755126953125, -0.44281005859375, -0.42394256591796875, -0.4050750732421875, -0.38620758056640625, -0.367340087890625, -0.34847259521484375, -0.3296051025390625, -0.31073760986328125, -0.2918701171875, -0.27300262451171875, -0.2541351318359375, -0.23526763916015625, -0.216400146484375, -0.19753265380859375, -0.1786651611328125, -0.15979766845703125, -0.14093017578125, -0.12206268310546875, -0.1031951904296875, -0.08432769775390625, -0.065460205078125, -0.04659271240234375, -0.0277252197265625, -0.00885772705078125, 0.010009765625, 0.02887725830078125, 0.0477447509765625, 0.06661224365234375, 0.085479736328125, 0.10434722900390625, 0.1232147216796875, 0.14208221435546875, 0.16094970703125, 0.17981719970703125, 0.1986846923828125, 0.21755218505859375, 0.236419677734375, 0.25528717041015625, 0.2741546630859375, 0.29302215576171875, 0.3118896484375, 0.33075714111328125, 0.3496246337890625, 0.36849212646484375, 0.387359619140625, 0.40622711181640625, 0.4250946044921875, 0.44396209716796875, 0.46282958984375, 0.48169708251953125, 0.5005645751953125, 0.5194320678710938, 0.538299560546875, 0.5571670532226562, 0.5760345458984375, 0.5949020385742188, 0.61376953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 10.0, 12.0, 14.0, 13.0, 30.0, 40.0, 43.0, 57.0, 69.0, 94.0, 88.0, 90.0, 101.0, 73.0, 56.0, 50.0, 31.0, 32.0, 17.0, 19.0, 5.0, 3.0, 11.0, 3.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0026950836181640625, -0.0026199519634246826, -0.0025448203086853027, -0.002469688653945923, -0.002394556999206543, -0.002319425344467163, -0.002244293689727783, -0.0021691620349884033, -0.0020940303802490234, -0.0020188987255096436, -0.0019437670707702637, -0.0018686354160308838, -0.001793503761291504, -0.001718372106552124, -0.0016432404518127441, -0.0015681087970733643, -0.0014929771423339844, -0.0014178454875946045, -0.0013427138328552246, -0.0012675821781158447, -0.0011924505233764648, -0.001117318868637085, -0.001042187213897705, -0.0009670555591583252, -0.0008919239044189453, -0.0008167922496795654, -0.0007416605949401855, -0.0006665289402008057, -0.0005913972854614258, -0.0005162656307220459, -0.000441133975982666, -0.00036600232124328613, -0.00029087066650390625, -0.00021573901176452637, -0.00014060735702514648, -6.54757022857666e-05, 9.655952453613281e-06, 8.478760719299316e-05, 0.00015991926193237305, 0.00023505091667175293, 0.0003101825714111328, 0.0003853142261505127, 0.0004604458808898926, 0.0005355775356292725, 0.0006107091903686523, 0.0006858408451080322, 0.0007609724998474121, 0.000836104154586792, 0.0009112358093261719, 0.0009863674640655518, 0.0010614991188049316, 0.0011366307735443115, 0.0012117624282836914, 0.0012868940830230713, 0.0013620257377624512, 0.001437157392501831, 0.001512289047241211, 0.0015874207019805908, 0.0016625523567199707, 0.0017376840114593506, 0.0018128156661987305, 0.0018879473209381104, 0.0019630789756774902, 0.00203821063041687, 0.00211334228515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 7.0, 5.0, 14.0, 9.0, 11.0, 27.0, 32.0, 36.0, 56.0, 67.0, 81.0, 135.0, 199.0, 383.0, 925.0, 136856.0, 906883.0, 1587.0, 453.0, 263.0, 178.0, 93.0, 59.0, 48.0, 31.0, 31.0, 25.0, 13.0, 18.0, 6.0, 4.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0426025390625, -0.041234493255615234, -0.03986644744873047, -0.0384984016418457, -0.03713035583496094, -0.03576231002807617, -0.034394264221191406, -0.03302621841430664, -0.031658172607421875, -0.03029012680053711, -0.028922080993652344, -0.027554035186767578, -0.026185989379882812, -0.024817943572998047, -0.02344989776611328, -0.022081851959228516, -0.02071380615234375, -0.019345760345458984, -0.01797771453857422, -0.016609668731689453, -0.015241622924804688, -0.013873577117919922, -0.012505531311035156, -0.01113748550415039, -0.009769439697265625, -0.00840139389038086, -0.007033348083496094, -0.005665302276611328, -0.0042972564697265625, -0.002929210662841797, -0.0015611648559570312, -0.00019311904907226562, 0.0011749267578125, 0.0025429725646972656, 0.003911018371582031, 0.005279064178466797, 0.0066471099853515625, 0.008015155792236328, 0.009383201599121094, 0.01075124740600586, 0.012119293212890625, 0.01348733901977539, 0.014855384826660156, 0.016223430633544922, 0.017591476440429688, 0.018959522247314453, 0.02032756805419922, 0.021695613861083984, 0.02306365966796875, 0.024431705474853516, 0.02579975128173828, 0.027167797088623047, 0.028535842895507812, 0.029903888702392578, 0.031271934509277344, 0.03263998031616211, 0.034008026123046875, 0.03537607192993164, 0.036744117736816406, 0.03811216354370117, 0.03948020935058594, 0.0408482551574707, 0.04221630096435547, 0.043584346771240234, 0.044952392578125]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 14.0, 31.0, 71.0, 165.0, 281.0, 238.0, 131.0, 45.0, 20.0, 8.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036393117625266314, -0.0035615754313766956, -0.0034838393330574036, -0.003406103001907468, -0.003328366670757532, -0.0032506303396075964, -0.0031728942412883043, -0.0030951579101383686, -0.003017421578988433, -0.002939685247838497, -0.002861949149519205, -0.0027842128183692694, -0.0027064764872193336, -0.002628740156069398, -0.002551004057750106, -0.00247326772660017, -0.002395531628280878, -0.0023177952971309423, -0.0022400591988116503, -0.0021623228676617146, -0.002084586536511779, -0.002006850205361843, -0.001929114107042551, -0.0018513777758926153, -0.0017736414447426796, -0.0016959052300080657, -0.00161816889885813, -0.001540432684123516, -0.0014626963529735804, -0.0013849601382389665, -0.0013072239235043526, -0.0012294875923544168, -0.0011517511447891593, -0.0010740149300545454, -0.0009962785989046097, -0.0009185423841699958, -0.0008408060530200601, -0.0007630698382854462, -0.0006853335653431714, -0.0006075972924008965, -0.0005298610194586217, -0.00045212474651634693, -0.0003743884735740721, -0.00029665222973562777, -0.00021891595679335296, -0.00014117968385107815, -6.34434400126338e-05, 1.4292832929641008e-05, 9.202910587191582e-05, 0.00016976537881419063, 0.00024750165175646544, 0.0003252378955949098, 0.0004029741685371846, 0.0004807104414794594, 0.0005584466853179038, 0.0006361829582601786, 0.0007139192312024534, 0.0007916555041447282, 0.000869391777087003, 0.0009471280500292778, 0.0010248642647638917, 0.0011026005959138274, 0.0011803368106484413, 0.001258073141798377, 0.001335809356532991]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 6.0, 16.0, 15.0, 17.0, 18.0, 21.0, 19.0, 21.0, 24.0, 33.0, 38.0, 40.0, 37.0, 41.0, 35.0, 41.0, 47.0, 38.0, 35.0, 36.0, 40.0, 38.0, 54.0, 35.0, 24.0, 24.0, 35.0, 27.0, 21.0, 15.0, 13.0, 15.0, 14.0, 13.0, 12.0, 12.0, 4.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009309649467468262, -0.0008998150005936623, -0.0008686650544404984, -0.0008375151082873344, -0.0008063651621341705, -0.0007752152159810066, -0.0007440652698278427, -0.0007129153236746788, -0.0006817653775215149, -0.000650615431368351, -0.0006194654852151871, -0.0005883155390620232, -0.0005571655929088593, -0.0005260156467556953, -0.0004948657006025314, -0.0004637157544493675, -0.0004325658082962036, -0.0004014158621430397, -0.0003702659159898758, -0.0003391159698367119, -0.000307966023683548, -0.00027681607753038406, -0.00024566613137722015, -0.00021451618522405624, -0.00018336623907089233, -0.00015221629291772842, -0.00012106634676456451, -8.99164006114006e-05, -5.8766454458236694e-05, -2.7616508305072784e-05, 3.5334378480911255e-06, 3.4683384001255035e-05, 6.583333015441895e-05, 9.698327630758286e-05, 0.00012813322246074677, 0.00015928316861391068, 0.00019043311476707458, 0.0002215830609202385, 0.0002527330070734024, 0.0002838829532265663, 0.0003150328993797302, 0.00034618284553289413, 0.00037733279168605804, 0.00040848273783922195, 0.00043963268399238586, 0.0004707826301455498, 0.0005019325762987137, 0.0005330825224518776, 0.0005642324686050415, 0.0005953824147582054, 0.0006265323609113693, 0.0006576823070645332, 0.0006888322532176971, 0.000719982199370861, 0.000751132145524025, 0.0007822820916771889, 0.0008134320378303528, 0.0008445819839835167, 0.0008757319301366806, 0.0009068818762898445, 0.0009380318224430084, 0.0009691817685961723, 0.0010003317147493362, 0.0010314816609025002, 0.001062631607055664]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 8.0, 11.0, 13.0, 13.0, 11.0, 23.0, 27.0, 33.0, 39.0, 46.0, 35.0, 46.0, 45.0, 50.0, 46.0, 54.0, 48.0, 52.0, 58.0, 42.0, 39.0, 40.0, 40.0, 29.0, 35.0, 28.0, 21.0, 15.0, 10.0, 20.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.72491455078125, -5.5201416015625, -5.31536865234375, -5.110595703125, -4.90582275390625, -4.7010498046875, -4.49627685546875, -4.29150390625, -4.08673095703125, -3.8819580078125, -3.67718505859375, -3.472412109375, -3.26763916015625, -3.0628662109375, -2.85809326171875, -2.6533203125, -2.44854736328125, -2.2437744140625, -2.03900146484375, -1.834228515625, -1.62945556640625, -1.4246826171875, -1.21990966796875, -1.01513671875, -0.81036376953125, -0.6055908203125, -0.40081787109375, -0.196044921875, 0.00872802734375, 0.2135009765625, 0.41827392578125, 0.623046875, 0.82781982421875, 1.0325927734375, 1.23736572265625, 1.442138671875, 1.64691162109375, 1.8516845703125, 2.05645751953125, 2.26123046875, 2.46600341796875, 2.6707763671875, 2.87554931640625, 3.080322265625, 3.28509521484375, 3.4898681640625, 3.69464111328125, 3.8994140625, 4.10418701171875, 4.3089599609375, 4.51373291015625, 4.718505859375, 4.92327880859375, 5.1280517578125, 5.33282470703125, 5.53759765625, 5.74237060546875, 5.9471435546875, 6.15191650390625, 6.356689453125, 6.56146240234375, 6.7662353515625, 6.97100830078125, 7.17578125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 19.0, 15.0, 36.0, 56.0, 80.0, 124.0, 213.0, 282.0, 531.0, 918.0, 1491.0, 2644.0, 5021.0, 10163.0, 24080.0, 70052.0, 284377.0, 463154.0, 120588.0, 35597.0, 14349.0, 6693.0, 3498.0, 1820.0, 1060.0, 618.0, 401.0, 251.0, 170.0, 92.0, 77.0, 40.0, 19.0, 9.0, 9.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.734375, -3.60650634765625, -3.4786376953125, -3.35076904296875, -3.222900390625, -3.09503173828125, -2.9671630859375, -2.83929443359375, -2.71142578125, -2.58355712890625, -2.4556884765625, -2.32781982421875, -2.199951171875, -2.07208251953125, -1.9442138671875, -1.81634521484375, -1.6884765625, -1.56060791015625, -1.4327392578125, -1.30487060546875, -1.177001953125, -1.04913330078125, -0.9212646484375, -0.79339599609375, -0.66552734375, -0.53765869140625, -0.4097900390625, -0.28192138671875, -0.154052734375, -0.02618408203125, 0.1016845703125, 0.22955322265625, 0.357421875, 0.48529052734375, 0.6131591796875, 0.74102783203125, 0.868896484375, 0.99676513671875, 1.1246337890625, 1.25250244140625, 1.38037109375, 1.50823974609375, 1.6361083984375, 1.76397705078125, 1.891845703125, 2.01971435546875, 2.1475830078125, 2.27545166015625, 2.4033203125, 2.53118896484375, 2.6590576171875, 2.78692626953125, 2.914794921875, 3.04266357421875, 3.1705322265625, 3.29840087890625, 3.42626953125, 3.55413818359375, 3.6820068359375, 3.80987548828125, 3.937744140625, 4.06561279296875, 4.1934814453125, 4.32135009765625, 4.44921875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 0.0, 3.0, 1.0, 3.0, 9.0, 8.0, 13.0, 13.0, 7.0, 18.0, 22.0, 19.0, 29.0, 25.0, 31.0, 29.0, 38.0, 48.0, 33.0, 39.0, 70.0, 505.0, 1562.0, 83.0, 64.0, 40.0, 46.0, 39.0, 33.0, 22.0, 28.0, 26.0, 28.0, 13.0, 12.0, 18.0, 14.0, 13.0, 11.0, 13.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0], "bins": [-18.5625, -17.9638671875, -17.365234375, -16.7666015625, -16.16796875, -15.5693359375, -14.970703125, -14.3720703125, -13.7734375, -13.1748046875, -12.576171875, -11.9775390625, -11.37890625, -10.7802734375, -10.181640625, -9.5830078125, -8.984375, -8.3857421875, -7.787109375, -7.1884765625, -6.58984375, -5.9912109375, -5.392578125, -4.7939453125, -4.1953125, -3.5966796875, -2.998046875, -2.3994140625, -1.80078125, -1.2021484375, -0.603515625, -0.0048828125, 0.59375, 1.1923828125, 1.791015625, 2.3896484375, 2.98828125, 3.5869140625, 4.185546875, 4.7841796875, 5.3828125, 5.9814453125, 6.580078125, 7.1787109375, 7.77734375, 8.3759765625, 8.974609375, 9.5732421875, 10.171875, 10.7705078125, 11.369140625, 11.9677734375, 12.56640625, 13.1650390625, 13.763671875, 14.3623046875, 14.9609375, 15.5595703125, 16.158203125, 16.7568359375, 17.35546875, 17.9541015625, 18.552734375, 19.1513671875, 19.75]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 9.0, 15.0, 13.0, 12.0, 17.0, 16.0, 16.0, 27.0, 37.0, 31.0, 51.0, 73.0, 111.0, 158.0, 216.0, 480.0, 1277.0, 28245.0, 3097438.0, 15189.0, 1079.0, 415.0, 238.0, 152.0, 94.0, 51.0, 45.0, 40.0, 23.0, 23.0, 19.0, 16.0, 15.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.03125, -32.04345703125, -31.0556640625, -30.06787109375, -29.080078125, -28.09228515625, -27.1044921875, -26.11669921875, -25.12890625, -24.14111328125, -23.1533203125, -22.16552734375, -21.177734375, -20.18994140625, -19.2021484375, -18.21435546875, -17.2265625, -16.23876953125, -15.2509765625, -14.26318359375, -13.275390625, -12.28759765625, -11.2998046875, -10.31201171875, -9.32421875, -8.33642578125, -7.3486328125, -6.36083984375, -5.373046875, -4.38525390625, -3.3974609375, -2.40966796875, -1.421875, -0.43408203125, 0.5537109375, 1.54150390625, 2.529296875, 3.51708984375, 4.5048828125, 5.49267578125, 6.48046875, 7.46826171875, 8.4560546875, 9.44384765625, 10.431640625, 11.41943359375, 12.4072265625, 13.39501953125, 14.3828125, 15.37060546875, 16.3583984375, 17.34619140625, 18.333984375, 19.32177734375, 20.3095703125, 21.29736328125, 22.28515625, 23.27294921875, 24.2607421875, 25.24853515625, 26.236328125, 27.22412109375, 28.2119140625, 29.19970703125, 30.1875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [7.0, 24.0, 137.0, 260.0, 310.0, 176.0, 73.0, 19.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9876203536987305, -3.842341899871826, -2.6970632076263428, -1.5517845153808594, -0.4065060615539551, 0.7387723922729492, 1.8840513229370117, 3.029329299926758, 4.17460823059082, 5.319886684417725, 6.465165138244629, 7.610444068908691, 8.755722045898438, 9.9010009765625, 11.046279907226562, 12.191557884216309, 13.336836814880371, 14.482115745544434, 15.62739372253418, 16.772672653198242, 17.917951583862305, 19.063228607177734, 20.208507537841797, 21.35378646850586, 22.499065399169922, 23.644344329833984, 24.789623260498047, 25.93490219116211, 27.08017921447754, 28.2254581451416, 29.370737075805664, 30.516014099121094, 31.661296844482422, 32.806575775146484, 33.95185470581055, 35.09713363647461, 36.24241256713867, 37.38768768310547, 38.53296661376953, 39.678245544433594, 40.823524475097656, 41.96880340576172, 43.11408233642578, 44.259361267089844, 45.404640197753906, 46.54991912841797, 47.69519805908203, 48.84047317504883, 49.985755920410156, 51.13103485107422, 52.27631378173828, 53.421592712402344, 54.566871643066406, 55.71215057373047, 56.85742950439453, 58.00270462036133, 59.14798355102539, 60.29326248168945, 61.438541412353516, 62.58382034301758, 63.72909927368164, 64.87437438964844, 66.0196533203125, 67.16493225097656, 68.31021118164062]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 7.0, 5.0, 10.0, 6.0, 13.0, 22.0, 22.0, 18.0, 18.0, 20.0, 15.0, 26.0, 30.0, 30.0, 24.0, 35.0, 40.0, 33.0, 37.0, 33.0, 34.0, 34.0, 33.0, 37.0, 37.0, 38.0, 32.0, 41.0, 23.0, 35.0, 31.0, 21.0, 16.0, 28.0, 18.0, 15.0, 17.0, 10.0, 10.0, 9.0, 8.0, 8.0, 9.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-55.81963348388672, -54.091609954833984, -52.363582611083984, -50.63555908203125, -48.907535552978516, -47.17951202392578, -45.45148468017578, -43.72346115112305, -41.99543762207031, -40.26741409301758, -38.53938674926758, -36.811363220214844, -35.08333969116211, -33.355316162109375, -31.627288818359375, -29.89926528930664, -28.17123794555664, -26.443212509155273, -24.71518898010254, -22.987163543701172, -21.259140014648438, -19.53111457824707, -17.803089141845703, -16.07506561279297, -14.347040176391602, -12.61901569366455, -10.8909912109375, -9.162965774536133, -7.434941291809082, -5.706916809082031, -3.978891372680664, -2.2508668899536133, -0.5228424072265625, 1.2051823139190674, 2.9332070350646973, 4.661231994628906, 6.389256477355957, 8.117280960083008, 9.845306396484375, 11.573330879211426, 13.301355361938477, 15.029379844665527, 16.757404327392578, 18.485429763793945, 20.213455200195312, 21.941478729248047, 23.669504165649414, 25.39752960205078, 27.125553131103516, 28.853578567504883, 30.581602096557617, 32.309627532958984, 34.03765106201172, 35.76567840576172, 37.49370193481445, 39.22172546386719, 40.94975280761719, 42.67777633666992, 44.40580368041992, 46.133827209472656, 47.86185073852539, 49.589874267578125, 51.317901611328125, 53.04592514038086, 54.773948669433594]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 12.0, 10.0, 15.0, 25.0, 19.0, 30.0, 42.0, 46.0, 38.0, 44.0, 54.0, 42.0, 46.0, 60.0, 43.0, 62.0, 48.0, 49.0, 42.0, 39.0, 37.0, 28.0, 40.0, 26.0, 21.0, 20.0, 6.0, 15.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.8870849609375, -5.676513671875, -5.4659423828125, -5.25537109375, -5.0447998046875, -4.834228515625, -4.6236572265625, -4.4130859375, -4.2025146484375, -3.991943359375, -3.7813720703125, -3.57080078125, -3.3602294921875, -3.149658203125, -2.9390869140625, -2.728515625, -2.5179443359375, -2.307373046875, -2.0968017578125, -1.88623046875, -1.6756591796875, -1.465087890625, -1.2545166015625, -1.0439453125, -0.8333740234375, -0.622802734375, -0.4122314453125, -0.20166015625, 0.0089111328125, 0.219482421875, 0.4300537109375, 0.640625, 0.8511962890625, 1.061767578125, 1.2723388671875, 1.48291015625, 1.6934814453125, 1.904052734375, 2.1146240234375, 2.3251953125, 2.5357666015625, 2.746337890625, 2.9569091796875, 3.16748046875, 3.3780517578125, 3.588623046875, 3.7991943359375, 4.009765625, 4.2203369140625, 4.430908203125, 4.6414794921875, 4.85205078125, 5.0626220703125, 5.273193359375, 5.4837646484375, 5.6943359375, 5.9049072265625, 6.115478515625, 6.3260498046875, 6.53662109375, 6.7471923828125, 6.957763671875, 7.1683349609375, 7.37890625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 9.0, 4.0, 15.0, 11.0, 19.0, 24.0, 26.0, 49.0, 72.0, 130.0, 184.0, 525.0, 2148.0, 10982.0, 111447.0, 2549466.0, 1451115.0, 58119.0, 7352.0, 1605.0, 459.0, 174.0, 107.0, 66.0, 53.0, 24.0, 23.0, 22.0, 6.0, 16.0, 9.0, 11.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.587890625, -16.95703125, -16.326171875, -15.6953125, -15.064453125, -14.43359375, -13.802734375, -13.171875, -12.541015625, -11.91015625, -11.279296875, -10.6484375, -10.017578125, -9.38671875, -8.755859375, -8.125, -7.494140625, -6.86328125, -6.232421875, -5.6015625, -4.970703125, -4.33984375, -3.708984375, -3.078125, -2.447265625, -1.81640625, -1.185546875, -0.5546875, 0.076171875, 0.70703125, 1.337890625, 1.96875, 2.599609375, 3.23046875, 3.861328125, 4.4921875, 5.123046875, 5.75390625, 6.384765625, 7.015625, 7.646484375, 8.27734375, 8.908203125, 9.5390625, 10.169921875, 10.80078125, 11.431640625, 12.0625, 12.693359375, 13.32421875, 13.955078125, 14.5859375, 15.216796875, 15.84765625, 16.478515625, 17.109375, 17.740234375, 18.37109375, 19.001953125, 19.6328125, 20.263671875, 20.89453125, 21.525390625, 22.15625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 6.0, 24.0, 17.0, 35.0, 30.0, 58.0, 67.0, 90.0, 121.0, 149.0, 179.0, 245.0, 317.0, 393.0, 406.0, 367.0, 368.0, 290.0, 207.0, 173.0, 118.0, 108.0, 75.0, 52.0, 45.0, 26.0, 24.0, 11.0, 13.0, 9.0, 7.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -15.0655517578125, -14.654541015625, -14.2435302734375, -13.83251953125, -13.4215087890625, -13.010498046875, -12.5994873046875, -12.1884765625, -11.7774658203125, -11.366455078125, -10.9554443359375, -10.54443359375, -10.1334228515625, -9.722412109375, -9.3114013671875, -8.900390625, -8.4893798828125, -8.078369140625, -7.6673583984375, -7.25634765625, -6.8453369140625, -6.434326171875, -6.0233154296875, -5.6123046875, -5.2012939453125, -4.790283203125, -4.3792724609375, -3.96826171875, -3.5572509765625, -3.146240234375, -2.7352294921875, -2.32421875, -1.9132080078125, -1.502197265625, -1.0911865234375, -0.68017578125, -0.2691650390625, 0.141845703125, 0.5528564453125, 0.9638671875, 1.3748779296875, 1.785888671875, 2.1968994140625, 2.60791015625, 3.0189208984375, 3.429931640625, 3.8409423828125, 4.251953125, 4.6629638671875, 5.073974609375, 5.4849853515625, 5.89599609375, 6.3070068359375, 6.718017578125, 7.1290283203125, 7.5400390625, 7.9510498046875, 8.362060546875, 8.7730712890625, 9.18408203125, 9.5950927734375, 10.006103515625, 10.4171142578125, 10.828125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 14.0, 10.0, 26.0, 37.0, 31.0, 64.0, 94.0, 119.0, 192.0, 312.0, 620.0, 4304.0, 154037.0, 3918815.0, 110646.0, 3549.0, 539.0, 290.0, 165.0, 129.0, 75.0, 54.0, 45.0, 24.0, 24.0, 21.0, 13.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -38.724609375, -37.07421875, -35.423828125, -33.7734375, -32.123046875, -30.47265625, -28.822265625, -27.171875, -25.521484375, -23.87109375, -22.220703125, -20.5703125, -18.919921875, -17.26953125, -15.619140625, -13.96875, -12.318359375, -10.66796875, -9.017578125, -7.3671875, -5.716796875, -4.06640625, -2.416015625, -0.765625, 0.884765625, 2.53515625, 4.185546875, 5.8359375, 7.486328125, 9.13671875, 10.787109375, 12.4375, 14.087890625, 15.73828125, 17.388671875, 19.0390625, 20.689453125, 22.33984375, 23.990234375, 25.640625, 27.291015625, 28.94140625, 30.591796875, 32.2421875, 33.892578125, 35.54296875, 37.193359375, 38.84375, 40.494140625, 42.14453125, 43.794921875, 45.4453125, 47.095703125, 48.74609375, 50.396484375, 52.046875, 53.697265625, 55.34765625, 56.998046875, 58.6484375, 60.298828125, 61.94921875, 63.599609375, 65.25]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 8.0, 32.0, 44.0, 75.0, 112.0, 126.0, 143.0, 124.0, 119.0, 78.0, 52.0, 28.0, 21.0, 17.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.53249740600586, -59.126258850097656, -56.72001647949219, -54.313777923583984, -51.907535552978516, -49.50129699707031, -47.095054626464844, -44.68881607055664, -42.28257751464844, -39.876338958740234, -37.470096588134766, -35.06385803222656, -32.657615661621094, -30.25137710571289, -27.845136642456055, -25.43889617919922, -23.03265380859375, -20.626413345336914, -18.220172882080078, -15.813933372497559, -13.407692909240723, -11.001452445983887, -8.595212936401367, -6.188972473144531, -3.7827320098876953, -1.3764917850494385, 1.0297484397888184, 3.435988426208496, 5.842228889465332, 8.248469352722168, 10.654708862304688, 13.060949325561523, 15.467193603515625, 17.87343406677246, 20.279674530029297, 22.6859130859375, 25.09215545654297, 27.498394012451172, 29.904634475708008, 32.310874938964844, 34.71711730957031, 37.123355865478516, 39.529598236083984, 41.93583679199219, 44.342079162597656, 46.74831771850586, 49.15455627441406, 51.56079864501953, 53.967037200927734, 56.37327575683594, 58.779518127441406, 61.18575668334961, 63.59199905395508, 65.99823760986328, 68.40447998046875, 70.81071472167969, 73.21695709228516, 75.62319946289062, 78.02943420410156, 80.43567657470703, 82.8419189453125, 85.24816131591797, 87.6543960571289, 90.06063842773438, 92.46688079833984]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 6.0, 4.0, 9.0, 11.0, 17.0, 13.0, 18.0, 18.0, 29.0, 29.0, 33.0, 25.0, 39.0, 34.0, 25.0, 42.0, 34.0, 40.0, 29.0, 45.0, 43.0, 43.0, 44.0, 33.0, 33.0, 37.0, 37.0, 36.0, 22.0, 21.0, 16.0, 15.0, 29.0, 13.0, 11.0, 17.0, 8.0, 7.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-50.12028503417969, -48.74879837036133, -47.37731170654297, -46.00582504272461, -44.63433837890625, -43.262855529785156, -41.89136505126953, -40.51988220214844, -39.14839553833008, -37.77690887451172, -36.40542221069336, -35.033935546875, -33.66244888305664, -32.29096221923828, -30.919477462768555, -29.547992706298828, -28.176504135131836, -26.805017471313477, -25.433530807495117, -24.06204605102539, -22.69055938720703, -21.319072723388672, -19.947586059570312, -18.576099395751953, -17.204612731933594, -15.833126068115234, -14.461640357971191, -13.090153694152832, -11.718667984008789, -10.34718132019043, -8.97569465637207, -7.604208946228027, -6.232723236083984, -4.861237049102783, -3.489750623703003, -2.1182641983032227, -0.7467780113220215, 0.6247081756591797, 1.996194839477539, 3.367680549621582, 4.739167213439941, 6.110653400421143, 7.482139587402344, 8.853626251220703, 10.225112915039062, 11.596598625183105, 12.968085289001465, 14.339570999145508, 15.711057662963867, 17.082544326782227, 18.454030990600586, 19.825515747070312, 21.197002410888672, 22.56848907470703, 23.93997573852539, 25.31146240234375, 26.68294906616211, 28.05443572998047, 29.425922393798828, 30.797409057617188, 32.16889572143555, 33.540382385253906, 34.911865234375, 36.28335189819336, 37.65483856201172]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 25.0, 30.0, 20.0, 33.0, 30.0, 31.0, 46.0, 52.0, 61.0, 46.0, 39.0, 53.0, 51.0, 57.0, 37.0, 39.0, 44.0, 46.0, 33.0, 35.0, 25.0, 28.0, 20.0, 9.0, 14.0, 12.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1868896484375, -4.983154296875, -4.7794189453125, -4.57568359375, -4.3719482421875, -4.168212890625, -3.9644775390625, -3.7607421875, -3.5570068359375, -3.353271484375, -3.1495361328125, -2.94580078125, -2.7420654296875, -2.538330078125, -2.3345947265625, -2.130859375, -1.9271240234375, -1.723388671875, -1.5196533203125, -1.31591796875, -1.1121826171875, -0.908447265625, -0.7047119140625, -0.5009765625, -0.2972412109375, -0.093505859375, 0.1102294921875, 0.31396484375, 0.5177001953125, 0.721435546875, 0.9251708984375, 1.12890625, 1.3326416015625, 1.536376953125, 1.7401123046875, 1.94384765625, 2.1475830078125, 2.351318359375, 2.5550537109375, 2.7587890625, 2.9625244140625, 3.166259765625, 3.3699951171875, 3.57373046875, 3.7774658203125, 3.981201171875, 4.1849365234375, 4.388671875, 4.5924072265625, 4.796142578125, 4.9998779296875, 5.20361328125, 5.4073486328125, 5.611083984375, 5.8148193359375, 6.0185546875, 6.2222900390625, 6.426025390625, 6.6297607421875, 6.83349609375, 7.0372314453125, 7.240966796875, 7.4447021484375, 7.6484375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 10.0, 22.0, 38.0, 55.0, 57.0, 102.0, 171.0, 227.0, 340.0, 520.0, 696.0, 1056.0, 1542.0, 2117.0, 3025.0, 4508.0, 6407.0, 9323.0, 13994.0, 20706.0, 31572.0, 50004.0, 83999.0, 154173.0, 235353.0, 173503.0, 94529.0, 55294.0, 34678.0, 22737.0, 15150.0, 10143.0, 6924.0, 4762.0, 3319.0, 2223.0, 1695.0, 1102.0, 778.0, 559.0, 340.0, 287.0, 160.0, 114.0, 66.0, 59.0, 44.0, 22.0, 17.0, 7.0, 11.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6964797973632812, -0.6737213134765625, -0.6509628295898438, -0.628204345703125, -0.6054458618164062, -0.5826873779296875, -0.5599288940429688, -0.53717041015625, -0.5144119262695312, -0.4916534423828125, -0.46889495849609375, -0.446136474609375, -0.42337799072265625, -0.4006195068359375, -0.37786102294921875, -0.3551025390625, -0.33234405517578125, -0.3095855712890625, -0.28682708740234375, -0.264068603515625, -0.24131011962890625, -0.2185516357421875, -0.19579315185546875, -0.17303466796875, -0.15027618408203125, -0.1275177001953125, -0.10475921630859375, -0.082000732421875, -0.05924224853515625, -0.0364837646484375, -0.01372528076171875, 0.009033203125, 0.03179168701171875, 0.0545501708984375, 0.07730865478515625, 0.100067138671875, 0.12282562255859375, 0.1455841064453125, 0.16834259033203125, 0.19110107421875, 0.21385955810546875, 0.2366180419921875, 0.25937652587890625, 0.282135009765625, 0.30489349365234375, 0.3276519775390625, 0.35041046142578125, 0.3731689453125, 0.39592742919921875, 0.4186859130859375, 0.44144439697265625, 0.464202880859375, 0.48696136474609375, 0.5097198486328125, 0.5324783325195312, 0.55523681640625, 0.5779953002929688, 0.6007537841796875, 0.6235122680664062, 0.646270751953125, 0.6690292358398438, 0.6917877197265625, 0.7145462036132812, 0.7373046875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 7.0, 15.0, 17.0, 14.0, 24.0, 22.0, 19.0, 27.0, 24.0, 27.0, 35.0, 24.0, 27.0, 52.0, 40.0, 56.0, 1057.0, 40.0, 39.0, 49.0, 43.0, 38.0, 29.0, 31.0, 36.0, 29.0, 19.0, 23.0, 21.0, 23.0, 18.0, 14.0, 9.0, 16.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.1611328125, -3.05859375, -2.9560546875, -2.853515625, -2.7509765625, -2.6484375, -2.5458984375, -2.443359375, -2.3408203125, -2.23828125, -2.1357421875, -2.033203125, -1.9306640625, -1.828125, -1.7255859375, -1.623046875, -1.5205078125, -1.41796875, -1.3154296875, -1.212890625, -1.1103515625, -1.0078125, -0.9052734375, -0.802734375, -0.7001953125, -0.59765625, -0.4951171875, -0.392578125, -0.2900390625, -0.1875, -0.0849609375, 0.017578125, 0.1201171875, 0.22265625, 0.3251953125, 0.427734375, 0.5302734375, 0.6328125, 0.7353515625, 0.837890625, 0.9404296875, 1.04296875, 1.1455078125, 1.248046875, 1.3505859375, 1.453125, 1.5556640625, 1.658203125, 1.7607421875, 1.86328125, 1.9658203125, 2.068359375, 2.1708984375, 2.2734375, 2.3759765625, 2.478515625, 2.5810546875, 2.68359375, 2.7861328125, 2.888671875, 2.9912109375, 3.09375, 3.1962890625, 3.298828125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 17.0, 15.0, 25.0, 45.0, 62.0, 108.0, 142.0, 217.0, 326.0, 472.0, 728.0, 957.0, 1379.0, 1976.0, 3061.0, 4634.0, 7005.0, 10844.0, 16866.0, 26753.0, 44179.0, 77416.0, 144004.0, 1291967.0, 199938.0, 107361.0, 59594.0, 35117.0, 21533.0, 13903.0, 8950.0, 5636.0, 3829.0, 2586.0, 1745.0, 1196.0, 835.0, 552.0, 381.0, 264.0, 166.0, 117.0, 71.0, 54.0, 36.0, 24.0, 11.0, 10.0, 11.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6298828125, -0.6094131469726562, -0.5889434814453125, -0.5684738159179688, -0.548004150390625, -0.5275344848632812, -0.5070648193359375, -0.48659515380859375, -0.46612548828125, -0.44565582275390625, -0.4251861572265625, -0.40471649169921875, -0.384246826171875, -0.36377716064453125, -0.3433074951171875, -0.32283782958984375, -0.3023681640625, -0.28189849853515625, -0.2614288330078125, -0.24095916748046875, -0.220489501953125, -0.20001983642578125, -0.1795501708984375, -0.15908050537109375, -0.13861083984375, -0.11814117431640625, -0.0976715087890625, -0.07720184326171875, -0.056732177734375, -0.03626251220703125, -0.0157928466796875, 0.00467681884765625, 0.025146484375, 0.04561614990234375, 0.0660858154296875, 0.08655548095703125, 0.107025146484375, 0.12749481201171875, 0.1479644775390625, 0.16843414306640625, 0.18890380859375, 0.20937347412109375, 0.2298431396484375, 0.25031280517578125, 0.270782470703125, 0.29125213623046875, 0.3117218017578125, 0.33219146728515625, 0.3526611328125, 0.37313079833984375, 0.3936004638671875, 0.41407012939453125, 0.434539794921875, 0.45500946044921875, 0.4754791259765625, 0.49594879150390625, 0.51641845703125, 0.5368881225585938, 0.5573577880859375, 0.5778274536132812, 0.598297119140625, 0.6187667846679688, 0.6392364501953125, 0.6597061157226562, 0.68017578125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 14.0, 12.0, 24.0, 27.0, 24.0, 18.0, 49.0, 42.0, 53.0, 58.0, 68.0, 51.0, 60.0, 70.0, 62.0, 57.0, 42.0, 45.0, 30.0, 32.0, 20.0, 19.0, 17.0, 15.0, 10.0, 11.0, 6.0, 4.0, 7.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00194549560546875, -0.0018904954195022583, -0.0018354952335357666, -0.001780495047569275, -0.0017254948616027832, -0.0016704946756362915, -0.0016154944896697998, -0.001560494303703308, -0.0015054941177368164, -0.0014504939317703247, -0.001395493745803833, -0.0013404935598373413, -0.0012854933738708496, -0.001230493187904358, -0.0011754930019378662, -0.0011204928159713745, -0.0010654926300048828, -0.0010104924440383911, -0.0009554922580718994, -0.0009004920721054077, -0.000845491886138916, -0.0007904917001724243, -0.0007354915142059326, -0.0006804913282394409, -0.0006254911422729492, -0.0005704909563064575, -0.0005154907703399658, -0.0004604905843734741, -0.0004054903984069824, -0.0003504902124404907, -0.000295490026473999, -0.00024048984050750732, -0.00018548965454101562, -0.00013048946857452393, -7.548928260803223e-05, -2.0489096641540527e-05, 3.451108932495117e-05, 8.951127529144287e-05, 0.00014451146125793457, 0.00019951164722442627, 0.00025451183319091797, 0.00030951201915740967, 0.00036451220512390137, 0.00041951239109039307, 0.00047451257705688477, 0.0005295127630233765, 0.0005845129489898682, 0.0006395131349563599, 0.0006945133209228516, 0.0007495135068893433, 0.000804513692855835, 0.0008595138788223267, 0.0009145140647888184, 0.0009695142507553101, 0.0010245144367218018, 0.0010795146226882935, 0.0011345148086547852, 0.0011895149946212769, 0.0012445151805877686, 0.0012995153665542603, 0.001354515552520752, 0.0014095157384872437, 0.0014645159244537354, 0.001519516110420227, 0.0015745162963867188]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 4.0, 8.0, 7.0, 6.0, 13.0, 15.0, 25.0, 39.0, 57.0, 86.0, 133.0, 221.0, 436.0, 1627.0, 1007507.0, 36870.0, 691.0, 294.0, 187.0, 99.0, 62.0, 44.0, 29.0, 23.0, 17.0, 11.0, 17.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04339599609375, -0.041886329650878906, -0.04037666320800781, -0.03886699676513672, -0.037357330322265625, -0.03584766387939453, -0.03433799743652344, -0.032828330993652344, -0.03131866455078125, -0.029808998107910156, -0.028299331665039062, -0.02678966522216797, -0.025279998779296875, -0.02377033233642578, -0.022260665893554688, -0.020750999450683594, -0.0192413330078125, -0.017731666564941406, -0.016222000122070312, -0.014712333679199219, -0.013202667236328125, -0.011693000793457031, -0.010183334350585938, -0.008673667907714844, -0.00716400146484375, -0.005654335021972656, -0.0041446685791015625, -0.0026350021362304688, -0.001125335693359375, 0.00038433074951171875, 0.0018939971923828125, 0.0034036636352539062, 0.004913330078125, 0.006422996520996094, 0.007932662963867188, 0.009442329406738281, 0.010951995849609375, 0.012461662292480469, 0.013971328735351562, 0.015480995178222656, 0.01699066162109375, 0.018500328063964844, 0.020009994506835938, 0.02151966094970703, 0.023029327392578125, 0.02453899383544922, 0.026048660278320312, 0.027558326721191406, 0.0290679931640625, 0.030577659606933594, 0.03208732604980469, 0.03359699249267578, 0.035106658935546875, 0.03661632537841797, 0.03812599182128906, 0.039635658264160156, 0.04114532470703125, 0.042654991149902344, 0.04416465759277344, 0.04567432403564453, 0.047183990478515625, 0.04869365692138672, 0.05020332336425781, 0.051712989807128906, 0.05322265625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 10.0, 761.0, 248.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00523178419098258, -0.004789181984961033, -0.0043465797789394855, -0.0039039775729179382, -0.003461375366896391, -0.0030187733937054873, -0.00257617118768394, -0.0021335689816623926, -0.0016909667756408453, -0.001248364569619298, -0.0008057624218054116, -0.0003631602739915252, 7.944193203002214e-05, 0.0005220440216362476, 0.000964646227657795, 0.0014072484336793423, 0.0018498506397008896, 0.002292452845722437, 0.0027350550517439842, 0.0031776572577655315, 0.003620259463787079, 0.004062861204147339, 0.0045054638758301735, 0.0049480656161904335, 0.005390668287873268, 0.0058332704938948154, 0.006275872699916363, 0.00671847490593791, 0.007161077111959457, 0.007603678852319717, 0.008046281524002552, 0.008488883264362812, 0.008931485004723072, 0.009374086745083332, 0.009816689416766167, 0.010259291157126427, 0.010701893828809261, 0.011144495569169521, 0.011587098240852356, 0.012029699981212616, 0.01247230265289545, 0.01291490439325571, 0.013357507064938545, 0.013800108805298805, 0.01424271147698164, 0.0146853132173419, 0.015127915889024734, 0.015570517629384995, 0.016013119369745255, 0.016455721110105515, 0.016898322850465775, 0.017340926453471184, 0.017783528193831444, 0.018226129934191704, 0.018668731674551964, 0.019111335277557373, 0.019553937017917633, 0.019996538758277893, 0.020439140498638153, 0.020881744101643562, 0.021324345842003822, 0.021766947582364082, 0.022209549322724342, 0.02265215292572975, 0.02309475466609001]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 10.0, 9.0, 8.0, 11.0, 13.0, 10.0, 17.0, 14.0, 17.0, 26.0, 30.0, 36.0, 38.0, 21.0, 33.0, 36.0, 39.0, 41.0, 48.0, 46.0, 41.0, 52.0, 38.0, 35.0, 45.0, 29.0, 34.0, 34.0, 40.0, 19.0, 24.0, 13.0, 18.0, 16.0, 10.0, 9.0, 8.0, 7.0, 5.0, 3.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009239912033081055, -0.0008953018113970757, -0.0008666124194860458, -0.000837923027575016, -0.0008092336356639862, -0.0007805442437529564, -0.0007518548518419266, -0.0007231654599308968, -0.0006944760680198669, -0.0006657866761088371, -0.0006370972841978073, -0.0006084078922867775, -0.0005797185003757477, -0.0005510291084647179, -0.000522339716553688, -0.0004936503246426582, -0.0004649609327316284, -0.0004362715408205986, -0.0004075821489095688, -0.00037889275699853897, -0.00035020336508750916, -0.00032151397317647934, -0.0002928245812654495, -0.0002641351893544197, -0.0002354457974433899, -0.00020675640553236008, -0.00017806701362133026, -0.00014937762171030045, -0.00012068822979927063, -9.199883788824081e-05, -6.3309445977211e-05, -3.462005406618118e-05, -5.930662155151367e-06, 2.275872975587845e-05, 5.1448121666908264e-05, 8.013751357793808e-05, 0.0001088269054889679, 0.0001375162973999977, 0.00016620568931102753, 0.00019489508122205734, 0.00022358447313308716, 0.000252273865044117, 0.0002809632569551468, 0.0003096526488661766, 0.0003383420407772064, 0.00036703143268823624, 0.00039572082459926605, 0.00042441021651029587, 0.0004530996084213257, 0.0004817890003323555, 0.0005104783922433853, 0.0005391677841544151, 0.000567857176065445, 0.0005965465679764748, 0.0006252359598875046, 0.0006539253517985344, 0.0006826147437095642, 0.000711304135620594, 0.0007399935275316238, 0.0007686829194426537, 0.0007973723113536835, 0.0008260617032647133, 0.0008547510951757431, 0.0008834404870867729, 0.0009121298789978027]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 6.0, 6.0, 12.0, 11.0, 14.0, 15.0, 25.0, 30.0, 20.0, 33.0, 30.0, 31.0, 46.0, 52.0, 61.0, 46.0, 39.0, 53.0, 51.0, 57.0, 37.0, 39.0, 44.0, 46.0, 33.0, 35.0, 25.0, 28.0, 20.0, 9.0, 14.0, 12.0, 9.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.1868896484375, -4.983154296875, -4.7794189453125, -4.57568359375, -4.3719482421875, -4.168212890625, -3.9644775390625, -3.7607421875, -3.5570068359375, -3.353271484375, -3.1495361328125, -2.94580078125, -2.7420654296875, -2.538330078125, -2.3345947265625, -2.130859375, -1.9271240234375, -1.723388671875, -1.5196533203125, -1.31591796875, -1.1121826171875, -0.908447265625, -0.7047119140625, -0.5009765625, -0.2972412109375, -0.093505859375, 0.1102294921875, 0.31396484375, 0.5177001953125, 0.721435546875, 0.9251708984375, 1.12890625, 1.3326416015625, 1.536376953125, 1.7401123046875, 1.94384765625, 2.1475830078125, 2.351318359375, 2.5550537109375, 2.7587890625, 2.9625244140625, 3.166259765625, 3.3699951171875, 3.57373046875, 3.7774658203125, 3.981201171875, 4.1849365234375, 4.388671875, 4.5924072265625, 4.796142578125, 4.9998779296875, 5.20361328125, 5.4073486328125, 5.611083984375, 5.8148193359375, 6.0185546875, 6.2222900390625, 6.426025390625, 6.6297607421875, 6.83349609375, 7.0372314453125, 7.240966796875, 7.4447021484375, 7.6484375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 8.0, 15.0, 11.0, 25.0, 25.0, 49.0, 62.0, 89.0, 121.0, 157.0, 247.0, 356.0, 486.0, 676.0, 885.0, 1278.0, 1827.0, 2414.0, 3466.0, 5094.0, 7593.0, 12631.0, 25019.0, 63656.0, 211232.0, 459942.0, 148983.0, 48347.0, 20613.0, 10943.0, 6728.0, 4458.0, 3190.0, 2286.0, 1612.0, 1120.0, 810.0, 607.0, 429.0, 302.0, 211.0, 164.0, 105.0, 71.0, 65.0, 40.0, 42.0, 18.0, 10.0, 16.0, 11.0, 11.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.96875, -3.84613037109375, -3.7235107421875, -3.60089111328125, -3.478271484375, -3.35565185546875, -3.2330322265625, -3.11041259765625, -2.98779296875, -2.86517333984375, -2.7425537109375, -2.61993408203125, -2.497314453125, -2.37469482421875, -2.2520751953125, -2.12945556640625, -2.0068359375, -1.88421630859375, -1.7615966796875, -1.63897705078125, -1.516357421875, -1.39373779296875, -1.2711181640625, -1.14849853515625, -1.02587890625, -0.90325927734375, -0.7806396484375, -0.65802001953125, -0.535400390625, -0.41278076171875, -0.2901611328125, -0.16754150390625, -0.044921875, 0.07769775390625, 0.2003173828125, 0.32293701171875, 0.445556640625, 0.56817626953125, 0.6907958984375, 0.81341552734375, 0.93603515625, 1.05865478515625, 1.1812744140625, 1.30389404296875, 1.426513671875, 1.54913330078125, 1.6717529296875, 1.79437255859375, 1.9169921875, 2.03961181640625, 2.1622314453125, 2.28485107421875, 2.407470703125, 2.53009033203125, 2.6527099609375, 2.77532958984375, 2.89794921875, 3.02056884765625, 3.1431884765625, 3.26580810546875, 3.388427734375, 3.51104736328125, 3.6336669921875, 3.75628662109375, 3.87890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 5.0, 13.0, 10.0, 14.0, 15.0, 19.0, 22.0, 22.0, 33.0, 28.0, 26.0, 40.0, 50.0, 37.0, 63.0, 102.0, 403.0, 1609.0, 102.0, 57.0, 56.0, 34.0, 34.0, 28.0, 29.0, 30.0, 37.0, 25.0, 22.0, 17.0, 18.0, 10.0, 9.0, 1.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.34375, -20.69873046875, -20.0537109375, -19.40869140625, -18.763671875, -18.11865234375, -17.4736328125, -16.82861328125, -16.18359375, -15.53857421875, -14.8935546875, -14.24853515625, -13.603515625, -12.95849609375, -12.3134765625, -11.66845703125, -11.0234375, -10.37841796875, -9.7333984375, -9.08837890625, -8.443359375, -7.79833984375, -7.1533203125, -6.50830078125, -5.86328125, -5.21826171875, -4.5732421875, -3.92822265625, -3.283203125, -2.63818359375, -1.9931640625, -1.34814453125, -0.703125, -0.05810546875, 0.5869140625, 1.23193359375, 1.876953125, 2.52197265625, 3.1669921875, 3.81201171875, 4.45703125, 5.10205078125, 5.7470703125, 6.39208984375, 7.037109375, 7.68212890625, 8.3271484375, 8.97216796875, 9.6171875, 10.26220703125, 10.9072265625, 11.55224609375, 12.197265625, 12.84228515625, 13.4873046875, 14.13232421875, 14.77734375, 15.42236328125, 16.0673828125, 16.71240234375, 17.357421875, 18.00244140625, 18.6474609375, 19.29248046875, 19.9375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 2.0, 5.0, 10.0, 12.0, 26.0, 30.0, 26.0, 28.0, 37.0, 46.0, 70.0, 108.0, 182.0, 239.0, 392.0, 1544.0, 21743.0, 3062024.0, 54996.0, 2719.0, 512.0, 272.0, 180.0, 127.0, 86.0, 51.0, 38.0, 38.0, 29.0, 17.0, 25.0, 17.0, 10.0, 14.0, 8.0, 2.0, 6.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-35.4375, -34.2802734375, -33.123046875, -31.9658203125, -30.80859375, -29.6513671875, -28.494140625, -27.3369140625, -26.1796875, -25.0224609375, -23.865234375, -22.7080078125, -21.55078125, -20.3935546875, -19.236328125, -18.0791015625, -16.921875, -15.7646484375, -14.607421875, -13.4501953125, -12.29296875, -11.1357421875, -9.978515625, -8.8212890625, -7.6640625, -6.5068359375, -5.349609375, -4.1923828125, -3.03515625, -1.8779296875, -0.720703125, 0.4365234375, 1.59375, 2.7509765625, 3.908203125, 5.0654296875, 6.22265625, 7.3798828125, 8.537109375, 9.6943359375, 10.8515625, 12.0087890625, 13.166015625, 14.3232421875, 15.48046875, 16.6376953125, 17.794921875, 18.9521484375, 20.109375, 21.2666015625, 22.423828125, 23.5810546875, 24.73828125, 25.8955078125, 27.052734375, 28.2099609375, 29.3671875, 30.5244140625, 31.681640625, 32.8388671875, 33.99609375, 35.1533203125, 36.310546875, 37.4677734375, 38.625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 41.0, 148.0, 333.0, 307.0, 140.0, 32.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.50423049926758, -55.807281494140625, -54.11033248901367, -52.41338348388672, -50.716434478759766, -49.01948547363281, -47.322540283203125, -45.62559127807617, -43.92864227294922, -42.231693267822266, -40.53474426269531, -38.83779525756836, -37.140846252441406, -35.44390106201172, -33.7469482421875, -32.05000305175781, -30.353052139282227, -28.656103134155273, -26.95915412902832, -25.26220703125, -23.565258026123047, -21.868309020996094, -20.17136001586914, -18.474411010742188, -16.777462005615234, -15.080513000488281, -13.383564949035645, -11.686615943908691, -9.989667892456055, -8.292718887329102, -6.595769882202148, -4.898821830749512, -3.201873779296875, -1.5049251317977905, 0.19202351570129395, 1.888972282409668, 3.585920810699463, 5.282869338989258, 6.979818344116211, 8.676766395568848, 10.3737154006958, 12.070664405822754, 13.76761245727539, 15.464561462402344, 17.161510467529297, 18.85845947265625, 20.555408477783203, 22.252355575561523, 23.949304580688477, 25.64625358581543, 27.343202590942383, 29.040149688720703, 30.737098693847656, 32.43404769897461, 34.13099670410156, 35.827945709228516, 37.52489471435547, 39.22184371948242, 40.918792724609375, 42.61574172973633, 44.31269073486328, 46.00963592529297, 47.70658874511719, 49.403533935546875, 51.10048294067383]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 9.0, 13.0, 18.0, 12.0, 25.0, 24.0, 16.0, 18.0, 24.0, 23.0, 30.0, 35.0, 38.0, 43.0, 34.0, 45.0, 64.0, 42.0, 39.0, 38.0, 47.0, 43.0, 43.0, 29.0, 29.0, 29.0, 24.0, 25.0, 21.0, 22.0, 12.0, 13.0, 12.0, 7.0, 10.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-57.369537353515625, -55.53218078613281, -53.694828033447266, -51.85747146606445, -50.02011489868164, -48.182762145996094, -46.34540557861328, -44.50804901123047, -42.670692443847656, -40.833335876464844, -38.9959831237793, -37.158626556396484, -35.32126998901367, -33.483917236328125, -31.646560668945312, -29.8092041015625, -27.971851348876953, -26.134496688842773, -24.29714012145996, -22.45978546142578, -20.62242889404297, -18.78507423400879, -16.94771957397461, -15.110363960266113, -13.273008346557617, -11.435652732849121, -9.598297119140625, -7.760942459106445, -5.923586845397949, -4.086231231689453, -2.2488765716552734, -0.41152095794677734, 1.4258346557617188, 3.2631900310516357, 5.100545406341553, 6.937900543212891, 8.775256156921387, 10.612611770629883, 12.449966430664062, 14.287322044372559, 16.124677658081055, 17.962032318115234, 19.799388885498047, 21.636743545532227, 23.474098205566406, 25.31145477294922, 27.1488094329834, 28.986164093017578, 30.82352066040039, 32.6608772277832, 34.49822998046875, 36.33558654785156, 38.172943115234375, 40.01029968261719, 41.847652435302734, 43.68500900268555, 45.522361755371094, 47.359718322753906, 49.19707107543945, 51.034427642822266, 52.87178421020508, 54.709136962890625, 56.54649353027344, 58.38385009765625, 60.22120666503906]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 7.0, 6.0, 13.0, 13.0, 17.0, 24.0, 31.0, 23.0, 24.0, 34.0, 30.0, 46.0, 61.0, 55.0, 49.0, 39.0, 55.0, 48.0, 51.0, 44.0, 44.0, 44.0, 47.0, 26.0, 40.0, 28.0, 25.0, 14.0, 16.0, 14.0, 8.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76171875, -5.55206298828125, -5.3424072265625, -5.13275146484375, -4.923095703125, -4.71343994140625, -4.5037841796875, -4.29412841796875, -4.08447265625, -3.87481689453125, -3.6651611328125, -3.45550537109375, -3.245849609375, -3.03619384765625, -2.8265380859375, -2.61688232421875, -2.4072265625, -2.19757080078125, -1.9879150390625, -1.77825927734375, -1.568603515625, -1.35894775390625, -1.1492919921875, -0.93963623046875, -0.72998046875, -0.52032470703125, -0.3106689453125, -0.10101318359375, 0.108642578125, 0.31829833984375, 0.5279541015625, 0.73760986328125, 0.947265625, 1.15692138671875, 1.3665771484375, 1.57623291015625, 1.785888671875, 1.99554443359375, 2.2052001953125, 2.41485595703125, 2.62451171875, 2.83416748046875, 3.0438232421875, 3.25347900390625, 3.463134765625, 3.67279052734375, 3.8824462890625, 4.09210205078125, 4.3017578125, 4.51141357421875, 4.7210693359375, 4.93072509765625, 5.140380859375, 5.35003662109375, 5.5596923828125, 5.76934814453125, 5.97900390625, 6.18865966796875, 6.3983154296875, 6.60797119140625, 6.817626953125, 7.02728271484375, 7.2369384765625, 7.44659423828125, 7.65625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 2.0, 9.0, 8.0, 16.0, 22.0, 36.0, 53.0, 87.0, 126.0, 197.0, 290.0, 472.0, 694.0, 1200.0, 2200.0, 3932.0, 7713.0, 16000.0, 36441.0, 93699.0, 284273.0, 828644.0, 1414331.0, 969557.0, 345877.0, 109338.0, 41589.0, 18324.0, 8833.0, 4384.0, 2376.0, 1355.0, 829.0, 471.0, 307.0, 199.0, 122.0, 96.0, 64.0, 44.0, 26.0, 18.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12109375, -4.928466796875, -4.73583984375, -4.543212890625, -4.3505859375, -4.157958984375, -3.96533203125, -3.772705078125, -3.580078125, -3.387451171875, -3.19482421875, -3.002197265625, -2.8095703125, -2.616943359375, -2.42431640625, -2.231689453125, -2.0390625, -1.846435546875, -1.65380859375, -1.461181640625, -1.2685546875, -1.075927734375, -0.88330078125, -0.690673828125, -0.498046875, -0.305419921875, -0.11279296875, 0.079833984375, 0.2724609375, 0.465087890625, 0.65771484375, 0.850341796875, 1.04296875, 1.235595703125, 1.42822265625, 1.620849609375, 1.8134765625, 2.006103515625, 2.19873046875, 2.391357421875, 2.583984375, 2.776611328125, 2.96923828125, 3.161865234375, 3.3544921875, 3.547119140625, 3.73974609375, 3.932373046875, 4.125, 4.317626953125, 4.51025390625, 4.702880859375, 4.8955078125, 5.088134765625, 5.28076171875, 5.473388671875, 5.666015625, 5.858642578125, 6.05126953125, 6.243896484375, 6.4365234375, 6.629150390625, 6.82177734375, 7.014404296875, 7.20703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 11.0, 7.0, 18.0, 19.0, 24.0, 27.0, 39.0, 55.0, 71.0, 99.0, 97.0, 137.0, 158.0, 202.0, 284.0, 291.0, 327.0, 387.0, 305.0, 304.0, 264.0, 176.0, 173.0, 123.0, 105.0, 89.0, 64.0, 49.0, 23.0, 40.0, 28.0, 16.0, 17.0, 8.0, 9.0, 8.0, 5.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6796875, -12.3214111328125, -11.963134765625, -11.6048583984375, -11.24658203125, -10.8883056640625, -10.530029296875, -10.1717529296875, -9.8134765625, -9.4552001953125, -9.096923828125, -8.7386474609375, -8.38037109375, -8.0220947265625, -7.663818359375, -7.3055419921875, -6.947265625, -6.5889892578125, -6.230712890625, -5.8724365234375, -5.51416015625, -5.1558837890625, -4.797607421875, -4.4393310546875, -4.0810546875, -3.7227783203125, -3.364501953125, -3.0062255859375, -2.64794921875, -2.2896728515625, -1.931396484375, -1.5731201171875, -1.21484375, -0.8565673828125, -0.498291015625, -0.1400146484375, 0.21826171875, 0.5765380859375, 0.934814453125, 1.2930908203125, 1.6513671875, 2.0096435546875, 2.367919921875, 2.7261962890625, 3.08447265625, 3.4427490234375, 3.801025390625, 4.1593017578125, 4.517578125, 4.8758544921875, 5.234130859375, 5.5924072265625, 5.95068359375, 6.3089599609375, 6.667236328125, 7.0255126953125, 7.3837890625, 7.7420654296875, 8.100341796875, 8.4586181640625, 8.81689453125, 9.1751708984375, 9.533447265625, 9.8917236328125, 10.25]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 3.0, 12.0, 14.0, 16.0, 16.0, 34.0, 44.0, 50.0, 86.0, 97.0, 163.0, 238.0, 517.0, 2441.0, 46765.0, 3386842.0, 741697.0, 13120.0, 1142.0, 359.0, 162.0, 128.0, 82.0, 63.0, 49.0, 33.0, 24.0, 16.0, 13.0, 12.0, 11.0, 5.0, 6.0, 1.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.09375, -40.6328125, -39.171875, -37.7109375, -36.25, -34.7890625, -33.328125, -31.8671875, -30.40625, -28.9453125, -27.484375, -26.0234375, -24.5625, -23.1015625, -21.640625, -20.1796875, -18.71875, -17.2578125, -15.796875, -14.3359375, -12.875, -11.4140625, -9.953125, -8.4921875, -7.03125, -5.5703125, -4.109375, -2.6484375, -1.1875, 0.2734375, 1.734375, 3.1953125, 4.65625, 6.1171875, 7.578125, 9.0390625, 10.5, 11.9609375, 13.421875, 14.8828125, 16.34375, 17.8046875, 19.265625, 20.7265625, 22.1875, 23.6484375, 25.109375, 26.5703125, 28.03125, 29.4921875, 30.953125, 32.4140625, 33.875, 35.3359375, 36.796875, 38.2578125, 39.71875, 41.1796875, 42.640625, 44.1015625, 45.5625, 47.0234375, 48.484375, 49.9453125, 51.40625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 30.0, 99.0, 270.0, 333.0, 184.0, 73.0, 17.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.2979736328125, -201.4225616455078, -195.54714965820312, -189.67173767089844, -183.79632568359375, -177.92091369628906, -172.04550170898438, -166.1700897216797, -160.294677734375, -154.4192657470703, -148.54385375976562, -142.66844177246094, -136.79302978515625, -130.91761779785156, -125.04220581054688, -119.16679382324219, -113.2913818359375, -107.41596984863281, -101.54055786132812, -95.66514587402344, -89.78973388671875, -83.91432189941406, -78.03890991210938, -72.16349792480469, -66.2880859375, -60.41267395019531, -54.537261962890625, -48.66184997558594, -42.78643798828125, -36.91102600097656, -31.035614013671875, -25.160202026367188, -19.284805297851562, -13.409393310546875, -7.5339813232421875, -1.6585693359375, 4.2168426513671875, 10.092254638671875, 15.967666625976562, 21.84307861328125, 27.718490600585938, 33.593902587890625, 39.46931457519531, 45.3447265625, 51.22013854980469, 57.095550537109375, 62.97096252441406, 68.84637451171875, 74.72178649902344, 80.59719848632812, 86.47261047363281, 92.3480224609375, 98.22343444824219, 104.09884643554688, 109.97425842285156, 115.84967041015625, 121.72508239746094, 127.60049438476562, 133.4759063720703, 139.351318359375, 145.2267303466797, 151.10214233398438, 156.97755432128906, 162.85296630859375, 168.72837829589844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 4.0, 7.0, 13.0, 10.0, 11.0, 15.0, 18.0, 19.0, 19.0, 23.0, 28.0, 28.0, 31.0, 28.0, 43.0, 32.0, 35.0, 31.0, 41.0, 34.0, 39.0, 38.0, 43.0, 38.0, 36.0, 34.0, 32.0, 36.0, 34.0, 24.0, 24.0, 26.0, 22.0, 20.0, 15.0, 10.0, 10.0, 7.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.34063720703125, -42.91967010498047, -41.49869918823242, -40.077728271484375, -38.656761169433594, -37.23579406738281, -35.814823150634766, -34.39385223388672, -32.97288513183594, -31.551916122436523, -30.13094711303711, -28.709978103637695, -27.28900909423828, -25.868040084838867, -24.447071075439453, -23.02610206604004, -21.605133056640625, -20.18416404724121, -18.763195037841797, -17.342226028442383, -15.921257019042969, -14.500288009643555, -13.07931900024414, -11.658349990844727, -10.237380981445312, -8.816411972045898, -7.395442962646484, -5.97447395324707, -4.553504943847656, -3.132535934448242, -1.7115669250488281, -0.29059791564941406, 1.13037109375, 2.551340103149414, 3.972309112548828, 5.393278121948242, 6.814247131347656, 8.23521614074707, 9.656185150146484, 11.077154159545898, 12.498123168945312, 13.919092178344727, 15.34006118774414, 16.761030197143555, 18.18199920654297, 19.602968215942383, 21.023937225341797, 22.44490623474121, 23.865875244140625, 25.28684425354004, 26.707813262939453, 28.128782272338867, 29.54975128173828, 30.970720291137695, 32.39168930053711, 33.812660217285156, 35.23362731933594, 36.65459442138672, 38.075565338134766, 39.49653625488281, 40.917503356933594, 42.338470458984375, 43.75944137573242, 45.18041229248047, 46.60137939453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 7.0, 7.0, 18.0, 23.0, 25.0, 15.0, 20.0, 34.0, 41.0, 34.0, 47.0, 52.0, 52.0, 59.0, 39.0, 55.0, 53.0, 37.0, 49.0, 47.0, 35.0, 37.0, 45.0, 31.0, 27.0, 30.0, 19.0, 10.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23828125, -6.01953125, -5.80078125, -5.58203125, -5.36328125, -5.14453125, -4.92578125, -4.70703125, -4.48828125, -4.26953125, -4.05078125, -3.83203125, -3.61328125, -3.39453125, -3.17578125, -2.95703125, -2.73828125, -2.51953125, -2.30078125, -2.08203125, -1.86328125, -1.64453125, -1.42578125, -1.20703125, -0.98828125, -0.76953125, -0.55078125, -0.33203125, -0.11328125, 0.10546875, 0.32421875, 0.54296875, 0.76171875, 0.98046875, 1.19921875, 1.41796875, 1.63671875, 1.85546875, 2.07421875, 2.29296875, 2.51171875, 2.73046875, 2.94921875, 3.16796875, 3.38671875, 3.60546875, 3.82421875, 4.04296875, 4.26171875, 4.48046875, 4.69921875, 4.91796875, 5.13671875, 5.35546875, 5.57421875, 5.79296875, 6.01171875, 6.23046875, 6.44921875, 6.66796875, 6.88671875, 7.10546875, 7.32421875, 7.54296875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 16.0, 27.0, 39.0, 67.0, 69.0, 121.0, 135.0, 233.0, 336.0, 454.0, 639.0, 856.0, 1183.0, 1756.0, 2471.0, 3448.0, 4969.0, 6921.0, 10159.0, 14659.0, 22016.0, 33908.0, 53457.0, 89479.0, 160320.0, 233091.0, 159710.0, 89811.0, 53536.0, 33909.0, 22361.0, 14715.0, 10039.0, 7081.0, 4800.0, 3481.0, 2366.0, 1631.0, 1209.0, 866.0, 676.0, 450.0, 343.0, 209.0, 138.0, 115.0, 77.0, 64.0, 41.0, 33.0, 17.0, 18.0, 6.0, 2.0, 3.0, 4.0, 1.0], "bins": [-0.7626953125, -0.739227294921875, -0.71575927734375, -0.692291259765625, -0.6688232421875, -0.645355224609375, -0.62188720703125, -0.598419189453125, -0.574951171875, -0.551483154296875, -0.52801513671875, -0.504547119140625, -0.4810791015625, -0.457611083984375, -0.43414306640625, -0.410675048828125, -0.38720703125, -0.363739013671875, -0.34027099609375, -0.316802978515625, -0.2933349609375, -0.269866943359375, -0.24639892578125, -0.222930908203125, -0.199462890625, -0.175994873046875, -0.15252685546875, -0.129058837890625, -0.1055908203125, -0.082122802734375, -0.05865478515625, -0.035186767578125, -0.01171875, 0.011749267578125, 0.03521728515625, 0.058685302734375, 0.0821533203125, 0.105621337890625, 0.12908935546875, 0.152557373046875, 0.176025390625, 0.199493408203125, 0.22296142578125, 0.246429443359375, 0.2698974609375, 0.293365478515625, 0.31683349609375, 0.340301513671875, 0.36376953125, 0.387237548828125, 0.41070556640625, 0.434173583984375, 0.4576416015625, 0.481109619140625, 0.50457763671875, 0.528045654296875, 0.551513671875, 0.574981689453125, 0.59844970703125, 0.621917724609375, 0.6453857421875, 0.668853759765625, 0.69232177734375, 0.715789794921875, 0.7392578125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 5.0, 5.0, 6.0, 8.0, 16.0, 12.0, 16.0, 18.0, 16.0, 20.0, 25.0, 27.0, 28.0, 40.0, 27.0, 32.0, 41.0, 41.0, 44.0, 37.0, 1058.0, 24.0, 38.0, 47.0, 38.0, 36.0, 31.0, 37.0, 37.0, 32.0, 18.0, 30.0, 17.0, 22.0, 9.0, 9.0, 14.0, 15.0, 8.0, 10.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.162109375, -3.055755615234375, -2.94940185546875, -2.843048095703125, -2.7366943359375, -2.630340576171875, -2.52398681640625, -2.417633056640625, -2.311279296875, -2.204925537109375, -2.09857177734375, -1.992218017578125, -1.8858642578125, -1.779510498046875, -1.67315673828125, -1.566802978515625, -1.46044921875, -1.354095458984375, -1.24774169921875, -1.141387939453125, -1.0350341796875, -0.928680419921875, -0.82232666015625, -0.715972900390625, -0.609619140625, -0.503265380859375, -0.39691162109375, -0.290557861328125, -0.1842041015625, -0.077850341796875, 0.02850341796875, 0.134857177734375, 0.2412109375, 0.347564697265625, 0.45391845703125, 0.560272216796875, 0.6666259765625, 0.772979736328125, 0.87933349609375, 0.985687255859375, 1.092041015625, 1.198394775390625, 1.30474853515625, 1.411102294921875, 1.5174560546875, 1.623809814453125, 1.73016357421875, 1.836517333984375, 1.94287109375, 2.049224853515625, 2.15557861328125, 2.261932373046875, 2.3682861328125, 2.474639892578125, 2.58099365234375, 2.687347412109375, 2.793701171875, 2.900054931640625, 3.00640869140625, 3.112762451171875, 3.2191162109375, 3.325469970703125, 3.43182373046875, 3.538177490234375, 3.64453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 8.0, 10.0, 12.0, 9.0, 21.0, 33.0, 43.0, 53.0, 93.0, 146.0, 232.0, 324.0, 545.0, 757.0, 1165.0, 1815.0, 2754.0, 4287.0, 6828.0, 10789.0, 17749.0, 29527.0, 50447.0, 90542.0, 173755.0, 1309468.0, 175843.0, 90518.0, 50918.0, 30005.0, 18304.0, 11083.0, 6843.0, 4251.0, 2718.0, 1790.0, 1164.0, 772.0, 498.0, 329.0, 230.0, 132.0, 110.0, 71.0, 35.0, 30.0, 23.0, 16.0, 14.0, 11.0, 2.0, 5.0, 1.0, 5.0, 5.0, 1.0], "bins": [-0.77490234375, -0.7517776489257812, -0.7286529541015625, -0.7055282592773438, -0.682403564453125, -0.6592788696289062, -0.6361541748046875, -0.6130294799804688, -0.58990478515625, -0.5667800903320312, -0.5436553955078125, -0.5205307006835938, -0.497406005859375, -0.47428131103515625, -0.4511566162109375, -0.42803192138671875, -0.4049072265625, -0.38178253173828125, -0.3586578369140625, -0.33553314208984375, -0.312408447265625, -0.28928375244140625, -0.2661590576171875, -0.24303436279296875, -0.21990966796875, -0.19678497314453125, -0.1736602783203125, -0.15053558349609375, -0.127410888671875, -0.10428619384765625, -0.0811614990234375, -0.05803680419921875, -0.034912109375, -0.01178741455078125, 0.0113372802734375, 0.03446197509765625, 0.057586669921875, 0.08071136474609375, 0.1038360595703125, 0.12696075439453125, 0.15008544921875, 0.17321014404296875, 0.1963348388671875, 0.21945953369140625, 0.242584228515625, 0.26570892333984375, 0.2888336181640625, 0.31195831298828125, 0.3350830078125, 0.35820770263671875, 0.3813323974609375, 0.40445709228515625, 0.427581787109375, 0.45070648193359375, 0.4738311767578125, 0.49695587158203125, 0.52008056640625, 0.5432052612304688, 0.5663299560546875, 0.5894546508789062, 0.612579345703125, 0.6357040405273438, 0.6588287353515625, 0.6819534301757812, 0.705078125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 2.0, 12.0, 15.0, 17.0, 22.0, 45.0, 70.0, 85.0, 106.0, 128.0, 108.0, 101.0, 83.0, 62.0, 40.0, 23.0, 20.0, 18.0, 6.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002655029296875, -0.0025481581687927246, -0.0024412870407104492, -0.002334415912628174, -0.0022275447845458984, -0.002120673656463623, -0.0020138025283813477, -0.0019069314002990723, -0.0018000602722167969, -0.0016931891441345215, -0.001586318016052246, -0.0014794468879699707, -0.0013725757598876953, -0.00126570463180542, -0.0011588335037231445, -0.0010519623756408691, -0.0009450912475585938, -0.0008382201194763184, -0.000731348991394043, -0.0006244778633117676, -0.0005176067352294922, -0.0004107356071472168, -0.0003038644790649414, -0.00019699335098266602, -9.012222290039062e-05, 1.6748905181884766e-05, 0.00012362003326416016, 0.00023049116134643555, 0.00033736228942871094, 0.00044423341751098633, 0.0005511045455932617, 0.0006579756736755371, 0.0007648468017578125, 0.0008717179298400879, 0.0009785890579223633, 0.0010854601860046387, 0.001192331314086914, 0.0012992024421691895, 0.0014060735702514648, 0.0015129446983337402, 0.0016198158264160156, 0.001726686954498291, 0.0018335580825805664, 0.0019404292106628418, 0.002047300338745117, 0.0021541714668273926, 0.002261042594909668, 0.0023679137229919434, 0.0024747848510742188, 0.002581655979156494, 0.0026885271072387695, 0.002795398235321045, 0.0029022693634033203, 0.0030091404914855957, 0.003116011619567871, 0.0032228827476501465, 0.003329753875732422, 0.0034366250038146973, 0.0035434961318969727, 0.003650367259979248, 0.0037572383880615234, 0.003864109516143799, 0.003970980644226074, 0.00407785177230835, 0.004184722900390625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 10.0, 18.0, 22.0, 35.0, 39.0, 63.0, 100.0, 178.0, 405.0, 1878.0, 1036122.0, 8540.0, 578.0, 230.0, 112.0, 65.0, 47.0, 27.0, 22.0, 12.0, 11.0, 6.0, 6.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.08642578125, -0.08424615859985352, -0.08206653594970703, -0.07988691329956055, -0.07770729064941406, -0.07552766799926758, -0.0733480453491211, -0.07116842269897461, -0.06898880004882812, -0.06680917739868164, -0.06462955474853516, -0.06244993209838867, -0.06027030944824219, -0.0580906867980957, -0.05591106414794922, -0.053731441497802734, -0.05155181884765625, -0.049372196197509766, -0.04719257354736328, -0.0450129508972168, -0.04283332824707031, -0.04065370559692383, -0.038474082946777344, -0.03629446029663086, -0.034114837646484375, -0.03193521499633789, -0.029755592346191406, -0.027575969696044922, -0.025396347045898438, -0.023216724395751953, -0.02103710174560547, -0.018857479095458984, -0.0166778564453125, -0.014498233795166016, -0.012318611145019531, -0.010138988494873047, -0.007959365844726562, -0.005779743194580078, -0.0036001205444335938, -0.0014204978942871094, 0.000759124755859375, 0.0029387474060058594, 0.005118370056152344, 0.007297992706298828, 0.009477615356445312, 0.011657238006591797, 0.013836860656738281, 0.016016483306884766, 0.01819610595703125, 0.020375728607177734, 0.02255535125732422, 0.024734973907470703, 0.026914596557617188, 0.029094219207763672, 0.031273841857910156, 0.03345346450805664, 0.035633087158203125, 0.03781270980834961, 0.039992332458496094, 0.04217195510864258, 0.04435157775878906, 0.04653120040893555, 0.04871082305908203, 0.050890445709228516, 0.053070068359375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 64.0, 593.0, 333.0, 21.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011174412444233894, -0.010907172225415707, -0.010639931075274944, -0.010372690856456757, -0.010105449706315994, -0.009838209487497807, -0.009570968337357044, -0.009303728118538857, -0.009036486968398094, -0.008769246749579906, -0.008502005599439144, -0.008234765380620956, -0.007967524230480194, -0.007700284011662006, -0.007433043327182531, -0.007165802642703056, -0.006898562423884869, -0.006631321739405394, -0.006364081054925919, -0.0060968403704464436, -0.0058295996859669685, -0.005562359467148781, -0.005295118782669306, -0.005027878098189831, -0.004760637413710356, -0.004493396729230881, -0.004226156044751406, -0.003958915360271931, -0.0036916749086230993, -0.0034244342241436243, -0.003157193772494793, -0.002889953088015318, -0.002622712403535843, -0.002355471719056368, -0.002088231034576893, -0.0018209905829280615, -0.0015537498984485865, -0.0012865092139691114, -0.0010192686459049582, -0.000752028077840805, -0.00048478739336133003, -0.00021754676708951592, 4.9693859182298183e-05, 0.0003169344854541123, 0.0005841751117259264, 0.0008514157962054014, 0.0011186563642695546, 0.0013858969323337078, 0.0016531376168131828, 0.0019203783012926579, 0.002187618985772133, 0.0024548594374209642, 0.0027221001219004393, 0.0029893408063799143, 0.0032565812580287457, 0.0035238219425082207, 0.0037910626269876957, 0.004058303311467171, 0.004325543995946646, 0.004592784680426121, 0.0048600248992443085, 0.005127266049385071, 0.0053945062682032585, 0.0056617469526827335, 0.0059289876371622086]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 15.0, 12.0, 23.0, 23.0, 35.0, 22.0, 30.0, 27.0, 42.0, 37.0, 39.0, 49.0, 39.0, 51.0, 44.0, 47.0, 39.0, 49.0, 34.0, 37.0, 35.0, 38.0, 28.0, 24.0, 29.0, 17.0, 14.0, 17.0, 12.0, 12.0, 6.0, 13.0, 5.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013179183006286621, -0.0012793773785233498, -0.0012408364564180374, -0.001202295534312725, -0.0011637546122074127, -0.0011252136901021004, -0.001086672767996788, -0.0010481318458914757, -0.0010095909237861633, -0.000971050001680851, -0.0009325090795755386, -0.0008939681574702263, -0.0008554272353649139, -0.0008168863132596016, -0.0007783453911542892, -0.0007398044690489769, -0.0007012635469436646, -0.0006627226248383522, -0.0006241817027330399, -0.0005856407806277275, -0.0005470998585224152, -0.0005085589364171028, -0.00047001801431179047, -0.0004314770922064781, -0.00039293617010116577, -0.0003543952479958534, -0.0003158543258905411, -0.00027731340378522873, -0.00023877248167991638, -0.00020023155957460403, -0.0001616906374692917, -0.00012314971536397934, -8.460879325866699e-05, -4.6067871153354645e-05, -7.526949048042297e-06, 3.101397305727005e-05, 6.95548951625824e-05, 0.00010809581726789474, 0.0001466367393732071, 0.00018517766147851944, 0.0002237185835838318, 0.00026225950568914413, 0.0003008004277944565, 0.00033934134989976883, 0.0003778822720050812, 0.0004164231941103935, 0.00045496411621570587, 0.0004935050383210182, 0.0005320459604263306, 0.0005705868825316429, 0.0006091278046369553, 0.0006476687267422676, 0.00068620964884758, 0.0007247505709528923, 0.0007632914930582047, 0.000801832415163517, 0.0008403733372688293, 0.0008789142593741417, 0.000917455181479454, 0.0009559961035847664, 0.0009945370256900787, 0.001033077947795391, 0.0010716188699007034, 0.0011101597920060158, 0.0011487007141113281]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 7.0, 7.0, 18.0, 23.0, 25.0, 15.0, 20.0, 34.0, 41.0, 34.0, 47.0, 52.0, 52.0, 59.0, 39.0, 55.0, 53.0, 37.0, 49.0, 47.0, 35.0, 37.0, 45.0, 31.0, 27.0, 30.0, 19.0, 10.0, 13.0, 11.0, 6.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.45703125, -6.23828125, -6.01953125, -5.80078125, -5.58203125, -5.36328125, -5.14453125, -4.92578125, -4.70703125, -4.48828125, -4.26953125, -4.05078125, -3.83203125, -3.61328125, -3.39453125, -3.17578125, -2.95703125, -2.73828125, -2.51953125, -2.30078125, -2.08203125, -1.86328125, -1.64453125, -1.42578125, -1.20703125, -0.98828125, -0.76953125, -0.55078125, -0.33203125, -0.11328125, 0.10546875, 0.32421875, 0.54296875, 0.76171875, 0.98046875, 1.19921875, 1.41796875, 1.63671875, 1.85546875, 2.07421875, 2.29296875, 2.51171875, 2.73046875, 2.94921875, 3.16796875, 3.38671875, 3.60546875, 3.82421875, 4.04296875, 4.26171875, 4.48046875, 4.69921875, 4.91796875, 5.13671875, 5.35546875, 5.57421875, 5.79296875, 6.01171875, 6.23046875, 6.44921875, 6.66796875, 6.88671875, 7.10546875, 7.32421875, 7.54296875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 8.0, 7.0, 6.0, 14.0, 21.0, 42.0, 44.0, 65.0, 107.0, 169.0, 342.0, 520.0, 849.0, 1391.0, 2405.0, 4223.0, 8492.0, 17510.0, 41938.0, 124829.0, 436218.0, 275946.0, 77416.0, 28696.0, 12733.0, 6349.0, 3389.0, 1938.0, 1153.0, 668.0, 368.0, 243.0, 173.0, 102.0, 61.0, 38.0, 35.0, 23.0, 3.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.04962158203125, -3.9039306640625, -3.75823974609375, -3.612548828125, -3.46685791015625, -3.3211669921875, -3.17547607421875, -3.02978515625, -2.88409423828125, -2.7384033203125, -2.59271240234375, -2.447021484375, -2.30133056640625, -2.1556396484375, -2.00994873046875, -1.8642578125, -1.71856689453125, -1.5728759765625, -1.42718505859375, -1.281494140625, -1.13580322265625, -0.9901123046875, -0.84442138671875, -0.69873046875, -0.55303955078125, -0.4073486328125, -0.26165771484375, -0.115966796875, 0.02972412109375, 0.1754150390625, 0.32110595703125, 0.466796875, 0.61248779296875, 0.7581787109375, 0.90386962890625, 1.049560546875, 1.19525146484375, 1.3409423828125, 1.48663330078125, 1.63232421875, 1.77801513671875, 1.9237060546875, 2.06939697265625, 2.215087890625, 2.36077880859375, 2.5064697265625, 2.65216064453125, 2.7978515625, 2.94354248046875, 3.0892333984375, 3.23492431640625, 3.380615234375, 3.52630615234375, 3.6719970703125, 3.81768798828125, 3.96337890625, 4.10906982421875, 4.2547607421875, 4.40045166015625, 4.546142578125, 4.69183349609375, 4.8375244140625, 4.98321533203125, 5.12890625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 6.0, 1.0, 4.0, 4.0, 12.0, 11.0, 10.0, 14.0, 11.0, 14.0, 16.0, 24.0, 29.0, 26.0, 22.0, 40.0, 36.0, 47.0, 46.0, 40.0, 84.0, 249.0, 1683.0, 143.0, 77.0, 50.0, 30.0, 41.0, 29.0, 35.0, 21.0, 27.0, 33.0, 27.0, 20.0, 20.0, 21.0, 7.0, 7.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-21.140625, -20.524169921875, -19.90771484375, -19.291259765625, -18.6748046875, -18.058349609375, -17.44189453125, -16.825439453125, -16.208984375, -15.592529296875, -14.97607421875, -14.359619140625, -13.7431640625, -13.126708984375, -12.51025390625, -11.893798828125, -11.27734375, -10.660888671875, -10.04443359375, -9.427978515625, -8.8115234375, -8.195068359375, -7.57861328125, -6.962158203125, -6.345703125, -5.729248046875, -5.11279296875, -4.496337890625, -3.8798828125, -3.263427734375, -2.64697265625, -2.030517578125, -1.4140625, -0.797607421875, -0.18115234375, 0.435302734375, 1.0517578125, 1.668212890625, 2.28466796875, 2.901123046875, 3.517578125, 4.134033203125, 4.75048828125, 5.366943359375, 5.9833984375, 6.599853515625, 7.21630859375, 7.832763671875, 8.44921875, 9.065673828125, 9.68212890625, 10.298583984375, 10.9150390625, 11.531494140625, 12.14794921875, 12.764404296875, 13.380859375, 13.997314453125, 14.61376953125, 15.230224609375, 15.8466796875, 16.463134765625, 17.07958984375, 17.696044921875, 18.3125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 9.0, 3.0, 5.0, 7.0, 12.0, 11.0, 24.0, 33.0, 35.0, 57.0, 71.0, 88.0, 151.0, 247.0, 333.0, 1362.0, 48549.0, 3087763.0, 5404.0, 663.0, 262.0, 206.0, 116.0, 77.0, 59.0, 37.0, 33.0, 23.0, 24.0, 18.0, 7.0, 6.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.96875, -55.2041015625, -53.439453125, -51.6748046875, -49.91015625, -48.1455078125, -46.380859375, -44.6162109375, -42.8515625, -41.0869140625, -39.322265625, -37.5576171875, -35.79296875, -34.0283203125, -32.263671875, -30.4990234375, -28.734375, -26.9697265625, -25.205078125, -23.4404296875, -21.67578125, -19.9111328125, -18.146484375, -16.3818359375, -14.6171875, -12.8525390625, -11.087890625, -9.3232421875, -7.55859375, -5.7939453125, -4.029296875, -2.2646484375, -0.5, 1.2646484375, 3.029296875, 4.7939453125, 6.55859375, 8.3232421875, 10.087890625, 11.8525390625, 13.6171875, 15.3818359375, 17.146484375, 18.9111328125, 20.67578125, 22.4404296875, 24.205078125, 25.9697265625, 27.734375, 29.4990234375, 31.263671875, 33.0283203125, 34.79296875, 36.5576171875, 38.322265625, 40.0869140625, 41.8515625, 43.6162109375, 45.380859375, 47.1455078125, 48.91015625, 50.6748046875, 52.439453125, 54.2041015625, 55.96875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 879.0, 129.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.23406219482422, -55.09247970581055, -47.950897216796875, -40.8093147277832, -33.66773223876953, -26.52614974975586, -19.384567260742188, -12.242984771728516, -5.101402282714844, 2.040180206298828, 9.1817626953125, 16.323345184326172, 23.464927673339844, 30.606510162353516, 37.74809265136719, 44.88967514038086, 52.03125762939453, 59.1728401184082, 66.31442260742188, 73.45600891113281, 80.59758758544922, 87.73916625976562, 94.88075256347656, 102.0223388671875, 109.1639175415039, 116.30549621582031, 123.44708251953125, 130.5886688232422, 137.73025512695312, 144.871826171875, 152.01341247558594, 159.15499877929688, 166.29656982421875, 173.4381561279297, 180.57974243164062, 187.7213134765625, 194.86289978027344, 202.00448608398438, 209.14605712890625, 216.2876434326172, 223.42922973632812, 230.57081604003906, 237.71240234375, 244.85397338867188, 251.9955596923828, 259.13714599609375, 266.2787170410156, 273.4203186035156, 280.5618896484375, 287.7034606933594, 294.8450622558594, 301.98663330078125, 309.12823486328125, 316.2698059082031, 323.411376953125, 330.552978515625, 337.6945495605469, 344.83612060546875, 351.97772216796875, 359.1192932128906, 366.2608642578125, 373.4024658203125, 380.5440368652344, 387.6856384277344, 394.82720947265625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 9.0, 12.0, 9.0, 15.0, 13.0, 17.0, 22.0, 20.0, 34.0, 40.0, 25.0, 40.0, 38.0, 43.0, 42.0, 39.0, 28.0, 47.0, 44.0, 48.0, 37.0, 43.0, 35.0, 36.0, 38.0, 23.0, 36.0, 25.0, 32.0, 17.0, 16.0, 13.0, 7.0, 8.0, 9.0, 5.0, 6.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.165687561035156, -48.547115325927734, -46.92854309082031, -45.309967041015625, -43.6913948059082, -42.07282257080078, -40.45425033569336, -38.83567810058594, -37.21710205078125, -35.59852981567383, -33.979957580566406, -32.36138153076172, -30.742809295654297, -29.124237060546875, -27.505664825439453, -25.88709259033203, -24.26852035522461, -22.649948120117188, -21.031373977661133, -19.41280174255371, -17.794227600097656, -16.175655364990234, -14.557083129882812, -12.938509941101074, -11.319936752319336, -9.701363563537598, -8.08279037475586, -6.4642181396484375, -4.845644950866699, -3.227071762084961, -1.608499526977539, 0.010073661804199219, 1.6286430358886719, 3.247215986251831, 4.86578893661499, 6.48436164855957, 8.102934837341309, 9.721508026123047, 11.340080261230469, 12.958653450012207, 14.577226638793945, 16.195798873901367, 17.814373016357422, 19.432945251464844, 21.051517486572266, 22.67009162902832, 24.288663864135742, 25.907238006591797, 27.52581024169922, 29.14438247680664, 30.762956619262695, 32.38153076171875, 34.00010299682617, 35.618675231933594, 37.237247467041016, 38.85581970214844, 40.474395751953125, 42.09296798706055, 43.71154022216797, 45.330116271972656, 46.94868850708008, 48.5672607421875, 50.18583297729492, 51.804405212402344, 53.422977447509766]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 8.0, 9.0, 18.0, 16.0, 22.0, 20.0, 22.0, 33.0, 33.0, 24.0, 55.0, 50.0, 51.0, 55.0, 43.0, 51.0, 52.0, 47.0, 37.0, 39.0, 40.0, 45.0, 34.0, 33.0, 28.0, 34.0, 25.0, 12.0, 12.0, 12.0, 13.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.578125, -6.35888671875, -6.1396484375, -5.92041015625, -5.701171875, -5.48193359375, -5.2626953125, -5.04345703125, -4.82421875, -4.60498046875, -4.3857421875, -4.16650390625, -3.947265625, -3.72802734375, -3.5087890625, -3.28955078125, -3.0703125, -2.85107421875, -2.6318359375, -2.41259765625, -2.193359375, -1.97412109375, -1.7548828125, -1.53564453125, -1.31640625, -1.09716796875, -0.8779296875, -0.65869140625, -0.439453125, -0.22021484375, -0.0009765625, 0.21826171875, 0.4375, 0.65673828125, 0.8759765625, 1.09521484375, 1.314453125, 1.53369140625, 1.7529296875, 1.97216796875, 2.19140625, 2.41064453125, 2.6298828125, 2.84912109375, 3.068359375, 3.28759765625, 3.5068359375, 3.72607421875, 3.9453125, 4.16455078125, 4.3837890625, 4.60302734375, 4.822265625, 5.04150390625, 5.2607421875, 5.47998046875, 5.69921875, 5.91845703125, 6.1376953125, 6.35693359375, 6.576171875, 6.79541015625, 7.0146484375, 7.23388671875, 7.453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 15.0, 12.0, 18.0, 14.0, 16.0, 35.0, 35.0, 55.0, 66.0, 111.0, 160.0, 452.0, 4413.0, 408952.0, 3743609.0, 34200.0, 1382.0, 275.0, 117.0, 77.0, 56.0, 42.0, 40.0, 27.0, 24.0, 22.0, 11.0, 10.0, 1.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.53125, -35.32470703125, -34.1181640625, -32.91162109375, -31.705078125, -30.49853515625, -29.2919921875, -28.08544921875, -26.87890625, -25.67236328125, -24.4658203125, -23.25927734375, -22.052734375, -20.84619140625, -19.6396484375, -18.43310546875, -17.2265625, -16.02001953125, -14.8134765625, -13.60693359375, -12.400390625, -11.19384765625, -9.9873046875, -8.78076171875, -7.57421875, -6.36767578125, -5.1611328125, -3.95458984375, -2.748046875, -1.54150390625, -0.3349609375, 0.87158203125, 2.078125, 3.28466796875, 4.4912109375, 5.69775390625, 6.904296875, 8.11083984375, 9.3173828125, 10.52392578125, 11.73046875, 12.93701171875, 14.1435546875, 15.35009765625, 16.556640625, 17.76318359375, 18.9697265625, 20.17626953125, 21.3828125, 22.58935546875, 23.7958984375, 25.00244140625, 26.208984375, 27.41552734375, 28.6220703125, 29.82861328125, 31.03515625, 32.24169921875, 33.4482421875, 34.65478515625, 35.861328125, 37.06787109375, 38.2744140625, 39.48095703125, 40.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 9.0, 22.0, 21.0, 35.0, 53.0, 85.0, 122.0, 146.0, 216.0, 290.0, 400.0, 479.0, 495.0, 466.0, 343.0, 250.0, 179.0, 123.0, 89.0, 63.0, 50.0, 29.0, 26.0, 21.0, 14.0, 8.0, 5.0, 0.0, 6.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.069580078125, -12.59228515625, -12.114990234375, -11.6376953125, -11.160400390625, -10.68310546875, -10.205810546875, -9.728515625, -9.251220703125, -8.77392578125, -8.296630859375, -7.8193359375, -7.342041015625, -6.86474609375, -6.387451171875, -5.91015625, -5.432861328125, -4.95556640625, -4.478271484375, -4.0009765625, -3.523681640625, -3.04638671875, -2.569091796875, -2.091796875, -1.614501953125, -1.13720703125, -0.659912109375, -0.1826171875, 0.294677734375, 0.77197265625, 1.249267578125, 1.7265625, 2.203857421875, 2.68115234375, 3.158447265625, 3.6357421875, 4.113037109375, 4.59033203125, 5.067626953125, 5.544921875, 6.022216796875, 6.49951171875, 6.976806640625, 7.4541015625, 7.931396484375, 8.40869140625, 8.885986328125, 9.36328125, 9.840576171875, 10.31787109375, 10.795166015625, 11.2724609375, 11.749755859375, 12.22705078125, 12.704345703125, 13.181640625, 13.658935546875, 14.13623046875, 14.613525390625, 15.0908203125, 15.568115234375, 16.04541015625, 16.522705078125, 17.0]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 14.0, 10.0, 12.0, 18.0, 12.0, 27.0, 49.0, 65.0, 85.0, 124.0, 138.0, 230.0, 324.0, 729.0, 4067.0, 154566.0, 3930726.0, 97904.0, 3359.0, 689.0, 329.0, 231.0, 165.0, 106.0, 77.0, 58.0, 40.0, 31.0, 31.0, 20.0, 16.0, 9.0, 6.0, 3.0, 9.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.75, -59.1279296875, -57.505859375, -55.8837890625, -54.26171875, -52.6396484375, -51.017578125, -49.3955078125, -47.7734375, -46.1513671875, -44.529296875, -42.9072265625, -41.28515625, -39.6630859375, -38.041015625, -36.4189453125, -34.796875, -33.1748046875, -31.552734375, -29.9306640625, -28.30859375, -26.6865234375, -25.064453125, -23.4423828125, -21.8203125, -20.1982421875, -18.576171875, -16.9541015625, -15.33203125, -13.7099609375, -12.087890625, -10.4658203125, -8.84375, -7.2216796875, -5.599609375, -3.9775390625, -2.35546875, -0.7333984375, 0.888671875, 2.5107421875, 4.1328125, 5.7548828125, 7.376953125, 8.9990234375, 10.62109375, 12.2431640625, 13.865234375, 15.4873046875, 17.109375, 18.7314453125, 20.353515625, 21.9755859375, 23.59765625, 25.2197265625, 26.841796875, 28.4638671875, 30.0859375, 31.7080078125, 33.330078125, 34.9521484375, 36.57421875, 38.1962890625, 39.818359375, 41.4404296875, 43.0625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 22.0, 111.0, 376.0, 374.0, 114.0, 17.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.62362670898438, -147.85243225097656, -140.0812225341797, -132.31002807617188, -124.53882598876953, -116.76762390136719, -108.99642181396484, -101.2252197265625, -93.45402526855469, -85.68282318115234, -77.91162109375, -70.14042663574219, -62.369224548339844, -54.5980224609375, -46.826820373535156, -39.05562210083008, -31.28441619873047, -23.513216018676758, -15.74201488494873, -7.970813751220703, -0.1996135711669922, 7.571586608886719, 15.342788696289062, 23.11398696899414, 30.885189056396484, 38.65639114379883, 46.427589416503906, 54.19879150390625, 61.969993591308594, 69.74119567871094, 77.51239013671875, 85.2835922241211, 93.05479431152344, 100.82599639892578, 108.59719848632812, 116.36839294433594, 124.13959503173828, 131.91079711914062, 139.6820068359375, 147.4532012939453, 155.22439575195312, 162.99559020996094, 170.7667999267578, 178.53799438476562, 186.3092041015625, 194.0803985595703, 201.85159301757812, 209.622802734375, 217.39401245117188, 225.1652069091797, 232.93641662597656, 240.70761108398438, 248.47882080078125, 256.25, 264.0212097167969, 271.79241943359375, 279.5635986328125, 287.3348083496094, 295.1059875488281, 302.877197265625, 310.6484069824219, 318.41961669921875, 326.1907958984375, 333.9620056152344, 341.73321533203125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 10.0, 7.0, 5.0, 8.0, 7.0, 8.0, 15.0, 24.0, 20.0, 25.0, 39.0, 26.0, 44.0, 50.0, 37.0, 57.0, 55.0, 55.0, 50.0, 46.0, 37.0, 52.0, 48.0, 40.0, 43.0, 33.0, 28.0, 18.0, 24.0, 18.0, 14.0, 21.0, 10.0, 10.0, 6.0, 5.0, 3.0, 8.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-57.649566650390625, -55.94164276123047, -54.23371505737305, -52.525787353515625, -50.81786346435547, -49.10993957519531, -47.40201187133789, -45.69408416748047, -43.98616027832031, -42.278236389160156, -40.570308685302734, -38.86238098144531, -37.154457092285156, -35.446533203125, -33.73860549926758, -32.030677795410156, -30.32275390625, -28.61482810974121, -26.906902313232422, -25.198976516723633, -23.491050720214844, -21.783124923706055, -20.075199127197266, -18.367273330688477, -16.659347534179688, -14.951421737670898, -13.24349594116211, -11.53557014465332, -9.827644348144531, -8.119718551635742, -6.411792755126953, -4.703866958618164, -2.995941162109375, -1.288015365600586, 0.4199104309082031, 2.127836227416992, 3.8357620239257812, 5.54368782043457, 7.251613616943359, 8.959539413452148, 10.667465209960938, 12.375391006469727, 14.083316802978516, 15.791242599487305, 17.499168395996094, 19.207094192504883, 20.915019989013672, 22.62294578552246, 24.33087158203125, 26.03879737854004, 27.746723175048828, 29.454648971557617, 31.162574768066406, 32.87049865722656, 34.578426361083984, 36.286354064941406, 37.99427795410156, 39.70220184326172, 41.41012954711914, 43.11805725097656, 44.82598114013672, 46.533905029296875, 48.2418327331543, 49.94976043701172, 51.657684326171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 14.0, 14.0, 9.0, 13.0, 26.0, 23.0, 39.0, 37.0, 29.0, 33.0, 52.0, 34.0, 58.0, 50.0, 52.0, 49.0, 52.0, 48.0, 50.0, 43.0, 32.0, 37.0, 35.0, 36.0, 15.0, 25.0, 18.0, 15.0, 15.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.37213134765625, -6.1466064453125, -5.92108154296875, -5.695556640625, -5.47003173828125, -5.2445068359375, -5.01898193359375, -4.79345703125, -4.56793212890625, -4.3424072265625, -4.11688232421875, -3.891357421875, -3.66583251953125, -3.4403076171875, -3.21478271484375, -2.9892578125, -2.76373291015625, -2.5382080078125, -2.31268310546875, -2.087158203125, -1.86163330078125, -1.6361083984375, -1.41058349609375, -1.18505859375, -0.95953369140625, -0.7340087890625, -0.50848388671875, -0.282958984375, -0.05743408203125, 0.1680908203125, 0.39361572265625, 0.619140625, 0.84466552734375, 1.0701904296875, 1.29571533203125, 1.521240234375, 1.74676513671875, 1.9722900390625, 2.19781494140625, 2.42333984375, 2.64886474609375, 2.8743896484375, 3.09991455078125, 3.325439453125, 3.55096435546875, 3.7764892578125, 4.00201416015625, 4.2275390625, 4.45306396484375, 4.6785888671875, 4.90411376953125, 5.129638671875, 5.35516357421875, 5.5806884765625, 5.80621337890625, 6.03173828125, 6.25726318359375, 6.4827880859375, 6.70831298828125, 6.933837890625, 7.15936279296875, 7.3848876953125, 7.61041259765625, 7.8359375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 5.0, 17.0, 27.0, 39.0, 57.0, 79.0, 131.0, 176.0, 288.0, 448.0, 741.0, 975.0, 1601.0, 2513.0, 3833.0, 6117.0, 9422.0, 14631.0, 23940.0, 39216.0, 68221.0, 130909.0, 250006.0, 225964.0, 113897.0, 60266.0, 35451.0, 21885.0, 13361.0, 8610.0, 5582.0, 3610.0, 2277.0, 1462.0, 962.0, 615.0, 424.0, 254.0, 201.0, 102.0, 80.0, 54.0, 30.0, 28.0, 14.0, 15.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.94482421875, -0.9152069091796875, -0.885589599609375, -0.8559722900390625, -0.82635498046875, -0.7967376708984375, -0.767120361328125, -0.7375030517578125, -0.7078857421875, -0.6782684326171875, -0.648651123046875, -0.6190338134765625, -0.58941650390625, -0.5597991943359375, -0.530181884765625, -0.5005645751953125, -0.470947265625, -0.4413299560546875, -0.411712646484375, -0.3820953369140625, -0.35247802734375, -0.3228607177734375, -0.293243408203125, -0.2636260986328125, -0.2340087890625, -0.2043914794921875, -0.174774169921875, -0.1451568603515625, -0.11553955078125, -0.0859222412109375, -0.056304931640625, -0.0266876220703125, 0.0029296875, 0.0325469970703125, 0.062164306640625, 0.0917816162109375, 0.12139892578125, 0.1510162353515625, 0.180633544921875, 0.2102508544921875, 0.2398681640625, 0.2694854736328125, 0.299102783203125, 0.3287200927734375, 0.35833740234375, 0.3879547119140625, 0.417572021484375, 0.4471893310546875, 0.476806640625, 0.5064239501953125, 0.536041259765625, 0.5656585693359375, 0.59527587890625, 0.6248931884765625, 0.654510498046875, 0.6841278076171875, 0.7137451171875, 0.7433624267578125, 0.772979736328125, 0.8025970458984375, 0.83221435546875, 0.8618316650390625, 0.891448974609375, 0.9210662841796875, 0.95068359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 4.0, 3.0, 6.0, 12.0, 11.0, 19.0, 13.0, 14.0, 18.0, 18.0, 22.0, 27.0, 36.0, 28.0, 36.0, 40.0, 29.0, 34.0, 34.0, 43.0, 41.0, 1065.0, 37.0, 34.0, 30.0, 52.0, 40.0, 42.0, 36.0, 22.0, 14.0, 23.0, 34.0, 14.0, 12.0, 14.0, 14.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-3.712890625, -3.598358154296875, -3.48382568359375, -3.369293212890625, -3.2547607421875, -3.140228271484375, -3.02569580078125, -2.911163330078125, -2.796630859375, -2.682098388671875, -2.56756591796875, -2.453033447265625, -2.3385009765625, -2.223968505859375, -2.10943603515625, -1.994903564453125, -1.88037109375, -1.765838623046875, -1.65130615234375, -1.536773681640625, -1.4222412109375, -1.307708740234375, -1.19317626953125, -1.078643798828125, -0.964111328125, -0.849578857421875, -0.73504638671875, -0.620513916015625, -0.5059814453125, -0.391448974609375, -0.27691650390625, -0.162384033203125, -0.0478515625, 0.066680908203125, 0.18121337890625, 0.295745849609375, 0.4102783203125, 0.524810791015625, 0.63934326171875, 0.753875732421875, 0.868408203125, 0.982940673828125, 1.09747314453125, 1.212005615234375, 1.3265380859375, 1.441070556640625, 1.55560302734375, 1.670135498046875, 1.78466796875, 1.899200439453125, 2.01373291015625, 2.128265380859375, 2.2427978515625, 2.357330322265625, 2.47186279296875, 2.586395263671875, 2.700927734375, 2.815460205078125, 2.92999267578125, 3.044525146484375, 3.1590576171875, 3.273590087890625, 3.38812255859375, 3.502655029296875, 3.6171875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 21.0, 25.0, 27.0, 49.0, 82.0, 119.0, 130.0, 213.0, 272.0, 358.0, 485.0, 669.0, 901.0, 1276.0, 1807.0, 2561.0, 3769.0, 5194.0, 7437.0, 10993.0, 16256.0, 24786.0, 37790.0, 60623.0, 102934.0, 178690.0, 1266940.0, 143266.0, 81989.0, 49412.0, 31986.0, 20983.0, 13904.0, 9283.0, 6504.0, 4427.0, 3241.0, 2141.0, 1554.0, 1110.0, 775.0, 587.0, 430.0, 315.0, 241.0, 167.0, 127.0, 93.0, 62.0, 37.0, 33.0, 21.0, 10.0, 9.0, 3.0, 3.0, 3.0, 2.0], "bins": [-0.6201171875, -0.6009140014648438, -0.5817108154296875, -0.5625076293945312, -0.543304443359375, -0.5241012573242188, -0.5048980712890625, -0.48569488525390625, -0.46649169921875, -0.44728851318359375, -0.4280853271484375, -0.40888214111328125, -0.389678955078125, -0.37047576904296875, -0.3512725830078125, -0.33206939697265625, -0.3128662109375, -0.29366302490234375, -0.2744598388671875, -0.25525665283203125, -0.236053466796875, -0.21685028076171875, -0.1976470947265625, -0.17844390869140625, -0.15924072265625, -0.14003753662109375, -0.1208343505859375, -0.10163116455078125, -0.082427978515625, -0.06322479248046875, -0.0440216064453125, -0.02481842041015625, -0.005615234375, 0.01358795166015625, 0.0327911376953125, 0.05199432373046875, 0.071197509765625, 0.09040069580078125, 0.1096038818359375, 0.12880706787109375, 0.14801025390625, 0.16721343994140625, 0.1864166259765625, 0.20561981201171875, 0.224822998046875, 0.24402618408203125, 0.2632293701171875, 0.28243255615234375, 0.3016357421875, 0.32083892822265625, 0.3400421142578125, 0.35924530029296875, 0.378448486328125, 0.39765167236328125, 0.4168548583984375, 0.43605804443359375, 0.45526123046875, 0.47446441650390625, 0.4936676025390625, 0.5128707885742188, 0.532073974609375, 0.5512771606445312, 0.5704803466796875, 0.5896835327148438, 0.60888671875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 7.0, 12.0, 11.0, 19.0, 18.0, 26.0, 27.0, 23.0, 31.0, 39.0, 63.0, 57.0, 60.0, 61.0, 54.0, 61.0, 61.0, 50.0, 53.0, 43.0, 40.0, 36.0, 21.0, 21.0, 12.0, 20.0, 11.0, 9.0, 11.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020503997802734375, -0.001985311508178711, -0.0019202232360839844, -0.0018551349639892578, -0.0017900466918945312, -0.0017249584197998047, -0.0016598701477050781, -0.0015947818756103516, -0.001529693603515625, -0.0014646053314208984, -0.0013995170593261719, -0.0013344287872314453, -0.0012693405151367188, -0.0012042522430419922, -0.0011391639709472656, -0.001074075698852539, -0.0010089874267578125, -0.0009438991546630859, -0.0008788108825683594, -0.0008137226104736328, -0.0007486343383789062, -0.0006835460662841797, -0.0006184577941894531, -0.0005533695220947266, -0.00048828125, -0.00042319297790527344, -0.0003581047058105469, -0.0002930164337158203, -0.00022792816162109375, -0.0001628398895263672, -9.775161743164062e-05, -3.266334533691406e-05, 3.24249267578125e-05, 9.751319885253906e-05, 0.00016260147094726562, 0.0002276897430419922, 0.00029277801513671875, 0.0003578662872314453, 0.0004229545593261719, 0.00048804283142089844, 0.000553131103515625, 0.0006182193756103516, 0.0006833076477050781, 0.0007483959197998047, 0.0008134841918945312, 0.0008785724639892578, 0.0009436607360839844, 0.001008749008178711, 0.0010738372802734375, 0.001138925552368164, 0.0012040138244628906, 0.0012691020965576172, 0.0013341903686523438, 0.0013992786407470703, 0.0014643669128417969, 0.0015294551849365234, 0.00159454345703125, 0.0016596317291259766, 0.0017247200012207031, 0.0017898082733154297, 0.0018548965454101562, 0.0019199848175048828, 0.0019850730895996094, 0.002050161361694336, 0.0021152496337890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 9.0, 8.0, 14.0, 8.0, 20.0, 15.0, 23.0, 37.0, 38.0, 60.0, 84.0, 121.0, 188.0, 288.0, 711.0, 5853.0, 992997.0, 45896.0, 1051.0, 412.0, 200.0, 144.0, 90.0, 58.0, 39.0, 32.0, 27.0, 26.0, 24.0, 11.0, 15.0, 9.0, 5.0, 5.0, 5.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.044281005859375, -0.04296588897705078, -0.04165077209472656, -0.040335655212402344, -0.039020538330078125, -0.037705421447753906, -0.03639030456542969, -0.03507518768310547, -0.03376007080078125, -0.03244495391845703, -0.031129837036132812, -0.029814720153808594, -0.028499603271484375, -0.027184486389160156, -0.025869369506835938, -0.02455425262451172, -0.0232391357421875, -0.02192401885986328, -0.020608901977539062, -0.019293785095214844, -0.017978668212890625, -0.016663551330566406, -0.015348434448242188, -0.014033317565917969, -0.01271820068359375, -0.011403083801269531, -0.010087966918945312, -0.008772850036621094, -0.007457733154296875, -0.006142616271972656, -0.0048274993896484375, -0.0035123825073242188, -0.002197265625, -0.0008821487426757812, 0.0004329681396484375, 0.0017480850219726562, 0.003063201904296875, 0.004378318786621094, 0.0056934356689453125, 0.007008552551269531, 0.00832366943359375, 0.009638786315917969, 0.010953903198242188, 0.012269020080566406, 0.013584136962890625, 0.014899253845214844, 0.016214370727539062, 0.01752948760986328, 0.0188446044921875, 0.02015972137451172, 0.021474838256835938, 0.022789955139160156, 0.024105072021484375, 0.025420188903808594, 0.026735305786132812, 0.02805042266845703, 0.02936553955078125, 0.03068065643310547, 0.03199577331542969, 0.033310890197753906, 0.034626007080078125, 0.035941123962402344, 0.03725624084472656, 0.03857135772705078, 0.039886474609375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 75.0, 501.0, 393.0, 39.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01471426896750927, -0.014460316859185696, -0.014206363819539547, -0.013952411711215973, -0.013698458671569824, -0.01344450656324625, -0.013190554454922676, -0.012936601415276527, -0.012682649306952953, -0.01242869719862938, -0.01217474415898323, -0.011920792050659657, -0.011666839011013508, -0.011412886902689934, -0.011158933863043785, -0.010904981754720211, -0.010651029646396637, -0.010397077538073063, -0.010143124498426914, -0.00988917239010334, -0.009635219350457191, -0.009381267242133617, -0.009127315133810043, -0.008873362094163895, -0.008619409054517746, -0.008365456946194172, -0.008111503906548023, -0.00785755179822445, -0.007603599224239588, -0.007349646650254726, -0.007095694076269865, -0.006841741502285004, -0.00658778939396143, -0.006333836819976568, -0.006079884245991707, -0.005825932137668133, -0.005571979563683271, -0.00531802698969841, -0.005064074415713549, -0.004810121841728687, -0.004556169267743826, -0.0043022166937589645, -0.004048264119774103, -0.0037943117786198854, -0.0035403594374656677, -0.0032864068634808064, -0.003032454289495945, -0.0027785017155110836, -0.002524549374356866, -0.0022705968003720045, -0.002016644459217787, -0.0017626918852329254, -0.0015087394276633859, -0.0012547869700938463, -0.001000834396108985, -0.0007468819385394454, -0.0004929294809699059, -0.00023897699429653585, 1.4975492376834154e-05, 0.0002689280081540346, 0.0005228804657235742, 0.0007768329232931137, 0.001030785497277975, 0.0012847379548475146, 0.0015386904124170542]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 9.0, 6.0, 3.0, 9.0, 4.0, 16.0, 11.0, 17.0, 30.0, 20.0, 27.0, 23.0, 29.0, 43.0, 37.0, 33.0, 57.0, 29.0, 42.0, 43.0, 43.0, 41.0, 37.0, 45.0, 43.0, 33.0, 28.0, 34.0, 28.0, 22.0, 28.0, 13.0, 21.0, 18.0, 21.0, 13.0, 10.0, 6.0, 6.0, 7.0, 9.0, 5.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010458827018737793, -0.001012478955090046, -0.0009790752083063126, -0.0009456714615225792, -0.0009122677147388458, -0.0008788639679551125, -0.0008454602211713791, -0.0008120564743876457, -0.0007786527276039124, -0.000745248980820179, -0.0007118452340364456, -0.0006784414872527122, -0.0006450377404689789, -0.0006116339936852455, -0.0005782302469015121, -0.0005448265001177788, -0.0005114227533340454, -0.00047801900655031204, -0.0004446152597665787, -0.0004112115129828453, -0.00037780776619911194, -0.00034440401941537857, -0.0003110002726316452, -0.00027759652584791183, -0.00024419277906417847, -0.0002107890322804451, -0.00017738528549671173, -0.00014398153871297836, -0.000110577791929245, -7.717404514551163e-05, -4.377029836177826e-05, -1.0366551578044891e-05, 2.3037195205688477e-05, 5.6440941989421844e-05, 8.984468877315521e-05, 0.00012324843555688858, 0.00015665218234062195, 0.00019005592912435532, 0.00022345967590808868, 0.00025686342269182205, 0.0002902671694755554, 0.0003236709162592888, 0.00035707466304302216, 0.0003904784098267555, 0.0004238821566104889, 0.00045728590339422226, 0.0004906896501779556, 0.000524093396961689, 0.0005574971437454224, 0.0005909008905291557, 0.0006243046373128891, 0.0006577083840966225, 0.0006911121308803558, 0.0007245158776640892, 0.0007579196244478226, 0.0007913233712315559, 0.0008247271180152893, 0.0008581308647990227, 0.000891534611582756, 0.0009249383583664894, 0.0009583421051502228, 0.0009917458519339561, 0.0010251495987176895, 0.0010585533455014229, 0.0010919570922851562]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 14.0, 14.0, 9.0, 13.0, 26.0, 23.0, 39.0, 37.0, 29.0, 33.0, 52.0, 34.0, 58.0, 50.0, 52.0, 49.0, 52.0, 48.0, 50.0, 43.0, 32.0, 37.0, 35.0, 36.0, 15.0, 25.0, 18.0, 15.0, 15.0, 7.0, 8.0, 8.0, 7.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.37213134765625, -6.1466064453125, -5.92108154296875, -5.695556640625, -5.47003173828125, -5.2445068359375, -5.01898193359375, -4.79345703125, -4.56793212890625, -4.3424072265625, -4.11688232421875, -3.891357421875, -3.66583251953125, -3.4403076171875, -3.21478271484375, -2.9892578125, -2.76373291015625, -2.5382080078125, -2.31268310546875, -2.087158203125, -1.86163330078125, -1.6361083984375, -1.41058349609375, -1.18505859375, -0.95953369140625, -0.7340087890625, -0.50848388671875, -0.282958984375, -0.05743408203125, 0.1680908203125, 0.39361572265625, 0.619140625, 0.84466552734375, 1.0701904296875, 1.29571533203125, 1.521240234375, 1.74676513671875, 1.9722900390625, 2.19781494140625, 2.42333984375, 2.64886474609375, 2.8743896484375, 3.09991455078125, 3.325439453125, 3.55096435546875, 3.7764892578125, 4.00201416015625, 4.2275390625, 4.45306396484375, 4.6785888671875, 4.90411376953125, 5.129638671875, 5.35516357421875, 5.5806884765625, 5.80621337890625, 6.03173828125, 6.25726318359375, 6.4827880859375, 6.70831298828125, 6.933837890625, 7.15936279296875, 7.3848876953125, 7.61041259765625, 7.8359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 4.0, 2.0, 6.0, 12.0, 18.0, 15.0, 31.0, 38.0, 53.0, 75.0, 114.0, 172.0, 252.0, 403.0, 594.0, 897.0, 1377.0, 2147.0, 3382.0, 5434.0, 8461.0, 14366.0, 26787.0, 59989.0, 166177.0, 423137.0, 195597.0, 68331.0, 29928.0, 15674.0, 9200.0, 5609.0, 3611.0, 2355.0, 1420.0, 1001.0, 609.0, 454.0, 249.0, 178.0, 128.0, 76.0, 58.0, 43.0, 29.0, 25.0, 14.0, 10.0, 8.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.173828125, -3.062744140625, -2.95166015625, -2.840576171875, -2.7294921875, -2.618408203125, -2.50732421875, -2.396240234375, -2.28515625, -2.174072265625, -2.06298828125, -1.951904296875, -1.8408203125, -1.729736328125, -1.61865234375, -1.507568359375, -1.396484375, -1.285400390625, -1.17431640625, -1.063232421875, -0.9521484375, -0.841064453125, -0.72998046875, -0.618896484375, -0.5078125, -0.396728515625, -0.28564453125, -0.174560546875, -0.0634765625, 0.047607421875, 0.15869140625, 0.269775390625, 0.380859375, 0.491943359375, 0.60302734375, 0.714111328125, 0.8251953125, 0.936279296875, 1.04736328125, 1.158447265625, 1.26953125, 1.380615234375, 1.49169921875, 1.602783203125, 1.7138671875, 1.824951171875, 1.93603515625, 2.047119140625, 2.158203125, 2.269287109375, 2.38037109375, 2.491455078125, 2.6025390625, 2.713623046875, 2.82470703125, 2.935791015625, 3.046875, 3.157958984375, 3.26904296875, 3.380126953125, 3.4912109375, 3.602294921875, 3.71337890625, 3.824462890625, 3.935546875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 7.0, 9.0, 14.0, 17.0, 18.0, 16.0, 27.0, 16.0, 35.0, 25.0, 32.0, 38.0, 44.0, 48.0, 63.0, 81.0, 121.0, 1548.0, 308.0, 92.0, 77.0, 47.0, 49.0, 42.0, 40.0, 38.0, 20.0, 18.0, 21.0, 25.0, 16.0, 11.0, 14.0, 11.0, 10.0, 9.0, 4.0, 8.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0], "bins": [-23.65625, -22.97802734375, -22.2998046875, -21.62158203125, -20.943359375, -20.26513671875, -19.5869140625, -18.90869140625, -18.23046875, -17.55224609375, -16.8740234375, -16.19580078125, -15.517578125, -14.83935546875, -14.1611328125, -13.48291015625, -12.8046875, -12.12646484375, -11.4482421875, -10.77001953125, -10.091796875, -9.41357421875, -8.7353515625, -8.05712890625, -7.37890625, -6.70068359375, -6.0224609375, -5.34423828125, -4.666015625, -3.98779296875, -3.3095703125, -2.63134765625, -1.953125, -1.27490234375, -0.5966796875, 0.08154296875, 0.759765625, 1.43798828125, 2.1162109375, 2.79443359375, 3.47265625, 4.15087890625, 4.8291015625, 5.50732421875, 6.185546875, 6.86376953125, 7.5419921875, 8.22021484375, 8.8984375, 9.57666015625, 10.2548828125, 10.93310546875, 11.611328125, 12.28955078125, 12.9677734375, 13.64599609375, 14.32421875, 15.00244140625, 15.6806640625, 16.35888671875, 17.037109375, 17.71533203125, 18.3935546875, 19.07177734375, 19.75]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 2.0, 13.0, 10.0, 10.0, 13.0, 28.0, 25.0, 32.0, 55.0, 90.0, 127.0, 202.0, 444.0, 1220.0, 18333.0, 3112990.0, 10108.0, 1051.0, 360.0, 210.0, 119.0, 77.0, 54.0, 34.0, 30.0, 12.0, 10.0, 9.0, 11.0, 8.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-69.5625, -67.1162109375, -64.669921875, -62.2236328125, -59.77734375, -57.3310546875, -54.884765625, -52.4384765625, -49.9921875, -47.5458984375, -45.099609375, -42.6533203125, -40.20703125, -37.7607421875, -35.314453125, -32.8681640625, -30.421875, -27.9755859375, -25.529296875, -23.0830078125, -20.63671875, -18.1904296875, -15.744140625, -13.2978515625, -10.8515625, -8.4052734375, -5.958984375, -3.5126953125, -1.06640625, 1.3798828125, 3.826171875, 6.2724609375, 8.71875, 11.1650390625, 13.611328125, 16.0576171875, 18.50390625, 20.9501953125, 23.396484375, 25.8427734375, 28.2890625, 30.7353515625, 33.181640625, 35.6279296875, 38.07421875, 40.5205078125, 42.966796875, 45.4130859375, 47.859375, 50.3056640625, 52.751953125, 55.1982421875, 57.64453125, 60.0908203125, 62.537109375, 64.9833984375, 67.4296875, 69.8759765625, 72.322265625, 74.7685546875, 77.21484375, 79.6611328125, 82.107421875, 84.5537109375, 87.0]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 801.0, 193.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.54315948486328, -65.83824920654297, -56.133338928222656, -46.42842483520508, -36.723514556884766, -27.018604278564453, -17.313690185546875, -7.6087799072265625, 2.09613037109375, 11.801041603088379, 21.505952835083008, 31.210865020751953, 40.915775299072266, 50.62068557739258, 60.325599670410156, 70.03050994873047, 79.73542022705078, 89.4403305053711, 99.1452407836914, 108.85015869140625, 118.55506896972656, 128.25997924804688, 137.9648895263672, 147.6697998046875, 157.3747100830078, 167.07962036132812, 176.78453063964844, 186.48944091796875, 196.19435119628906, 205.89926147460938, 215.60418701171875, 225.30908203125, 235.01400756835938, 244.7189178466797, 254.423828125, 264.1287536621094, 273.8336486816406, 283.53857421875, 293.24346923828125, 302.9483947753906, 312.6532897949219, 322.35821533203125, 332.0631103515625, 341.7680358886719, 351.4729309082031, 361.1778564453125, 370.88275146484375, 380.5876770019531, 390.2926025390625, 399.9975280761719, 409.7024230957031, 419.4073486328125, 429.11224365234375, 438.8171691894531, 448.5220642089844, 458.22698974609375, 467.931884765625, 477.6368103027344, 487.3417053222656, 497.046630859375, 506.75152587890625, 516.4564208984375, 526.161376953125, 535.8662719726562, 545.5711669921875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 7.0, 10.0, 10.0, 16.0, 20.0, 26.0, 19.0, 23.0, 26.0, 17.0, 36.0, 44.0, 37.0, 39.0, 32.0, 30.0, 36.0, 44.0, 40.0, 39.0, 40.0, 36.0, 36.0, 43.0, 38.0, 21.0, 25.0, 22.0, 34.0, 29.0, 16.0, 15.0, 13.0, 11.0, 11.0, 11.0, 9.0, 7.0, 3.0, 5.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-67.44723510742188, -65.40769958496094, -63.368160247802734, -61.32862091064453, -59.289085388183594, -57.24954605102539, -55.21000671386719, -53.17047119140625, -51.13093566894531, -49.09139633178711, -47.05186080932617, -45.01232147216797, -42.97278594970703, -40.93324661254883, -38.893707275390625, -36.85417175292969, -34.814632415771484, -32.77509307861328, -30.735557556152344, -28.69601821899414, -26.656482696533203, -24.616943359375, -22.57740592956543, -20.53786849975586, -18.49833106994629, -16.45879364013672, -14.419256210327148, -12.379717826843262, -10.340180397033691, -8.300642967224121, -6.261104583740234, -4.221567153930664, -2.1820297241210938, -0.14249205589294434, 1.897045612335205, 3.9365835189819336, 5.976120948791504, 8.015658378601074, 10.055196762084961, 12.094734191894531, 14.134271621704102, 16.173809051513672, 18.213346481323242, 20.252883911132812, 22.292423248291016, 24.331958770751953, 26.371498107910156, 28.411035537719727, 30.450572967529297, 32.4901123046875, 34.52964782714844, 36.56918716430664, 38.60872268676758, 40.64826202392578, 42.68779754638672, 44.72733688354492, 46.766876220703125, 48.80641555786133, 50.845951080322266, 52.88549041748047, 54.925025939941406, 56.96456527709961, 59.00410461425781, 61.04364013671875, 63.08317565917969]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 18.0, 16.0, 17.0, 18.0, 27.0, 31.0, 37.0, 39.0, 40.0, 41.0, 50.0, 48.0, 46.0, 60.0, 60.0, 53.0, 46.0, 38.0, 53.0, 32.0, 31.0, 36.0, 24.0, 24.0, 22.0, 15.0, 13.0, 10.0, 16.0, 9.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6015625, -7.3544921875, -7.107421875, -6.8603515625, -6.61328125, -6.3662109375, -6.119140625, -5.8720703125, -5.625, -5.3779296875, -5.130859375, -4.8837890625, -4.63671875, -4.3896484375, -4.142578125, -3.8955078125, -3.6484375, -3.4013671875, -3.154296875, -2.9072265625, -2.66015625, -2.4130859375, -2.166015625, -1.9189453125, -1.671875, -1.4248046875, -1.177734375, -0.9306640625, -0.68359375, -0.4365234375, -0.189453125, 0.0576171875, 0.3046875, 0.5517578125, 0.798828125, 1.0458984375, 1.29296875, 1.5400390625, 1.787109375, 2.0341796875, 2.28125, 2.5283203125, 2.775390625, 3.0224609375, 3.26953125, 3.5166015625, 3.763671875, 4.0107421875, 4.2578125, 4.5048828125, 4.751953125, 4.9990234375, 5.24609375, 5.4931640625, 5.740234375, 5.9873046875, 6.234375, 6.4814453125, 6.728515625, 6.9755859375, 7.22265625, 7.4697265625, 7.716796875, 7.9638671875, 8.2109375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 11.0, 17.0, 25.0, 20.0, 38.0, 59.0, 66.0, 140.0, 159.0, 281.0, 453.0, 864.0, 1805.0, 4162.0, 11735.0, 40589.0, 207808.0, 1081902.0, 1950527.0, 725578.0, 124954.0, 27900.0, 8606.0, 3237.0, 1463.0, 708.0, 419.0, 245.0, 163.0, 97.0, 66.0, 55.0, 33.0, 25.0, 29.0, 13.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-11.5, -11.1837158203125, -10.867431640625, -10.5511474609375, -10.23486328125, -9.9185791015625, -9.602294921875, -9.2860107421875, -8.9697265625, -8.6534423828125, -8.337158203125, -8.0208740234375, -7.70458984375, -7.3883056640625, -7.072021484375, -6.7557373046875, -6.439453125, -6.1231689453125, -5.806884765625, -5.4906005859375, -5.17431640625, -4.8580322265625, -4.541748046875, -4.2254638671875, -3.9091796875, -3.5928955078125, -3.276611328125, -2.9603271484375, -2.64404296875, -2.3277587890625, -2.011474609375, -1.6951904296875, -1.37890625, -1.0626220703125, -0.746337890625, -0.4300537109375, -0.11376953125, 0.2025146484375, 0.518798828125, 0.8350830078125, 1.1513671875, 1.4676513671875, 1.783935546875, 2.1002197265625, 2.41650390625, 2.7327880859375, 3.049072265625, 3.3653564453125, 3.681640625, 3.9979248046875, 4.314208984375, 4.6304931640625, 4.94677734375, 5.2630615234375, 5.579345703125, 5.8956298828125, 6.2119140625, 6.5281982421875, 6.844482421875, 7.1607666015625, 7.47705078125, 7.7933349609375, 8.109619140625, 8.4259033203125, 8.7421875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 12.0, 14.0, 16.0, 19.0, 18.0, 27.0, 49.0, 64.0, 84.0, 108.0, 124.0, 176.0, 220.0, 290.0, 336.0, 374.0, 362.0, 363.0, 275.0, 258.0, 197.0, 145.0, 103.0, 93.0, 84.0, 50.0, 41.0, 39.0, 23.0, 17.0, 13.0, 12.0, 21.0, 13.0, 4.0, 10.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.984375, -8.6134033203125, -8.242431640625, -7.8714599609375, -7.50048828125, -7.1295166015625, -6.758544921875, -6.3875732421875, -6.0166015625, -5.6456298828125, -5.274658203125, -4.9036865234375, -4.53271484375, -4.1617431640625, -3.790771484375, -3.4197998046875, -3.048828125, -2.6778564453125, -2.306884765625, -1.9359130859375, -1.56494140625, -1.1939697265625, -0.822998046875, -0.4520263671875, -0.0810546875, 0.2899169921875, 0.660888671875, 1.0318603515625, 1.40283203125, 1.7738037109375, 2.144775390625, 2.5157470703125, 2.88671875, 3.2576904296875, 3.628662109375, 3.9996337890625, 4.37060546875, 4.7415771484375, 5.112548828125, 5.4835205078125, 5.8544921875, 6.2254638671875, 6.596435546875, 6.9674072265625, 7.33837890625, 7.7093505859375, 8.080322265625, 8.4512939453125, 8.822265625, 9.1932373046875, 9.564208984375, 9.9351806640625, 10.30615234375, 10.6771240234375, 11.048095703125, 11.4190673828125, 11.7900390625, 12.1610107421875, 12.531982421875, 12.9029541015625, 13.27392578125, 13.6448974609375, 14.015869140625, 14.3868408203125, 14.7578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 12.0, 6.0, 5.0, 14.0, 14.0, 28.0, 27.0, 25.0, 33.0, 45.0, 69.0, 83.0, 105.0, 142.0, 188.0, 292.0, 498.0, 1342.0, 10460.0, 332588.0, 3699503.0, 140435.0, 5998.0, 984.0, 454.0, 248.0, 169.0, 113.0, 85.0, 67.0, 54.0, 45.0, 27.0, 22.0, 28.0, 17.0, 15.0, 9.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.96875, -36.75927734375, -35.5498046875, -34.34033203125, -33.130859375, -31.92138671875, -30.7119140625, -29.50244140625, -28.29296875, -27.08349609375, -25.8740234375, -24.66455078125, -23.455078125, -22.24560546875, -21.0361328125, -19.82666015625, -18.6171875, -17.40771484375, -16.1982421875, -14.98876953125, -13.779296875, -12.56982421875, -11.3603515625, -10.15087890625, -8.94140625, -7.73193359375, -6.5224609375, -5.31298828125, -4.103515625, -2.89404296875, -1.6845703125, -0.47509765625, 0.734375, 1.94384765625, 3.1533203125, 4.36279296875, 5.572265625, 6.78173828125, 7.9912109375, 9.20068359375, 10.41015625, 11.61962890625, 12.8291015625, 14.03857421875, 15.248046875, 16.45751953125, 17.6669921875, 18.87646484375, 20.0859375, 21.29541015625, 22.5048828125, 23.71435546875, 24.923828125, 26.13330078125, 27.3427734375, 28.55224609375, 29.76171875, 30.97119140625, 32.1806640625, 33.39013671875, 34.599609375, 35.80908203125, 37.0185546875, 38.22802734375, 39.4375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 17.0, 24.0, 49.0, 58.0, 108.0, 117.0, 112.0, 149.0, 133.0, 102.0, 57.0, 37.0, 22.0, 7.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.56111145019531, -62.14396286010742, -59.726810455322266, -57.309661865234375, -54.89250946044922, -52.47536087036133, -50.05821228027344, -47.64105987548828, -45.223907470703125, -42.806758880615234, -40.38960647583008, -37.97245788574219, -35.55530548095703, -33.13815689086914, -30.721006393432617, -28.303855895996094, -25.886707305908203, -23.46955680847168, -21.052406311035156, -18.635257720947266, -16.21810531616211, -13.800955772399902, -11.383806228637695, -8.966655731201172, -6.549505233764648, -4.132354736328125, -1.7152047157287598, 0.7019453048706055, 3.119095802307129, 5.536246299743652, 7.953395843505859, 10.370546340942383, 12.787696838378906, 15.20484733581543, 17.621997833251953, 20.039146423339844, 22.456298828125, 24.87344741821289, 27.290597915649414, 29.707748413085938, 32.124900817871094, 34.542049407958984, 36.95920181274414, 39.37635040283203, 41.79350280761719, 44.21065139770508, 46.62779998779297, 49.044952392578125, 51.462100982666016, 53.879249572753906, 56.29640197753906, 58.71355056762695, 61.13070297241211, 63.5478515625, 65.96500396728516, 68.38215637207031, 70.79930114746094, 73.2164535522461, 75.63359832763672, 78.05075073242188, 80.46790313720703, 82.88505554199219, 85.30220031738281, 87.71935272216797, 90.13650512695312]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 7.0, 13.0, 7.0, 19.0, 19.0, 10.0, 21.0, 28.0, 41.0, 30.0, 36.0, 30.0, 52.0, 59.0, 45.0, 59.0, 50.0, 43.0, 46.0, 47.0, 41.0, 44.0, 37.0, 32.0, 30.0, 24.0, 23.0, 17.0, 23.0, 14.0, 16.0, 8.0, 6.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.367523193359375, -60.69341278076172, -59.01930618286133, -57.34519958496094, -55.67108917236328, -53.996978759765625, -52.322872161865234, -50.648765563964844, -48.97465515136719, -47.30054473876953, -45.62643814086914, -43.95233154296875, -42.278221130371094, -40.60411071777344, -38.93000411987305, -37.255897521972656, -35.581787109375, -33.907676696777344, -32.23357009887695, -30.55946159362793, -28.885353088378906, -27.211244583129883, -25.53713607788086, -23.863027572631836, -22.188919067382812, -20.51481056213379, -18.840702056884766, -17.166593551635742, -15.492485046386719, -13.818376541137695, -12.144268035888672, -10.470159530639648, -8.796051025390625, -7.121942520141602, -5.447834014892578, -3.7737255096435547, -2.0996170043945312, -0.4255084991455078, 1.2486000061035156, 2.922708511352539, 4.5968170166015625, 6.270925521850586, 7.945034027099609, 9.619142532348633, 11.293251037597656, 12.96735954284668, 14.641468048095703, 16.315576553344727, 17.98968505859375, 19.663793563842773, 21.337902069091797, 23.01201057434082, 24.686119079589844, 26.360227584838867, 28.03433609008789, 29.708444595336914, 31.382553100585938, 33.056663513183594, 34.730770111083984, 36.404876708984375, 38.07898712158203, 39.75309753417969, 41.42720413208008, 43.10131072998047, 44.775421142578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 4.0, 14.0, 14.0, 15.0, 16.0, 29.0, 26.0, 33.0, 32.0, 37.0, 47.0, 39.0, 42.0, 58.0, 49.0, 41.0, 47.0, 51.0, 51.0, 45.0, 43.0, 48.0, 32.0, 33.0, 21.0, 18.0, 17.0, 18.0, 21.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.56231689453125, -7.3238525390625, -7.08538818359375, -6.846923828125, -6.60845947265625, -6.3699951171875, -6.13153076171875, -5.89306640625, -5.65460205078125, -5.4161376953125, -5.17767333984375, -4.939208984375, -4.70074462890625, -4.4622802734375, -4.22381591796875, -3.9853515625, -3.74688720703125, -3.5084228515625, -3.26995849609375, -3.031494140625, -2.79302978515625, -2.5545654296875, -2.31610107421875, -2.07763671875, -1.83917236328125, -1.6007080078125, -1.36224365234375, -1.123779296875, -0.88531494140625, -0.6468505859375, -0.40838623046875, -0.169921875, 0.06854248046875, 0.3070068359375, 0.54547119140625, 0.783935546875, 1.02239990234375, 1.2608642578125, 1.49932861328125, 1.73779296875, 1.97625732421875, 2.2147216796875, 2.45318603515625, 2.691650390625, 2.93011474609375, 3.1685791015625, 3.40704345703125, 3.6455078125, 3.88397216796875, 4.1224365234375, 4.36090087890625, 4.599365234375, 4.83782958984375, 5.0762939453125, 5.31475830078125, 5.55322265625, 5.79168701171875, 6.0301513671875, 6.26861572265625, 6.507080078125, 6.74554443359375, 6.9840087890625, 7.22247314453125, 7.4609375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 9.0, 6.0, 5.0, 10.0, 17.0, 27.0, 55.0, 62.0, 90.0, 124.0, 177.0, 298.0, 434.0, 630.0, 893.0, 1334.0, 1969.0, 3034.0, 4536.0, 6834.0, 10409.0, 15655.0, 24235.0, 37756.0, 62096.0, 108489.0, 199731.0, 233191.0, 134985.0, 74504.0, 44765.0, 27971.0, 17923.0, 12201.0, 7996.0, 5275.0, 3560.0, 2337.0, 1580.0, 1096.0, 748.0, 470.0, 332.0, 236.0, 150.0, 99.0, 74.0, 48.0, 44.0, 24.0, 11.0, 10.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-0.9287109375, -0.8998489379882812, -0.8709869384765625, -0.8421249389648438, -0.813262939453125, -0.7844009399414062, -0.7555389404296875, -0.7266769409179688, -0.69781494140625, -0.6689529418945312, -0.6400909423828125, -0.6112289428710938, -0.582366943359375, -0.5535049438476562, -0.5246429443359375, -0.49578094482421875, -0.4669189453125, -0.43805694580078125, -0.4091949462890625, -0.38033294677734375, -0.351470947265625, -0.32260894775390625, -0.2937469482421875, -0.26488494873046875, -0.23602294921875, -0.20716094970703125, -0.1782989501953125, -0.14943695068359375, -0.120574951171875, -0.09171295166015625, -0.0628509521484375, -0.03398895263671875, -0.005126953125, 0.02373504638671875, 0.0525970458984375, 0.08145904541015625, 0.110321044921875, 0.13918304443359375, 0.1680450439453125, 0.19690704345703125, 0.22576904296875, 0.25463104248046875, 0.2834930419921875, 0.31235504150390625, 0.341217041015625, 0.37007904052734375, 0.3989410400390625, 0.42780303955078125, 0.4566650390625, 0.48552703857421875, 0.5143890380859375, 0.5432510375976562, 0.572113037109375, 0.6009750366210938, 0.6298370361328125, 0.6586990356445312, 0.68756103515625, 0.7164230346679688, 0.7452850341796875, 0.7741470336914062, 0.803009033203125, 0.8318710327148438, 0.8607330322265625, 0.8895950317382812, 0.91845703125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 5.0, 11.0, 7.0, 12.0, 16.0, 11.0, 19.0, 16.0, 21.0, 25.0, 25.0, 16.0, 39.0, 27.0, 29.0, 29.0, 39.0, 49.0, 35.0, 43.0, 1066.0, 45.0, 51.0, 49.0, 29.0, 33.0, 31.0, 38.0, 27.0, 29.0, 22.0, 22.0, 16.0, 19.0, 13.0, 8.0, 6.0, 15.0, 8.0, 4.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.828125, -3.70123291015625, -3.5743408203125, -3.44744873046875, -3.320556640625, -3.19366455078125, -3.0667724609375, -2.93988037109375, -2.81298828125, -2.68609619140625, -2.5592041015625, -2.43231201171875, -2.305419921875, -2.17852783203125, -2.0516357421875, -1.92474365234375, -1.7978515625, -1.67095947265625, -1.5440673828125, -1.41717529296875, -1.290283203125, -1.16339111328125, -1.0364990234375, -0.90960693359375, -0.78271484375, -0.65582275390625, -0.5289306640625, -0.40203857421875, -0.275146484375, -0.14825439453125, -0.0213623046875, 0.10552978515625, 0.232421875, 0.35931396484375, 0.4862060546875, 0.61309814453125, 0.739990234375, 0.86688232421875, 0.9937744140625, 1.12066650390625, 1.24755859375, 1.37445068359375, 1.5013427734375, 1.62823486328125, 1.755126953125, 1.88201904296875, 2.0089111328125, 2.13580322265625, 2.2626953125, 2.38958740234375, 2.5164794921875, 2.64337158203125, 2.770263671875, 2.89715576171875, 3.0240478515625, 3.15093994140625, 3.27783203125, 3.40472412109375, 3.5316162109375, 3.65850830078125, 3.785400390625, 3.91229248046875, 4.0391845703125, 4.16607666015625, 4.29296875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 16.0, 23.0, 33.0, 40.0, 74.0, 89.0, 130.0, 189.0, 280.0, 399.0, 563.0, 846.0, 1205.0, 1705.0, 2571.0, 3736.0, 5726.0, 8623.0, 13416.0, 21115.0, 33769.0, 55751.0, 97472.0, 182993.0, 1298360.0, 152959.0, 83045.0, 48220.0, 29488.0, 18680.0, 11960.0, 7736.0, 5126.0, 3408.0, 2262.0, 1532.0, 1127.0, 795.0, 510.0, 372.0, 238.0, 178.0, 122.0, 81.0, 47.0, 37.0, 25.0, 22.0, 10.0, 9.0, 2.0, 6.0, 0.0, 0.0, 3.0], "bins": [-0.806640625, -0.7824630737304688, -0.7582855224609375, -0.7341079711914062, -0.709930419921875, -0.6857528686523438, -0.6615753173828125, -0.6373977661132812, -0.61322021484375, -0.5890426635742188, -0.5648651123046875, -0.5406875610351562, -0.516510009765625, -0.49233245849609375, -0.4681549072265625, -0.44397735595703125, -0.4197998046875, -0.39562225341796875, -0.3714447021484375, -0.34726715087890625, -0.323089599609375, -0.29891204833984375, -0.2747344970703125, -0.25055694580078125, -0.22637939453125, -0.20220184326171875, -0.1780242919921875, -0.15384674072265625, -0.129669189453125, -0.10549163818359375, -0.0813140869140625, -0.05713653564453125, -0.032958984375, -0.00878143310546875, 0.0153961181640625, 0.03957366943359375, 0.063751220703125, 0.08792877197265625, 0.1121063232421875, 0.13628387451171875, 0.16046142578125, 0.18463897705078125, 0.2088165283203125, 0.23299407958984375, 0.257171630859375, 0.28134918212890625, 0.3055267333984375, 0.32970428466796875, 0.3538818359375, 0.37805938720703125, 0.4022369384765625, 0.42641448974609375, 0.450592041015625, 0.47476959228515625, 0.4989471435546875, 0.5231246948242188, 0.54730224609375, 0.5714797973632812, 0.5956573486328125, 0.6198348999023438, 0.644012451171875, 0.6681900024414062, 0.6923675537109375, 0.7165451049804688, 0.74072265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 2.0, 6.0, 8.0, 13.0, 6.0, 14.0, 14.0, 10.0, 16.0, 19.0, 36.0, 22.0, 41.0, 49.0, 42.0, 48.0, 63.0, 55.0, 57.0, 62.0, 47.0, 45.0, 45.0, 45.0, 30.0, 41.0, 31.0, 14.0, 21.0, 13.0, 10.0, 13.0, 5.0, 8.0, 8.0, 5.0, 9.0, 5.0, 3.0, 1.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018720626831054688, -0.0018130689859390259, -0.001754075288772583, -0.0016950815916061401, -0.0016360878944396973, -0.0015770941972732544, -0.0015181005001068115, -0.0014591068029403687, -0.0014001131057739258, -0.001341119408607483, -0.00128212571144104, -0.0012231320142745972, -0.0011641383171081543, -0.0011051446199417114, -0.0010461509227752686, -0.0009871572256088257, -0.0009281635284423828, -0.0008691698312759399, -0.0008101761341094971, -0.0007511824369430542, -0.0006921887397766113, -0.0006331950426101685, -0.0005742013454437256, -0.0005152076482772827, -0.00045621395111083984, -0.00039722025394439697, -0.0003382265567779541, -0.00027923285961151123, -0.00022023916244506836, -0.0001612454652786255, -0.00010225176811218262, -4.3258070945739746e-05, 1.5735626220703125e-05, 7.4729323387146e-05, 0.00013372302055358887, 0.00019271671772003174, 0.0002517104148864746, 0.0003107041120529175, 0.00036969780921936035, 0.0004286915063858032, 0.0004876852035522461, 0.000546678900718689, 0.0006056725978851318, 0.0006646662950515747, 0.0007236599922180176, 0.0007826536893844604, 0.0008416473865509033, 0.0009006410837173462, 0.0009596347808837891, 0.001018628478050232, 0.0010776221752166748, 0.0011366158723831177, 0.0011956095695495605, 0.0012546032667160034, 0.0013135969638824463, 0.0013725906610488892, 0.001431584358215332, 0.001490578055381775, 0.0015495717525482178, 0.0016085654497146606, 0.0016675591468811035, 0.0017265528440475464, 0.0017855465412139893, 0.0018445402383804321, 0.001903533935546875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 7.0, 10.0, 10.0, 9.0, 22.0, 19.0, 28.0, 34.0, 49.0, 73.0, 99.0, 137.0, 263.0, 664.0, 3650.0, 988800.0, 52579.0, 989.0, 416.0, 209.0, 125.0, 78.0, 58.0, 37.0, 28.0, 22.0, 19.0, 18.0, 14.0, 14.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.045806884765625, -0.044406890869140625, -0.04300689697265625, -0.041606903076171875, -0.0402069091796875, -0.038806915283203125, -0.03740692138671875, -0.036006927490234375, -0.03460693359375, -0.033206939697265625, -0.03180694580078125, -0.030406951904296875, -0.0290069580078125, -0.027606964111328125, -0.02620697021484375, -0.024806976318359375, -0.023406982421875, -0.022006988525390625, -0.02060699462890625, -0.019207000732421875, -0.0178070068359375, -0.016407012939453125, -0.01500701904296875, -0.013607025146484375, -0.01220703125, -0.010807037353515625, -0.00940704345703125, -0.008007049560546875, -0.0066070556640625, -0.005207061767578125, -0.00380706787109375, -0.002407073974609375, -0.001007080078125, 0.000392913818359375, 0.00179290771484375, 0.003192901611328125, 0.0045928955078125, 0.005992889404296875, 0.00739288330078125, 0.008792877197265625, 0.01019287109375, 0.011592864990234375, 0.01299285888671875, 0.014392852783203125, 0.0157928466796875, 0.017192840576171875, 0.01859283447265625, 0.019992828369140625, 0.021392822265625, 0.022792816162109375, 0.02419281005859375, 0.025592803955078125, 0.0269927978515625, 0.028392791748046875, 0.02979278564453125, 0.031192779541015625, 0.0325927734375, 0.033992767333984375, 0.03539276123046875, 0.036792755126953125, 0.0381927490234375, 0.039592742919921875, 0.04099273681640625, 0.042392730712890625, 0.043792724609375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 42.0, 148.0, 349.0, 305.0, 128.0, 27.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0068414597772061825, -0.006709668319672346, -0.00657787686213851, -0.006446085404604673, -0.006314293947070837, -0.006182502489537001, -0.006050711032003164, -0.005918919108808041, -0.005787127651274204, -0.005655336193740368, -0.0055235447362065315, -0.005391753278672695, -0.005259961821138859, -0.005128170363605022, -0.004996378906071186, -0.00486458744853735, -0.004732795991003513, -0.004601004533469677, -0.004469213075935841, -0.004337421618402004, -0.004205630160868168, -0.0040738387033343315, -0.003942047245800495, -0.003810255555436015, -0.0036784640979021788, -0.0035466726403683424, -0.003414881182834506, -0.0032830897253006697, -0.0031512980349361897, -0.0030195065774023533, -0.002887715119868517, -0.0027559236623346806, -0.0026241319719702005, -0.002492340514436364, -0.002360549056902528, -0.0022287575993686914, -0.0020969659090042114, -0.001965174451470375, -0.0018333829939365387, -0.0017015915364027023, -0.001569800078868866, -0.0014380086213350296, -0.0013062171638011932, -0.001174425589852035, -0.0010426341323181987, -0.0009108426747843623, -0.000779051159042865, -0.0006472596433013678, -0.0005154681857675314, -0.0003836766991298646, -0.00025188521249219775, -0.00012009372585453093, 1.1697760783135891e-05, 0.00014348921831697226, 0.00027528073405846953, 0.0004070722497999668, 0.0005388637073338032, 0.0006706551648676395, 0.0008024466806091368, 0.0009342381963506341, 0.0010660296538844705, 0.0011978211114183068, 0.001329612685367465, 0.0014614041429013014, 0.0015931956004351377]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 21.0, 12.0, 19.0, 16.0, 28.0, 27.0, 30.0, 40.0, 40.0, 40.0, 41.0, 37.0, 53.0, 37.0, 50.0, 36.0, 35.0, 36.0, 43.0, 37.0, 34.0, 29.0, 29.0, 30.0, 26.0, 23.0, 19.0, 12.0, 12.0, 16.0, 12.0, 12.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011265277862548828, -0.0010912679135799408, -0.0010560080409049988, -0.0010207481682300568, -0.0009854882955551147, -0.0009502284228801727, -0.0009149685502052307, -0.0008797086775302887, -0.0008444488048553467, -0.0008091889321804047, -0.0007739290595054626, -0.0007386691868305206, -0.0007034093141555786, -0.0006681494414806366, -0.0006328895688056946, -0.0005976296961307526, -0.0005623698234558105, -0.0005271099507808685, -0.0004918500781059265, -0.0004565902054309845, -0.0004213303327560425, -0.00038607046008110046, -0.00035081058740615845, -0.00031555071473121643, -0.0002802908420562744, -0.0002450309693813324, -0.00020977109670639038, -0.00017451122403144836, -0.00013925135135650635, -0.00010399147868156433, -6.873160600662231e-05, -3.34717333316803e-05, 1.7881393432617188e-06, 3.7048012018203735e-05, 7.230788469314575e-05, 0.00010756775736808777, 0.00014282763004302979, 0.0001780875027179718, 0.00021334737539291382, 0.00024860724806785583, 0.00028386712074279785, 0.00031912699341773987, 0.0003543868660926819, 0.0003896467387676239, 0.0004249066114425659, 0.00046016648411750793, 0.00049542635679245, 0.000530686229467392, 0.000565946102142334, 0.000601205974817276, 0.000636465847492218, 0.00067172572016716, 0.000706985592842102, 0.0007422454655170441, 0.0007775053381919861, 0.0008127652108669281, 0.0008480250835418701, 0.0008832849562168121, 0.0009185448288917542, 0.0009538047015666962, 0.0009890645742416382, 0.0010243244469165802, 0.0010595843195915222, 0.0010948441922664642, 0.0011301040649414062]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 4.0, 14.0, 14.0, 15.0, 16.0, 29.0, 26.0, 33.0, 32.0, 37.0, 47.0, 40.0, 41.0, 58.0, 49.0, 41.0, 47.0, 51.0, 51.0, 45.0, 43.0, 48.0, 32.0, 33.0, 21.0, 18.0, 17.0, 18.0, 21.0, 16.0, 7.0, 10.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80078125, -7.56231689453125, -7.3238525390625, -7.08538818359375, -6.846923828125, -6.60845947265625, -6.3699951171875, -6.13153076171875, -5.89306640625, -5.65460205078125, -5.4161376953125, -5.17767333984375, -4.939208984375, -4.70074462890625, -4.4622802734375, -4.22381591796875, -3.9853515625, -3.74688720703125, -3.5084228515625, -3.26995849609375, -3.031494140625, -2.79302978515625, -2.5545654296875, -2.31610107421875, -2.07763671875, -1.83917236328125, -1.6007080078125, -1.36224365234375, -1.123779296875, -0.88531494140625, -0.6468505859375, -0.40838623046875, -0.169921875, 0.06854248046875, 0.3070068359375, 0.54547119140625, 0.783935546875, 1.02239990234375, 1.2608642578125, 1.49932861328125, 1.73779296875, 1.97625732421875, 2.2147216796875, 2.45318603515625, 2.691650390625, 2.93011474609375, 3.1685791015625, 3.40704345703125, 3.6455078125, 3.88397216796875, 4.1224365234375, 4.36090087890625, 4.599365234375, 4.83782958984375, 5.0762939453125, 5.31475830078125, 5.55322265625, 5.79168701171875, 6.0301513671875, 6.26861572265625, 6.507080078125, 6.74554443359375, 6.9840087890625, 7.22247314453125, 7.4609375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 8.0, 3.0, 15.0, 25.0, 31.0, 34.0, 72.0, 83.0, 108.0, 165.0, 281.0, 524.0, 865.0, 1713.0, 3558.0, 8291.0, 20671.0, 55035.0, 156677.0, 396829.0, 258621.0, 89125.0, 32602.0, 12663.0, 5306.0, 2377.0, 1202.0, 605.0, 330.0, 235.0, 164.0, 105.0, 61.0, 53.0, 39.0, 21.0, 17.0, 12.0, 10.0, 11.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.5284423828125, -4.381103515625, -4.2337646484375, -4.08642578125, -3.9390869140625, -3.791748046875, -3.6444091796875, -3.4970703125, -3.3497314453125, -3.202392578125, -3.0550537109375, -2.90771484375, -2.7603759765625, -2.613037109375, -2.4656982421875, -2.318359375, -2.1710205078125, -2.023681640625, -1.8763427734375, -1.72900390625, -1.5816650390625, -1.434326171875, -1.2869873046875, -1.1396484375, -0.9923095703125, -0.844970703125, -0.6976318359375, -0.55029296875, -0.4029541015625, -0.255615234375, -0.1082763671875, 0.0390625, 0.1864013671875, 0.333740234375, 0.4810791015625, 0.62841796875, 0.7757568359375, 0.923095703125, 1.0704345703125, 1.2177734375, 1.3651123046875, 1.512451171875, 1.6597900390625, 1.80712890625, 1.9544677734375, 2.101806640625, 2.2491455078125, 2.396484375, 2.5438232421875, 2.691162109375, 2.8385009765625, 2.98583984375, 3.1331787109375, 3.280517578125, 3.4278564453125, 3.5751953125, 3.7225341796875, 3.869873046875, 4.0172119140625, 4.16455078125, 4.3118896484375, 4.459228515625, 4.6065673828125, 4.75390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 0.0, 7.0, 6.0, 2.0, 9.0, 3.0, 15.0, 14.0, 25.0, 19.0, 35.0, 26.0, 42.0, 51.0, 50.0, 61.0, 87.0, 349.0, 1702.0, 136.0, 71.0, 46.0, 47.0, 41.0, 37.0, 29.0, 31.0, 18.0, 23.0, 12.0, 11.0, 14.0, 6.0, 4.0, 7.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.84375, -31.853759765625, -30.86376953125, -29.873779296875, -28.8837890625, -27.893798828125, -26.90380859375, -25.913818359375, -24.923828125, -23.933837890625, -22.94384765625, -21.953857421875, -20.9638671875, -19.973876953125, -18.98388671875, -17.993896484375, -17.00390625, -16.013916015625, -15.02392578125, -14.033935546875, -13.0439453125, -12.053955078125, -11.06396484375, -10.073974609375, -9.083984375, -8.093994140625, -7.10400390625, -6.114013671875, -5.1240234375, -4.134033203125, -3.14404296875, -2.154052734375, -1.1640625, -0.174072265625, 0.81591796875, 1.805908203125, 2.7958984375, 3.785888671875, 4.77587890625, 5.765869140625, 6.755859375, 7.745849609375, 8.73583984375, 9.725830078125, 10.7158203125, 11.705810546875, 12.69580078125, 13.685791015625, 14.67578125, 15.665771484375, 16.65576171875, 17.645751953125, 18.6357421875, 19.625732421875, 20.61572265625, 21.605712890625, 22.595703125, 23.585693359375, 24.57568359375, 25.565673828125, 26.5556640625, 27.545654296875, 28.53564453125, 29.525634765625, 30.515625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 14.0, 18.0, 16.0, 19.0, 30.0, 33.0, 62.0, 84.0, 101.0, 158.0, 199.0, 324.0, 728.0, 6989.0, 3126438.0, 8651.0, 764.0, 336.0, 198.0, 145.0, 105.0, 63.0, 57.0, 33.0, 37.0, 21.0, 15.0, 5.0, 12.0, 8.0, 8.0, 5.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-67.0, -64.8046875, -62.609375, -60.4140625, -58.21875, -56.0234375, -53.828125, -51.6328125, -49.4375, -47.2421875, -45.046875, -42.8515625, -40.65625, -38.4609375, -36.265625, -34.0703125, -31.875, -29.6796875, -27.484375, -25.2890625, -23.09375, -20.8984375, -18.703125, -16.5078125, -14.3125, -12.1171875, -9.921875, -7.7265625, -5.53125, -3.3359375, -1.140625, 1.0546875, 3.25, 5.4453125, 7.640625, 9.8359375, 12.03125, 14.2265625, 16.421875, 18.6171875, 20.8125, 23.0078125, 25.203125, 27.3984375, 29.59375, 31.7890625, 33.984375, 36.1796875, 38.375, 40.5703125, 42.765625, 44.9609375, 47.15625, 49.3515625, 51.546875, 53.7421875, 55.9375, 58.1328125, 60.328125, 62.5234375, 64.71875, 66.9140625, 69.109375, 71.3046875, 73.5]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 446.0, 563.0], "bins": [-427.08331298828125, -420.3058776855469, -413.5284118652344, -406.7509765625, -399.9735107421875, -393.1960754394531, -386.41864013671875, -379.64117431640625, -372.8637390136719, -366.0863037109375, -359.308837890625, -352.5314025878906, -345.7539367675781, -338.97650146484375, -332.19903564453125, -325.4216003417969, -318.6441345214844, -311.86669921875, -305.0892333984375, -298.3117980957031, -291.5343322753906, -284.75689697265625, -277.97943115234375, -271.2019958496094, -264.424560546875, -257.6471252441406, -250.86965942382812, -244.09222412109375, -237.3147735595703, -230.53732299804688, -223.75987243652344, -216.982421875, -210.20497131347656, -203.42752075195312, -196.6500701904297, -189.87261962890625, -183.09518432617188, -176.31773376464844, -169.540283203125, -162.76283264160156, -155.98538208007812, -149.2079315185547, -142.43048095703125, -135.65304565429688, -128.87559509277344, -122.09814453125, -115.32069396972656, -108.54324340820312, -101.76580047607422, -94.98834991455078, -88.21090698242188, -81.43345642089844, -74.656005859375, -67.87855529785156, -61.101112365722656, -54.32366180419922, -47.54621887207031, -40.76877212524414, -33.9913215637207, -27.21387481689453, -20.436426162719727, -13.658977508544922, -6.88153076171875, -0.1040802001953125, 6.673367500305176]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 2.0, 6.0, 14.0, 14.0, 17.0, 16.0, 17.0, 25.0, 16.0, 15.0, 23.0, 24.0, 17.0, 24.0, 29.0, 35.0, 29.0, 36.0, 40.0, 39.0, 32.0, 35.0, 40.0, 29.0, 31.0, 25.0, 30.0, 40.0, 26.0, 24.0, 23.0, 18.0, 26.0, 20.0, 21.0, 15.0, 11.0, 12.0, 15.0, 16.0, 15.0, 13.0, 6.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 6.0], "bins": [-51.062828063964844, -49.474693298339844, -47.88655471801758, -46.29841995239258, -44.71028518676758, -43.12215042114258, -41.53401184082031, -39.94587707519531, -38.35774230957031, -36.76960754394531, -35.18146896362305, -33.59333419799805, -32.00519943237305, -30.417062759399414, -28.82892608642578, -27.24079132080078, -25.65265464782715, -24.064517974853516, -22.476383209228516, -20.888246536254883, -19.300111770629883, -17.71197509765625, -16.12384033203125, -14.535703659057617, -12.9475679397583, -11.359432220458984, -9.771296501159668, -8.183160781860352, -6.595024585723877, -5.0068888664245605, -3.418752670288086, -1.8306169509887695, -0.24248123168945312, 1.3456546068191528, 2.933790445327759, 4.521926403045654, 6.110062122344971, 7.698197841644287, 9.286334037780762, 10.874469757080078, 12.462605476379395, 14.050741195678711, 15.638876914978027, 17.227012634277344, 18.815149307250977, 20.403284072875977, 21.99142074584961, 23.57955551147461, 25.167692184448242, 26.755828857421875, 28.343963623046875, 29.932100296020508, 31.520235061645508, 33.10837173461914, 34.69650650024414, 36.284645080566406, 37.872779846191406, 39.460914611816406, 41.04905319213867, 42.63718795776367, 44.22532272338867, 45.81345748901367, 47.40159606933594, 48.98973083496094, 50.57786560058594]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 7.0, 13.0, 7.0, 17.0, 13.0, 18.0, 20.0, 27.0, 30.0, 39.0, 35.0, 34.0, 47.0, 46.0, 47.0, 55.0, 39.0, 49.0, 44.0, 45.0, 42.0, 47.0, 45.0, 40.0, 24.0, 30.0, 15.0, 19.0, 17.0, 16.0, 18.0, 15.0, 9.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.078125, -7.84033203125, -7.6025390625, -7.36474609375, -7.126953125, -6.88916015625, -6.6513671875, -6.41357421875, -6.17578125, -5.93798828125, -5.7001953125, -5.46240234375, -5.224609375, -4.98681640625, -4.7490234375, -4.51123046875, -4.2734375, -4.03564453125, -3.7978515625, -3.56005859375, -3.322265625, -3.08447265625, -2.8466796875, -2.60888671875, -2.37109375, -2.13330078125, -1.8955078125, -1.65771484375, -1.419921875, -1.18212890625, -0.9443359375, -0.70654296875, -0.46875, -0.23095703125, 0.0068359375, 0.24462890625, 0.482421875, 0.72021484375, 0.9580078125, 1.19580078125, 1.43359375, 1.67138671875, 1.9091796875, 2.14697265625, 2.384765625, 2.62255859375, 2.8603515625, 3.09814453125, 3.3359375, 3.57373046875, 3.8115234375, 4.04931640625, 4.287109375, 4.52490234375, 4.7626953125, 5.00048828125, 5.23828125, 5.47607421875, 5.7138671875, 5.95166015625, 6.189453125, 6.42724609375, 6.6650390625, 6.90283203125, 7.140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 9.0, 4.0, 8.0, 8.0, 9.0, 18.0, 10.0, 21.0, 15.0, 27.0, 31.0, 37.0, 49.0, 60.0, 130.0, 349.0, 1465.0, 11696.0, 654399.0, 3435826.0, 84788.0, 4066.0, 662.0, 233.0, 86.0, 55.0, 44.0, 26.0, 25.0, 24.0, 18.0, 14.0, 14.0, 16.0, 12.0, 10.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-31.828125, -30.89990234375, -29.9716796875, -29.04345703125, -28.115234375, -27.18701171875, -26.2587890625, -25.33056640625, -24.40234375, -23.47412109375, -22.5458984375, -21.61767578125, -20.689453125, -19.76123046875, -18.8330078125, -17.90478515625, -16.9765625, -16.04833984375, -15.1201171875, -14.19189453125, -13.263671875, -12.33544921875, -11.4072265625, -10.47900390625, -9.55078125, -8.62255859375, -7.6943359375, -6.76611328125, -5.837890625, -4.90966796875, -3.9814453125, -3.05322265625, -2.125, -1.19677734375, -0.2685546875, 0.65966796875, 1.587890625, 2.51611328125, 3.4443359375, 4.37255859375, 5.30078125, 6.22900390625, 7.1572265625, 8.08544921875, 9.013671875, 9.94189453125, 10.8701171875, 11.79833984375, 12.7265625, 13.65478515625, 14.5830078125, 15.51123046875, 16.439453125, 17.36767578125, 18.2958984375, 19.22412109375, 20.15234375, 21.08056640625, 22.0087890625, 22.93701171875, 23.865234375, 24.79345703125, 25.7216796875, 26.64990234375, 27.578125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 10.0, 11.0, 18.0, 23.0, 44.0, 58.0, 70.0, 99.0, 148.0, 183.0, 274.0, 359.0, 401.0, 480.0, 443.0, 376.0, 290.0, 221.0, 154.0, 122.0, 84.0, 54.0, 47.0, 20.0, 21.0, 11.0, 14.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.7734375, -15.31787109375, -14.8623046875, -14.40673828125, -13.951171875, -13.49560546875, -13.0400390625, -12.58447265625, -12.12890625, -11.67333984375, -11.2177734375, -10.76220703125, -10.306640625, -9.85107421875, -9.3955078125, -8.93994140625, -8.484375, -8.02880859375, -7.5732421875, -7.11767578125, -6.662109375, -6.20654296875, -5.7509765625, -5.29541015625, -4.83984375, -4.38427734375, -3.9287109375, -3.47314453125, -3.017578125, -2.56201171875, -2.1064453125, -1.65087890625, -1.1953125, -0.73974609375, -0.2841796875, 0.17138671875, 0.626953125, 1.08251953125, 1.5380859375, 1.99365234375, 2.44921875, 2.90478515625, 3.3603515625, 3.81591796875, 4.271484375, 4.72705078125, 5.1826171875, 5.63818359375, 6.09375, 6.54931640625, 7.0048828125, 7.46044921875, 7.916015625, 8.37158203125, 8.8271484375, 9.28271484375, 9.73828125, 10.19384765625, 10.6494140625, 11.10498046875, 11.560546875, 12.01611328125, 12.4716796875, 12.92724609375, 13.3828125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 4.0, 4.0, 16.0, 16.0, 17.0, 25.0, 17.0, 43.0, 38.0, 49.0, 54.0, 82.0, 134.0, 159.0, 239.0, 440.0, 1083.0, 6615.0, 320600.0, 3791151.0, 68534.0, 3071.0, 731.0, 341.0, 201.0, 146.0, 106.0, 76.0, 63.0, 54.0, 29.0, 29.0, 20.0, 18.0, 14.0, 14.0, 9.0, 10.0, 5.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.46875, -40.05517578125, -38.6416015625, -37.22802734375, -35.814453125, -34.40087890625, -32.9873046875, -31.57373046875, -30.16015625, -28.74658203125, -27.3330078125, -25.91943359375, -24.505859375, -23.09228515625, -21.6787109375, -20.26513671875, -18.8515625, -17.43798828125, -16.0244140625, -14.61083984375, -13.197265625, -11.78369140625, -10.3701171875, -8.95654296875, -7.54296875, -6.12939453125, -4.7158203125, -3.30224609375, -1.888671875, -0.47509765625, 0.9384765625, 2.35205078125, 3.765625, 5.17919921875, 6.5927734375, 8.00634765625, 9.419921875, 10.83349609375, 12.2470703125, 13.66064453125, 15.07421875, 16.48779296875, 17.9013671875, 19.31494140625, 20.728515625, 22.14208984375, 23.5556640625, 24.96923828125, 26.3828125, 27.79638671875, 29.2099609375, 30.62353515625, 32.037109375, 33.45068359375, 34.8642578125, 36.27783203125, 37.69140625, 39.10498046875, 40.5185546875, 41.93212890625, 43.345703125, 44.75927734375, 46.1728515625, 47.58642578125, 49.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 242.0, 610.0, 132.0, 17.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.20087432861328, -89.50810241699219, -78.81533813476562, -68.12257385253906, -57.42980194091797, -46.73703384399414, -36.04426574707031, -25.35149383544922, -14.658729553222656, -3.965961456298828, 6.726806640625, 17.419574737548828, 28.112342834472656, 38.805110931396484, 49.49787902832031, 60.190650939941406, 70.88341522216797, 81.57618713378906, 92.26895141601562, 102.96171569824219, 113.65448760986328, 124.34725952148438, 135.04002380371094, 145.7327880859375, 156.42556762695312, 167.1183319091797, 177.81109619140625, 188.50387573242188, 199.19664001464844, 209.889404296875, 220.58218383789062, 231.2749481201172, 241.96771240234375, 252.6604766845703, 263.3532409667969, 274.0460205078125, 284.73876953125, 295.4315490722656, 306.12432861328125, 316.81707763671875, 327.5098571777344, 338.20263671875, 348.8953857421875, 359.5881652832031, 370.28094482421875, 380.97369384765625, 391.6664733886719, 402.3592529296875, 413.052001953125, 423.7447814941406, 434.4375305175781, 445.13031005859375, 455.82305908203125, 466.5158386230469, 477.2086181640625, 487.9013671875, 498.5941467285156, 509.28692626953125, 519.9796752929688, 530.6724243164062, 541.365234375, 552.0579833984375, 562.750732421875, 573.4435424804688, 584.1362915039062]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 9.0, 10.0, 13.0, 17.0, 16.0, 12.0, 22.0, 24.0, 33.0, 30.0, 27.0, 25.0, 30.0, 32.0, 26.0, 35.0, 36.0, 49.0, 46.0, 45.0, 39.0, 42.0, 34.0, 27.0, 34.0, 31.0, 25.0, 31.0, 26.0, 24.0, 16.0, 19.0, 8.0, 18.0, 20.0, 13.0, 12.0, 9.0, 6.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-46.99755859375, -45.72099304199219, -44.44442367553711, -43.1678581237793, -41.89128875732422, -40.614723205566406, -39.33815383911133, -38.061588287353516, -36.78501892089844, -35.508453369140625, -34.23188400268555, -32.955318450927734, -31.678749084472656, -30.402183532714844, -29.1256160736084, -27.849048614501953, -26.57248306274414, -25.295915603637695, -24.01934814453125, -22.742780685424805, -21.46621322631836, -20.189647674560547, -18.9130802154541, -17.636512756347656, -16.35994529724121, -15.083377838134766, -13.80681037902832, -12.530243873596191, -11.253676414489746, -9.9771089553833, -8.700542449951172, -7.423974990844727, -6.147407531738281, -4.870840072631836, -3.594273090362549, -2.3177058696746826, -1.0411386489868164, 0.2354288101196289, 1.511995792388916, 2.788562774658203, 4.065130233764648, 5.341697692871094, 6.618264675140381, 7.894831657409668, 9.171399116516113, 10.447966575622559, 11.724533081054688, 13.001100540161133, 14.277667999267578, 15.554235458374023, 16.83080291748047, 18.107370376586914, 19.38393783569336, 20.660503387451172, 21.937070846557617, 23.213638305664062, 24.490205764770508, 25.766773223876953, 27.0433406829834, 28.319908142089844, 29.596473693847656, 30.873043060302734, 32.14960861206055, 33.426177978515625, 34.70274353027344]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 9.0, 3.0, 6.0, 9.0, 8.0, 15.0, 11.0, 17.0, 19.0, 23.0, 30.0, 31.0, 38.0, 46.0, 37.0, 50.0, 61.0, 50.0, 43.0, 52.0, 39.0, 40.0, 48.0, 46.0, 33.0, 40.0, 32.0, 27.0, 29.0, 22.0, 8.0, 17.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8306884765625, -7.598876953125, -7.3670654296875, -7.13525390625, -6.9034423828125, -6.671630859375, -6.4398193359375, -6.2080078125, -5.9761962890625, -5.744384765625, -5.5125732421875, -5.28076171875, -5.0489501953125, -4.817138671875, -4.5853271484375, -4.353515625, -4.1217041015625, -3.889892578125, -3.6580810546875, -3.42626953125, -3.1944580078125, -2.962646484375, -2.7308349609375, -2.4990234375, -2.2672119140625, -2.035400390625, -1.8035888671875, -1.57177734375, -1.3399658203125, -1.108154296875, -0.8763427734375, -0.64453125, -0.4127197265625, -0.180908203125, 0.0509033203125, 0.28271484375, 0.5145263671875, 0.746337890625, 0.9781494140625, 1.2099609375, 1.4417724609375, 1.673583984375, 1.9053955078125, 2.13720703125, 2.3690185546875, 2.600830078125, 2.8326416015625, 3.064453125, 3.2962646484375, 3.528076171875, 3.7598876953125, 3.99169921875, 4.2235107421875, 4.455322265625, 4.6871337890625, 4.9189453125, 5.1507568359375, 5.382568359375, 5.6143798828125, 5.84619140625, 6.0780029296875, 6.309814453125, 6.5416259765625, 6.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 12.0, 17.0, 15.0, 21.0, 33.0, 51.0, 64.0, 99.0, 140.0, 221.0, 278.0, 401.0, 576.0, 804.0, 1173.0, 1677.0, 2314.0, 3318.0, 4859.0, 7100.0, 10571.0, 15474.0, 23616.0, 36895.0, 59225.0, 102145.0, 187554.0, 235718.0, 139215.0, 78025.0, 47109.0, 29310.0, 19422.0, 13134.0, 8651.0, 5912.0, 4110.0, 2755.0, 1936.0, 1408.0, 964.0, 661.0, 503.0, 298.0, 250.0, 158.0, 112.0, 83.0, 55.0, 35.0, 27.0, 15.0, 20.0, 7.0, 8.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.80029296875, -0.7729415893554688, -0.7455902099609375, -0.7182388305664062, -0.690887451171875, -0.6635360717773438, -0.6361846923828125, -0.6088333129882812, -0.58148193359375, -0.5541305541992188, -0.5267791748046875, -0.49942779541015625, -0.472076416015625, -0.44472503662109375, -0.4173736572265625, -0.39002227783203125, -0.3626708984375, -0.33531951904296875, -0.3079681396484375, -0.28061676025390625, -0.253265380859375, -0.22591400146484375, -0.1985626220703125, -0.17121124267578125, -0.14385986328125, -0.11650848388671875, -0.0891571044921875, -0.06180572509765625, -0.034454345703125, -0.00710296630859375, 0.0202484130859375, 0.04759979248046875, 0.074951171875, 0.10230255126953125, 0.1296539306640625, 0.15700531005859375, 0.184356689453125, 0.21170806884765625, 0.2390594482421875, 0.26641082763671875, 0.29376220703125, 0.32111358642578125, 0.3484649658203125, 0.37581634521484375, 0.403167724609375, 0.43051910400390625, 0.4578704833984375, 0.48522186279296875, 0.5125732421875, 0.5399246215820312, 0.5672760009765625, 0.5946273803710938, 0.621978759765625, 0.6493301391601562, 0.6766815185546875, 0.7040328979492188, 0.73138427734375, 0.7587356567382812, 0.7860870361328125, 0.8134384155273438, 0.840789794921875, 0.8681411743164062, 0.8954925537109375, 0.9228439331054688, 0.9501953125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 6.0, 3.0, 9.0, 15.0, 15.0, 10.0, 16.0, 22.0, 20.0, 21.0, 31.0, 35.0, 32.0, 31.0, 37.0, 35.0, 42.0, 42.0, 39.0, 1071.0, 37.0, 40.0, 41.0, 34.0, 40.0, 30.0, 32.0, 27.0, 28.0, 28.0, 27.0, 21.0, 25.0, 22.0, 12.0, 12.0, 10.0, 9.0, 7.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.55859375, -4.4268798828125, -4.295166015625, -4.1634521484375, -4.03173828125, -3.9000244140625, -3.768310546875, -3.6365966796875, -3.5048828125, -3.3731689453125, -3.241455078125, -3.1097412109375, -2.97802734375, -2.8463134765625, -2.714599609375, -2.5828857421875, -2.451171875, -2.3194580078125, -2.187744140625, -2.0560302734375, -1.92431640625, -1.7926025390625, -1.660888671875, -1.5291748046875, -1.3974609375, -1.2657470703125, -1.134033203125, -1.0023193359375, -0.87060546875, -0.7388916015625, -0.607177734375, -0.4754638671875, -0.34375, -0.2120361328125, -0.080322265625, 0.0513916015625, 0.18310546875, 0.3148193359375, 0.446533203125, 0.5782470703125, 0.7099609375, 0.8416748046875, 0.973388671875, 1.1051025390625, 1.23681640625, 1.3685302734375, 1.500244140625, 1.6319580078125, 1.763671875, 1.8953857421875, 2.027099609375, 2.1588134765625, 2.29052734375, 2.4222412109375, 2.553955078125, 2.6856689453125, 2.8173828125, 2.9490966796875, 3.080810546875, 3.2125244140625, 3.34423828125, 3.4759521484375, 3.607666015625, 3.7393798828125, 3.87109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 3.0, 11.0, 19.0, 17.0, 35.0, 44.0, 74.0, 109.0, 160.0, 222.0, 304.0, 518.0, 699.0, 1061.0, 1535.0, 2365.0, 3456.0, 5323.0, 8290.0, 13146.0, 20953.0, 34880.0, 59018.0, 108088.0, 206313.0, 1298947.0, 141850.0, 75409.0, 43310.0, 25848.0, 15894.0, 10056.0, 6475.0, 4240.0, 2729.0, 1806.0, 1232.0, 850.0, 557.0, 444.0, 277.0, 172.0, 138.0, 87.0, 66.0, 37.0, 18.0, 18.0, 13.0, 11.0, 3.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.849609375, -0.8240280151367188, -0.7984466552734375, -0.7728652954101562, -0.747283935546875, -0.7217025756835938, -0.6961212158203125, -0.6705398559570312, -0.64495849609375, -0.6193771362304688, -0.5937957763671875, -0.5682144165039062, -0.542633056640625, -0.5170516967773438, -0.4914703369140625, -0.46588897705078125, -0.4403076171875, -0.41472625732421875, -0.3891448974609375, -0.36356353759765625, -0.337982177734375, -0.31240081787109375, -0.2868194580078125, -0.26123809814453125, -0.23565673828125, -0.21007537841796875, -0.1844940185546875, -0.15891265869140625, -0.133331298828125, -0.10774993896484375, -0.0821685791015625, -0.05658721923828125, -0.031005859375, -0.00542449951171875, 0.0201568603515625, 0.04573822021484375, 0.071319580078125, 0.09690093994140625, 0.1224822998046875, 0.14806365966796875, 0.17364501953125, 0.19922637939453125, 0.2248077392578125, 0.25038909912109375, 0.275970458984375, 0.30155181884765625, 0.3271331787109375, 0.35271453857421875, 0.3782958984375, 0.40387725830078125, 0.4294586181640625, 0.45503997802734375, 0.480621337890625, 0.5062026977539062, 0.5317840576171875, 0.5573654174804688, 0.58294677734375, 0.6085281372070312, 0.6341094970703125, 0.6596908569335938, 0.685272216796875, 0.7108535766601562, 0.7364349365234375, 0.7620162963867188, 0.78759765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 8.0, 4.0, 8.0, 9.0, 11.0, 5.0, 16.0, 18.0, 12.0, 18.0, 26.0, 35.0, 38.0, 29.0, 40.0, 33.0, 41.0, 58.0, 49.0, 53.0, 63.0, 48.0, 36.0, 48.0, 38.0, 43.0, 37.0, 22.0, 34.0, 19.0, 20.0, 20.0, 14.0, 11.0, 10.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0016164779663085938, -0.0015639960765838623, -0.0015115141868591309, -0.0014590322971343994, -0.001406550407409668, -0.0013540685176849365, -0.001301586627960205, -0.0012491047382354736, -0.0011966228485107422, -0.0011441409587860107, -0.0010916590690612793, -0.0010391771793365479, -0.0009866952896118164, -0.000934213399887085, -0.0008817315101623535, -0.0008292496204376221, -0.0007767677307128906, -0.0007242858409881592, -0.0006718039512634277, -0.0006193220615386963, -0.0005668401718139648, -0.0005143582820892334, -0.00046187639236450195, -0.0004093945026397705, -0.00035691261291503906, -0.0003044307231903076, -0.00025194883346557617, -0.00019946694374084473, -0.00014698505401611328, -9.450316429138184e-05, -4.202127456665039e-05, 1.0460615158081055e-05, 6.29425048828125e-05, 0.00011542439460754395, 0.0001679062843322754, 0.00022038817405700684, 0.0002728700637817383, 0.0003253519535064697, 0.00037783384323120117, 0.0004303157329559326, 0.00048279762268066406, 0.0005352795124053955, 0.000587761402130127, 0.0006402432918548584, 0.0006927251815795898, 0.0007452070713043213, 0.0007976889610290527, 0.0008501708507537842, 0.0009026527404785156, 0.0009551346302032471, 0.0010076165199279785, 0.00106009840965271, 0.0011125802993774414, 0.0011650621891021729, 0.0012175440788269043, 0.0012700259685516357, 0.0013225078582763672, 0.0013749897480010986, 0.00142747163772583, 0.0014799535274505615, 0.001532435417175293, 0.0015849173069000244, 0.0016373991966247559, 0.0016898810863494873, 0.0017423629760742188]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 3.0, 8.0, 8.0, 13.0, 21.0, 23.0, 34.0, 64.0, 57.0, 77.0, 110.0, 198.0, 459.0, 1269.0, 133814.0, 908204.0, 2832.0, 602.0, 232.0, 145.0, 96.0, 66.0, 39.0, 34.0, 39.0, 19.0, 20.0, 14.0, 11.0, 12.0, 9.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03723478317260742, -0.035864830017089844, -0.034494876861572266, -0.03312492370605469, -0.03175497055053711, -0.03038501739501953, -0.029015064239501953, -0.027645111083984375, -0.026275157928466797, -0.02490520477294922, -0.02353525161743164, -0.022165298461914062, -0.020795345306396484, -0.019425392150878906, -0.018055438995361328, -0.01668548583984375, -0.015315532684326172, -0.013945579528808594, -0.012575626373291016, -0.011205673217773438, -0.00983572006225586, -0.008465766906738281, -0.007095813751220703, -0.005725860595703125, -0.004355907440185547, -0.0029859542846679688, -0.0016160011291503906, -0.0002460479736328125, 0.0011239051818847656, 0.0024938583374023438, 0.003863811492919922, 0.0052337646484375, 0.006603717803955078, 0.007973670959472656, 0.009343624114990234, 0.010713577270507812, 0.01208353042602539, 0.013453483581542969, 0.014823436737060547, 0.016193389892578125, 0.017563343048095703, 0.01893329620361328, 0.02030324935913086, 0.021673202514648438, 0.023043155670166016, 0.024413108825683594, 0.025783061981201172, 0.02715301513671875, 0.028522968292236328, 0.029892921447753906, 0.031262874603271484, 0.03263282775878906, 0.03400278091430664, 0.03537273406982422, 0.0367426872253418, 0.038112640380859375, 0.03948259353637695, 0.04085254669189453, 0.04222249984741211, 0.04359245300292969, 0.044962406158447266, 0.046332359313964844, 0.04770231246948242, 0.049072265625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 10.0, 26.0, 168.0, 350.0, 318.0, 115.0, 24.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029191887006163597, -0.0027646366506814957, -0.0026100848335772753, -0.0024555327836424112, -0.002300980733707547, -0.002146428916603327, -0.0019918768666684628, -0.0018373248167335987, -0.0016827728832140565, -0.0015282209496945143, -0.0013736688997596502, -0.001219116966240108, -0.0010645650327205658, -0.0009100129827857018, -0.0007554610492661595, -0.0006009089993312955, -0.0004463570658117533, -0.00029180507408455014, -0.00013725311146117747, 1.7298851162195206e-05, 0.00017185084288939834, 0.00032640283461660147, 0.0004809547681361437, 0.0006355068180710077, 0.00079005875159055, 0.0009446107433177531, 0.0010991627350449562, 0.0012537146685644984, 0.0014082666020840406, 0.0015628186520189047, 0.001717370585538447, 0.001871922635473311, 0.002026474568992853, 0.002181026618927717, 0.0023355784360319376, 0.0024901304859668016, 0.0026446825359016657, 0.002799234353005886, 0.00295378640294075, 0.003108338452875614, 0.003262890502810478, 0.0034174425527453423, 0.0035719943698495626, 0.0037265464197844267, 0.0038810984697192907, 0.004035650286823511, 0.004190202336758375, 0.004344754386693239, 0.004499305970966816, 0.00465385802090168, 0.004808410070836544, 0.004962962120771408, 0.005117513705044985, 0.005272065754979849, 0.005426617804914713, 0.005581169854849577, 0.005735721904784441, 0.005890273954719305, 0.006044826004654169, 0.006199377588927746, 0.00635392963886261, 0.006508481688797474, 0.006663033738732338, 0.006817585788667202, 0.006972137838602066]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 10.0, 6.0, 6.0, 14.0, 15.0, 16.0, 19.0, 23.0, 26.0, 22.0, 22.0, 36.0, 28.0, 25.0, 38.0, 26.0, 45.0, 38.0, 44.0, 31.0, 58.0, 38.0, 43.0, 39.0, 36.0, 34.0, 31.0, 25.0, 21.0, 19.0, 26.0, 25.0, 16.0, 18.0, 19.0, 13.0, 11.0, 7.0, 11.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010277628898620605, -0.0009970394894480705, -0.0009663160890340805, -0.0009355926886200905, -0.0009048692882061005, -0.0008741458877921104, -0.0008434224873781204, -0.0008126990869641304, -0.0007819756865501404, -0.0007512522861361504, -0.0007205288857221603, -0.0006898054853081703, -0.0006590820848941803, -0.0006283586844801903, -0.0005976352840662003, -0.0005669118836522102, -0.0005361884832382202, -0.0005054650828242302, -0.0004747416824102402, -0.00044401828199625015, -0.00041329488158226013, -0.0003825714811682701, -0.0003518480807542801, -0.00032112468034029007, -0.00029040127992630005, -0.00025967787951231003, -0.00022895447909832, -0.00019823107868433, -0.00016750767827033997, -0.00013678427785634995, -0.00010606087744235992, -7.53374770283699e-05, -4.461407661437988e-05, -1.3890676200389862e-05, 1.683272421360016e-05, 4.755612462759018e-05, 7.82795250415802e-05, 0.00010900292545557022, 0.00013972632586956024, 0.00017044972628355026, 0.00020117312669754028, 0.0002318965271115303, 0.0002626199275255203, 0.00029334332793951035, 0.00032406672835350037, 0.0003547901287674904, 0.0003855135291814804, 0.00041623692959547043, 0.00044696033000946045, 0.00047768373042345047, 0.0005084071308374405, 0.0005391305312514305, 0.0005698539316654205, 0.0006005773320794106, 0.0006313007324934006, 0.0006620241329073906, 0.0006927475333213806, 0.0007234709337353706, 0.0007541943341493607, 0.0007849177345633507, 0.0008156411349773407, 0.0008463645353913307, 0.0008770879358053207, 0.0009078113362193108, 0.0009385347366333008]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 9.0, 3.0, 6.0, 9.0, 8.0, 15.0, 11.0, 17.0, 19.0, 23.0, 30.0, 31.0, 38.0, 46.0, 37.0, 50.0, 61.0, 50.0, 43.0, 52.0, 39.0, 40.0, 48.0, 46.0, 33.0, 40.0, 32.0, 27.0, 29.0, 22.0, 8.0, 17.0, 13.0, 12.0, 9.0, 8.0, 3.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0625, -7.8306884765625, -7.598876953125, -7.3670654296875, -7.13525390625, -6.9034423828125, -6.671630859375, -6.4398193359375, -6.2080078125, -5.9761962890625, -5.744384765625, -5.5125732421875, -5.28076171875, -5.0489501953125, -4.817138671875, -4.5853271484375, -4.353515625, -4.1217041015625, -3.889892578125, -3.6580810546875, -3.42626953125, -3.1944580078125, -2.962646484375, -2.7308349609375, -2.4990234375, -2.2672119140625, -2.035400390625, -1.8035888671875, -1.57177734375, -1.3399658203125, -1.108154296875, -0.8763427734375, -0.64453125, -0.4127197265625, -0.180908203125, 0.0509033203125, 0.28271484375, 0.5145263671875, 0.746337890625, 0.9781494140625, 1.2099609375, 1.4417724609375, 1.673583984375, 1.9053955078125, 2.13720703125, 2.3690185546875, 2.600830078125, 2.8326416015625, 3.064453125, 3.2962646484375, 3.528076171875, 3.7598876953125, 3.99169921875, 4.2235107421875, 4.455322265625, 4.6871337890625, 4.9189453125, 5.1507568359375, 5.382568359375, 5.6143798828125, 5.84619140625, 6.0780029296875, 6.309814453125, 6.5416259765625, 6.7734375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 5.0, 5.0, 8.0, 13.0, 25.0, 27.0, 35.0, 38.0, 60.0, 85.0, 119.0, 167.0, 293.0, 425.0, 719.0, 1277.0, 2302.0, 4534.0, 9128.0, 19500.0, 42975.0, 100814.0, 304362.0, 359391.0, 112466.0, 47488.0, 21500.0, 9897.0, 4857.0, 2558.0, 1278.0, 779.0, 489.0, 303.0, 161.0, 128.0, 90.0, 70.0, 58.0, 35.0, 22.0, 12.0, 20.0, 14.0, 2.0, 7.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4921875, -5.3309326171875, -5.169677734375, -5.0084228515625, -4.84716796875, -4.6859130859375, -4.524658203125, -4.3634033203125, -4.2021484375, -4.0408935546875, -3.879638671875, -3.7183837890625, -3.55712890625, -3.3958740234375, -3.234619140625, -3.0733642578125, -2.912109375, -2.7508544921875, -2.589599609375, -2.4283447265625, -2.26708984375, -2.1058349609375, -1.944580078125, -1.7833251953125, -1.6220703125, -1.4608154296875, -1.299560546875, -1.1383056640625, -0.97705078125, -0.8157958984375, -0.654541015625, -0.4932861328125, -0.33203125, -0.1707763671875, -0.009521484375, 0.1517333984375, 0.31298828125, 0.4742431640625, 0.635498046875, 0.7967529296875, 0.9580078125, 1.1192626953125, 1.280517578125, 1.4417724609375, 1.60302734375, 1.7642822265625, 1.925537109375, 2.0867919921875, 2.248046875, 2.4093017578125, 2.570556640625, 2.7318115234375, 2.89306640625, 3.0543212890625, 3.215576171875, 3.3768310546875, 3.5380859375, 3.6993408203125, 3.860595703125, 4.0218505859375, 4.18310546875, 4.3443603515625, 4.505615234375, 4.6668701171875, 4.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 6.0, 10.0, 8.0, 8.0, 13.0, 13.0, 16.0, 21.0, 23.0, 31.0, 40.0, 36.0, 37.0, 49.0, 41.0, 60.0, 82.0, 148.0, 1595.0, 280.0, 105.0, 69.0, 51.0, 52.0, 26.0, 35.0, 25.0, 20.0, 25.0, 22.0, 17.0, 15.0, 15.0, 14.0, 7.0, 5.0, 7.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-20.734375, -20.036865234375, -19.33935546875, -18.641845703125, -17.9443359375, -17.246826171875, -16.54931640625, -15.851806640625, -15.154296875, -14.456787109375, -13.75927734375, -13.061767578125, -12.3642578125, -11.666748046875, -10.96923828125, -10.271728515625, -9.57421875, -8.876708984375, -8.17919921875, -7.481689453125, -6.7841796875, -6.086669921875, -5.38916015625, -4.691650390625, -3.994140625, -3.296630859375, -2.59912109375, -1.901611328125, -1.2041015625, -0.506591796875, 0.19091796875, 0.888427734375, 1.5859375, 2.283447265625, 2.98095703125, 3.678466796875, 4.3759765625, 5.073486328125, 5.77099609375, 6.468505859375, 7.166015625, 7.863525390625, 8.56103515625, 9.258544921875, 9.9560546875, 10.653564453125, 11.35107421875, 12.048583984375, 12.74609375, 13.443603515625, 14.14111328125, 14.838623046875, 15.5361328125, 16.233642578125, 16.93115234375, 17.628662109375, 18.326171875, 19.023681640625, 19.72119140625, 20.418701171875, 21.1162109375, 21.813720703125, 22.51123046875, 23.208740234375, 23.90625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 3.0, 12.0, 14.0, 13.0, 30.0, 39.0, 47.0, 62.0, 90.0, 138.0, 225.0, 386.0, 1086.0, 52010.0, 3086167.0, 3844.0, 607.0, 321.0, 191.0, 128.0, 82.0, 68.0, 49.0, 22.0, 23.0, 16.0, 8.0, 7.0, 7.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.4375, -51.9921875, -49.546875, -47.1015625, -44.65625, -42.2109375, -39.765625, -37.3203125, -34.875, -32.4296875, -29.984375, -27.5390625, -25.09375, -22.6484375, -20.203125, -17.7578125, -15.3125, -12.8671875, -10.421875, -7.9765625, -5.53125, -3.0859375, -0.640625, 1.8046875, 4.25, 6.6953125, 9.140625, 11.5859375, 14.03125, 16.4765625, 18.921875, 21.3671875, 23.8125, 26.2578125, 28.703125, 31.1484375, 33.59375, 36.0390625, 38.484375, 40.9296875, 43.375, 45.8203125, 48.265625, 50.7109375, 53.15625, 55.6015625, 58.046875, 60.4921875, 62.9375, 65.3828125, 67.828125, 70.2734375, 72.71875, 75.1640625, 77.609375, 80.0546875, 82.5, 84.9453125, 87.390625, 89.8359375, 92.28125, 94.7265625, 97.171875, 99.6171875, 102.0625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 31.0, 282.0, 556.0, 134.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40947723388672, -31.1434268951416, -26.877376556396484, -22.611328125, -18.345277786254883, -14.079227447509766, -9.813179016113281, -5.547128677368164, -1.2810783386230469, 2.984971523284912, 7.251021385192871, 11.517070770263672, 15.783121109008789, 20.049171447753906, 24.31521987915039, 28.581270217895508, 32.847320556640625, 37.11336898803711, 41.37942123413086, 45.645469665527344, 49.911521911621094, 54.17757034301758, 58.44361877441406, 62.70967102050781, 66.97572326660156, 71.24177551269531, 75.50782012939453, 79.77387237548828, 84.03992462158203, 88.30596923828125, 92.572021484375, 96.83807373046875, 101.1041259765625, 105.37017822265625, 109.63622283935547, 113.90227508544922, 118.16832733154297, 122.43437194824219, 126.70042419433594, 130.9664764404297, 135.23252868652344, 139.4985809326172, 143.76463317871094, 148.03067016601562, 152.29672241210938, 156.56277465820312, 160.82882690429688, 165.09487915039062, 169.36093139648438, 173.62698364257812, 177.89303588867188, 182.15908813476562, 186.4251251220703, 190.69117736816406, 194.9572296142578, 199.22328186035156, 203.48931884765625, 207.75537109375, 212.02142333984375, 216.2874755859375, 220.5535125732422, 224.81956481933594, 229.0856170654297, 233.35166931152344, 237.6177215576172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 12.0, 13.0, 10.0, 16.0, 19.0, 24.0, 15.0, 20.0, 26.0, 22.0, 36.0, 24.0, 30.0, 29.0, 36.0, 40.0, 46.0, 48.0, 34.0, 46.0, 42.0, 34.0, 38.0, 39.0, 41.0, 28.0, 30.0, 31.0, 15.0, 15.0, 15.0, 29.0, 13.0, 14.0, 15.0, 7.0, 11.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.328643798828125, -56.432769775390625, -54.536895751953125, -52.64101791381836, -50.74514389038086, -48.84926986694336, -46.953392028808594, -45.057518005371094, -43.161643981933594, -41.265769958496094, -39.369895935058594, -37.47401809692383, -35.57814407348633, -33.68227005004883, -31.786394119262695, -29.890518188476562, -27.994644165039062, -26.098770141601562, -24.20289421081543, -22.307018280029297, -20.411144256591797, -18.515270233154297, -16.619394302368164, -14.723519325256348, -12.827644348144531, -10.931769371032715, -9.035894393920898, -7.140019416809082, -5.244144439697266, -3.348269462585449, -1.4523944854736328, 0.4434804916381836, 2.33935546875, 4.235230445861816, 6.131105422973633, 8.02698040008545, 9.922855377197266, 11.818730354309082, 13.714605331420898, 15.610480308532715, 17.50635528564453, 19.40222930908203, 21.298105239868164, 23.193981170654297, 25.089855194091797, 26.985729217529297, 28.88160514831543, 30.777481079101562, 32.67335510253906, 34.56922912597656, 36.46510314941406, 38.36098098754883, 40.25685501098633, 42.15272903442383, 44.048606872558594, 45.944480895996094, 47.840354919433594, 49.736228942871094, 51.632102966308594, 53.52798080444336, 55.42385482788086, 57.31972885131836, 59.215606689453125, 61.111480712890625, 63.007354736328125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 5.0, 12.0, 16.0, 15.0, 16.0, 13.0, 23.0, 28.0, 28.0, 35.0, 34.0, 36.0, 62.0, 50.0, 51.0, 41.0, 46.0, 45.0, 48.0, 49.0, 43.0, 48.0, 30.0, 29.0, 29.0, 38.0, 20.0, 23.0, 18.0, 12.0, 9.0, 7.0, 5.0, 6.0, 1.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2896728515625, -8.040283203125, -7.7908935546875, -7.54150390625, -7.2921142578125, -7.042724609375, -6.7933349609375, -6.5439453125, -6.2945556640625, -6.045166015625, -5.7957763671875, -5.54638671875, -5.2969970703125, -5.047607421875, -4.7982177734375, -4.548828125, -4.2994384765625, -4.050048828125, -3.8006591796875, -3.55126953125, -3.3018798828125, -3.052490234375, -2.8031005859375, -2.5537109375, -2.3043212890625, -2.054931640625, -1.8055419921875, -1.55615234375, -1.3067626953125, -1.057373046875, -0.8079833984375, -0.55859375, -0.3092041015625, -0.059814453125, 0.1895751953125, 0.43896484375, 0.6883544921875, 0.937744140625, 1.1871337890625, 1.4365234375, 1.6859130859375, 1.935302734375, 2.1846923828125, 2.43408203125, 2.6834716796875, 2.932861328125, 3.1822509765625, 3.431640625, 3.6810302734375, 3.930419921875, 4.1798095703125, 4.42919921875, 4.6785888671875, 4.927978515625, 5.1773681640625, 5.4267578125, 5.6761474609375, 5.925537109375, 6.1749267578125, 6.42431640625, 6.6737060546875, 6.923095703125, 7.1724853515625, 7.421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 6.0, 7.0, 14.0, 18.0, 19.0, 16.0, 18.0, 18.0, 32.0, 46.0, 57.0, 141.0, 338.0, 1243.0, 8945.0, 379451.0, 3636256.0, 160926.0, 5274.0, 842.0, 245.0, 78.0, 55.0, 33.0, 37.0, 40.0, 18.0, 20.0, 19.0, 14.0, 9.0, 5.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -30.25390625, -29.3203125, -28.38671875, -27.453125, -26.51953125, -25.5859375, -24.65234375, -23.71875, -22.78515625, -21.8515625, -20.91796875, -19.984375, -19.05078125, -18.1171875, -17.18359375, -16.25, -15.31640625, -14.3828125, -13.44921875, -12.515625, -11.58203125, -10.6484375, -9.71484375, -8.78125, -7.84765625, -6.9140625, -5.98046875, -5.046875, -4.11328125, -3.1796875, -2.24609375, -1.3125, -0.37890625, 0.5546875, 1.48828125, 2.421875, 3.35546875, 4.2890625, 5.22265625, 6.15625, 7.08984375, 8.0234375, 8.95703125, 9.890625, 10.82421875, 11.7578125, 12.69140625, 13.625, 14.55859375, 15.4921875, 16.42578125, 17.359375, 18.29296875, 19.2265625, 20.16015625, 21.09375, 22.02734375, 22.9609375, 23.89453125, 24.828125, 25.76171875, 26.6953125, 27.62890625, 28.5625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 11.0, 20.0, 51.0, 54.0, 85.0, 115.0, 198.0, 259.0, 404.0, 514.0, 614.0, 495.0, 407.0, 265.0, 162.0, 127.0, 86.0, 52.0, 45.0, 23.0, 15.0, 15.0, 9.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.578125, -17.020263671875, -16.46240234375, -15.904541015625, -15.3466796875, -14.788818359375, -14.23095703125, -13.673095703125, -13.115234375, -12.557373046875, -11.99951171875, -11.441650390625, -10.8837890625, -10.325927734375, -9.76806640625, -9.210205078125, -8.65234375, -8.094482421875, -7.53662109375, -6.978759765625, -6.4208984375, -5.863037109375, -5.30517578125, -4.747314453125, -4.189453125, -3.631591796875, -3.07373046875, -2.515869140625, -1.9580078125, -1.400146484375, -0.84228515625, -0.284423828125, 0.2734375, 0.831298828125, 1.38916015625, 1.947021484375, 2.5048828125, 3.062744140625, 3.62060546875, 4.178466796875, 4.736328125, 5.294189453125, 5.85205078125, 6.409912109375, 6.9677734375, 7.525634765625, 8.08349609375, 8.641357421875, 9.19921875, 9.757080078125, 10.31494140625, 10.872802734375, 11.4306640625, 11.988525390625, 12.54638671875, 13.104248046875, 13.662109375, 14.219970703125, 14.77783203125, 15.335693359375, 15.8935546875, 16.451416015625, 17.00927734375, 17.567138671875, 18.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 6.0, 4.0, 9.0, 13.0, 18.0, 19.0, 32.0, 46.0, 58.0, 56.0, 101.0, 124.0, 162.0, 205.0, 318.0, 653.0, 3065.0, 275106.0, 3891356.0, 20363.0, 1137.0, 432.0, 250.0, 204.0, 146.0, 100.0, 78.0, 53.0, 31.0, 29.0, 37.0, 21.0, 10.0, 9.0, 10.0, 4.0, 5.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.96875, -57.0830078125, -55.197265625, -53.3115234375, -51.42578125, -49.5400390625, -47.654296875, -45.7685546875, -43.8828125, -41.9970703125, -40.111328125, -38.2255859375, -36.33984375, -34.4541015625, -32.568359375, -30.6826171875, -28.796875, -26.9111328125, -25.025390625, -23.1396484375, -21.25390625, -19.3681640625, -17.482421875, -15.5966796875, -13.7109375, -11.8251953125, -9.939453125, -8.0537109375, -6.16796875, -4.2822265625, -2.396484375, -0.5107421875, 1.375, 3.2607421875, 5.146484375, 7.0322265625, 8.91796875, 10.8037109375, 12.689453125, 14.5751953125, 16.4609375, 18.3466796875, 20.232421875, 22.1181640625, 24.00390625, 25.8896484375, 27.775390625, 29.6611328125, 31.546875, 33.4326171875, 35.318359375, 37.2041015625, 39.08984375, 40.9755859375, 42.861328125, 44.7470703125, 46.6328125, 48.5185546875, 50.404296875, 52.2900390625, 54.17578125, 56.0615234375, 57.947265625, 59.8330078125, 61.71875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 131.0, 712.0, 168.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-400.0184631347656, -386.9118347167969, -373.80523681640625, -360.6986083984375, -347.5920104980469, -334.4853820800781, -321.3787841796875, -308.27215576171875, -295.16552734375, -282.05889892578125, -268.9523010253906, -255.84567260742188, -242.7390594482422, -229.6324462890625, -216.5258331298828, -203.41921997070312, -190.31260681152344, -177.20599365234375, -164.09938049316406, -150.99276733398438, -137.88613891601562, -124.77952575683594, -111.67291259765625, -98.56629180908203, -85.45967864990234, -72.35306549072266, -59.24644470214844, -46.13983154296875, -33.0332145690918, -19.926597595214844, -6.819984436035156, 6.2866363525390625, 19.39324951171875, 32.4998664855957, 45.606483459472656, 58.713096618652344, 71.81971740722656, 84.92633056640625, 98.03294372558594, 111.13956451416016, 124.24617767333984, 137.35279846191406, 150.45941162109375, 163.56602478027344, 176.67263793945312, 189.77926635742188, 202.8858642578125, 215.99249267578125, 229.09910583496094, 242.20571899414062, 255.3123321533203, 268.4189453125, 281.52557373046875, 294.6322021484375, 307.7388000488281, 320.8454284667969, 333.9520263671875, 347.05865478515625, 360.1652526855469, 373.2718811035156, 386.37847900390625, 399.485107421875, 412.59173583984375, 425.6983337402344, 438.8049621582031]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 4.0, 5.0, 6.0, 9.0, 14.0, 15.0, 14.0, 18.0, 20.0, 26.0, 18.0, 20.0, 26.0, 27.0, 34.0, 38.0, 37.0, 32.0, 35.0, 33.0, 50.0, 33.0, 35.0, 42.0, 35.0, 29.0, 36.0, 25.0, 36.0, 34.0, 17.0, 33.0, 26.0, 23.0, 21.0, 23.0, 9.0, 8.0, 10.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-43.46864318847656, -42.09502029418945, -40.72139358520508, -39.34777069091797, -37.97414779663086, -36.600521087646484, -35.226898193359375, -33.853271484375, -32.47964859008789, -31.10602378845215, -29.73240089416504, -28.358776092529297, -26.985151290893555, -25.611526489257812, -24.237903594970703, -22.86427879333496, -21.49065589904785, -20.11703109741211, -18.743408203125, -17.369783401489258, -15.996158599853516, -14.62253475189209, -13.248910903930664, -11.875286102294922, -10.501662254333496, -9.12803840637207, -7.754413604736328, -6.380789756774902, -5.007165431976318, -3.6335411071777344, -2.2599172592163086, -0.8862924575805664, 0.4873313903808594, 1.8609555959701538, 3.2345798015594482, 4.608203887939453, 5.981828212738037, 7.355452537536621, 8.729076385498047, 10.102701187133789, 11.476325035095215, 12.84994888305664, 14.223573684692383, 15.597197532653809, 16.970821380615234, 18.344446182250977, 19.71807098388672, 21.091693878173828, 22.46531867980957, 23.838943481445312, 25.212566375732422, 26.586191177368164, 27.959815979003906, 29.333438873291016, 30.707063674926758, 32.0806884765625, 33.45431137084961, 34.82793426513672, 36.201560974121094, 37.5751838684082, 38.94880676269531, 40.32243347167969, 41.6960563659668, 43.069679260253906, 44.44330596923828]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 22.0, 10.0, 22.0, 25.0, 25.0, 25.0, 28.0, 38.0, 29.0, 37.0, 47.0, 58.0, 34.0, 41.0, 35.0, 54.0, 54.0, 45.0, 37.0, 46.0, 31.0, 27.0, 35.0, 24.0, 25.0, 22.0, 15.0, 15.0, 10.0, 11.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.771484375, -6.546875, -6.322265625, -6.09765625, -5.873046875, -5.6484375, -5.423828125, -5.19921875, -4.974609375, -4.75, -4.525390625, -4.30078125, -4.076171875, -3.8515625, -3.626953125, -3.40234375, -3.177734375, -2.953125, -2.728515625, -2.50390625, -2.279296875, -2.0546875, -1.830078125, -1.60546875, -1.380859375, -1.15625, -0.931640625, -0.70703125, -0.482421875, -0.2578125, -0.033203125, 0.19140625, 0.416015625, 0.640625, 0.865234375, 1.08984375, 1.314453125, 1.5390625, 1.763671875, 1.98828125, 2.212890625, 2.4375, 2.662109375, 2.88671875, 3.111328125, 3.3359375, 3.560546875, 3.78515625, 4.009765625, 4.234375, 4.458984375, 4.68359375, 4.908203125, 5.1328125, 5.357421875, 5.58203125, 5.806640625, 6.03125, 6.255859375, 6.48046875, 6.705078125, 6.9296875, 7.154296875, 7.37890625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 12.0, 12.0, 16.0, 29.0, 42.0, 66.0, 90.0, 114.0, 194.0, 325.0, 385.0, 598.0, 932.0, 1371.0, 2032.0, 3006.0, 4805.0, 7178.0, 10951.0, 17592.0, 28411.0, 47938.0, 86745.0, 170054.0, 268211.0, 176793.0, 90873.0, 50007.0, 28951.0, 17878.0, 11301.0, 7340.0, 4805.0, 3142.0, 2086.0, 1357.0, 955.0, 645.0, 423.0, 288.0, 189.0, 136.0, 76.0, 66.0, 37.0, 24.0, 21.0, 25.0, 6.0, 6.0, 7.0, 0.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.013671875, -0.9815216064453125, -0.949371337890625, -0.9172210693359375, -0.88507080078125, -0.8529205322265625, -0.820770263671875, -0.7886199951171875, -0.7564697265625, -0.7243194580078125, -0.692169189453125, -0.6600189208984375, -0.62786865234375, -0.5957183837890625, -0.563568115234375, -0.5314178466796875, -0.499267578125, -0.4671173095703125, -0.434967041015625, -0.4028167724609375, -0.37066650390625, -0.3385162353515625, -0.306365966796875, -0.2742156982421875, -0.2420654296875, -0.2099151611328125, -0.177764892578125, -0.1456146240234375, -0.11346435546875, -0.0813140869140625, -0.049163818359375, -0.0170135498046875, 0.01513671875, 0.0472869873046875, 0.079437255859375, 0.1115875244140625, 0.14373779296875, 0.1758880615234375, 0.208038330078125, 0.2401885986328125, 0.2723388671875, 0.3044891357421875, 0.336639404296875, 0.3687896728515625, 0.40093994140625, 0.4330902099609375, 0.465240478515625, 0.4973907470703125, 0.529541015625, 0.5616912841796875, 0.593841552734375, 0.6259918212890625, 0.65814208984375, 0.6902923583984375, 0.722442626953125, 0.7545928955078125, 0.7867431640625, 0.8188934326171875, 0.851043701171875, 0.8831939697265625, 0.91534423828125, 0.9474945068359375, 0.979644775390625, 1.0117950439453125, 1.0439453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 15.0, 9.0, 20.0, 19.0, 19.0, 13.0, 33.0, 32.0, 41.0, 33.0, 40.0, 49.0, 60.0, 52.0, 50.0, 1066.0, 42.0, 45.0, 47.0, 46.0, 40.0, 23.0, 27.0, 38.0, 28.0, 23.0, 26.0, 17.0, 15.0, 9.0, 4.0, 7.0, 4.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.39080810546875, -4.2347412109375, -4.07867431640625, -3.922607421875, -3.76654052734375, -3.6104736328125, -3.45440673828125, -3.29833984375, -3.14227294921875, -2.9862060546875, -2.83013916015625, -2.674072265625, -2.51800537109375, -2.3619384765625, -2.20587158203125, -2.0498046875, -1.89373779296875, -1.7376708984375, -1.58160400390625, -1.425537109375, -1.26947021484375, -1.1134033203125, -0.95733642578125, -0.80126953125, -0.64520263671875, -0.4891357421875, -0.33306884765625, -0.177001953125, -0.02093505859375, 0.1351318359375, 0.29119873046875, 0.447265625, 0.60333251953125, 0.7593994140625, 0.91546630859375, 1.071533203125, 1.22760009765625, 1.3836669921875, 1.53973388671875, 1.69580078125, 1.85186767578125, 2.0079345703125, 2.16400146484375, 2.320068359375, 2.47613525390625, 2.6322021484375, 2.78826904296875, 2.9443359375, 3.10040283203125, 3.2564697265625, 3.41253662109375, 3.568603515625, 3.72467041015625, 3.8807373046875, 4.03680419921875, 4.19287109375, 4.34893798828125, 4.5050048828125, 4.66107177734375, 4.817138671875, 4.97320556640625, 5.1292724609375, 5.28533935546875, 5.44140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 7.0, 16.0, 12.0, 27.0, 33.0, 42.0, 84.0, 110.0, 166.0, 242.0, 390.0, 641.0, 915.0, 1405.0, 2234.0, 3559.0, 5618.0, 9217.0, 15619.0, 26462.0, 45356.0, 79990.0, 152430.0, 1307931.0, 200672.0, 104155.0, 57037.0, 32956.0, 19408.0, 11458.0, 7003.0, 4331.0, 2739.0, 1741.0, 1076.0, 707.0, 462.0, 307.0, 196.0, 104.0, 108.0, 47.0, 42.0, 34.0, 15.0, 3.0, 9.0, 6.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.85400390625, -0.8261947631835938, -0.7983856201171875, -0.7705764770507812, -0.742767333984375, -0.7149581909179688, -0.6871490478515625, -0.6593399047851562, -0.63153076171875, -0.6037216186523438, -0.5759124755859375, -0.5481033325195312, -0.520294189453125, -0.49248504638671875, -0.4646759033203125, -0.43686676025390625, -0.4090576171875, -0.38124847412109375, -0.3534393310546875, -0.32563018798828125, -0.297821044921875, -0.27001190185546875, -0.2422027587890625, -0.21439361572265625, -0.18658447265625, -0.15877532958984375, -0.1309661865234375, -0.10315704345703125, -0.075347900390625, -0.04753875732421875, -0.0197296142578125, 0.00807952880859375, 0.035888671875, 0.06369781494140625, 0.0915069580078125, 0.11931610107421875, 0.147125244140625, 0.17493438720703125, 0.2027435302734375, 0.23055267333984375, 0.25836181640625, 0.28617095947265625, 0.3139801025390625, 0.34178924560546875, 0.369598388671875, 0.39740753173828125, 0.4252166748046875, 0.45302581787109375, 0.4808349609375, 0.5086441040039062, 0.5364532470703125, 0.5642623901367188, 0.592071533203125, 0.6198806762695312, 0.6476898193359375, 0.6754989624023438, 0.70330810546875, 0.7311172485351562, 0.7589263916015625, 0.7867355346679688, 0.814544677734375, 0.8423538208007812, 0.8701629638671875, 0.8979721069335938, 0.92578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 11.0, 16.0, 20.0, 14.0, 29.0, 38.0, 35.0, 44.0, 46.0, 46.0, 65.0, 54.0, 55.0, 70.0, 69.0, 58.0, 60.0, 42.0, 44.0, 34.0, 25.0, 18.0, 17.0, 11.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0029659271240234375, -0.002886861562728882, -0.002807796001434326, -0.0027287304401397705, -0.002649664878845215, -0.002570599317550659, -0.0024915337562561035, -0.002412468194961548, -0.002333402633666992, -0.0022543370723724365, -0.002175271511077881, -0.002096205949783325, -0.0020171403884887695, -0.0019380748271942139, -0.0018590092658996582, -0.0017799437046051025, -0.0017008781433105469, -0.0016218125820159912, -0.0015427470207214355, -0.0014636814594268799, -0.0013846158981323242, -0.0013055503368377686, -0.0012264847755432129, -0.0011474192142486572, -0.0010683536529541016, -0.000989288091659546, -0.0009102225303649902, -0.0008311569690704346, -0.0007520914077758789, -0.0006730258464813232, -0.0005939602851867676, -0.0005148947238922119, -0.00043582916259765625, -0.0003567636013031006, -0.0002776980400085449, -0.00019863247871398926, -0.0001195669174194336, -4.050135612487793e-05, 3.8564205169677734e-05, 0.0001176297664642334, 0.00019669532775878906, 0.0002757608890533447, 0.0003548264503479004, 0.00043389201164245605, 0.0005129575729370117, 0.0005920231342315674, 0.000671088695526123, 0.0007501542568206787, 0.0008292198181152344, 0.00090828537940979, 0.0009873509407043457, 0.0010664165019989014, 0.001145482063293457, 0.0012245476245880127, 0.0013036131858825684, 0.001382678747177124, 0.0014617443084716797, 0.0015408098697662354, 0.001619875431060791, 0.0016989409923553467, 0.0017780065536499023, 0.001857072114944458, 0.0019361376762390137, 0.0020152032375335693, 0.002094268798828125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 6.0, 3.0, 10.0, 16.0, 19.0, 18.0, 25.0, 40.0, 61.0, 69.0, 113.0, 146.0, 332.0, 1001.0, 124840.0, 919193.0, 1609.0, 431.0, 188.0, 101.0, 74.0, 60.0, 46.0, 33.0, 26.0, 17.0, 12.0, 10.0, 17.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050537109375, -0.04874134063720703, -0.04694557189941406, -0.045149803161621094, -0.043354034423828125, -0.041558265686035156, -0.03976249694824219, -0.03796672821044922, -0.03617095947265625, -0.03437519073486328, -0.03257942199707031, -0.030783653259277344, -0.028987884521484375, -0.027192115783691406, -0.025396347045898438, -0.02360057830810547, -0.0218048095703125, -0.02000904083251953, -0.018213272094726562, -0.016417503356933594, -0.014621734619140625, -0.012825965881347656, -0.011030197143554688, -0.009234428405761719, -0.00743865966796875, -0.005642890930175781, -0.0038471221923828125, -0.0020513534545898438, -0.000255584716796875, 0.0015401840209960938, 0.0033359527587890625, 0.005131721496582031, 0.006927490234375, 0.008723258972167969, 0.010519027709960938, 0.012314796447753906, 0.014110565185546875, 0.015906333923339844, 0.017702102661132812, 0.01949787139892578, 0.02129364013671875, 0.02308940887451172, 0.024885177612304688, 0.026680946350097656, 0.028476715087890625, 0.030272483825683594, 0.03206825256347656, 0.03386402130126953, 0.0356597900390625, 0.03745555877685547, 0.03925132751464844, 0.041047096252441406, 0.042842864990234375, 0.044638633728027344, 0.04643440246582031, 0.04823017120361328, 0.05002593994140625, 0.05182170867919922, 0.05361747741699219, 0.055413246154785156, 0.057209014892578125, 0.059004783630371094, 0.06080055236816406, 0.06259632110595703, 0.06439208984375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 17.0, 124.0, 433.0, 360.0, 73.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.010284267365932465, -0.010106420144438744, -0.009928571991622448, -0.009750724770128727, -0.009572876617312431, -0.00939502939581871, -0.009217181243002415, -0.009039334021508694, -0.008861485868692398, -0.008683638647198677, -0.008505790494382381, -0.00832794327288866, -0.008150095120072365, -0.007972247898578644, -0.007794399745762348, -0.00761655205860734, -0.0074387043714523315, -0.007260856684297323, -0.007083008997142315, -0.006905161309987307, -0.006727313622832298, -0.00654946593567729, -0.006371618248522282, -0.006193770561367273, -0.006015923339873552, -0.005838075652718544, -0.005660227965563536, -0.005482380278408527, -0.005304532591253519, -0.005126684904098511, -0.004948837216943502, -0.004770989529788494, -0.0045931413769721985, -0.00441529368981719, -0.004237446002662182, -0.0040595983155071735, -0.0038817506283521652, -0.003703902941197157, -0.0035260552540421486, -0.0033482075668871403, -0.0031703601125627756, -0.0029925124254077673, -0.002814664738252759, -0.0026368170510977507, -0.0024589693639427423, -0.002281121676787734, -0.0021032742224633694, -0.0019254264188930392, -0.001747578731738031, -0.0015697310445830226, -0.0013918833574280143, -0.0012140357866883278, -0.0010361880995333195, -0.0008583403541706502, -0.0006804927252233028, -0.0005026450380682945, -0.0003247973509132862, -0.00014694967831019312, 3.0897994292899966e-05, 0.00020874565234407783, 0.00038659333949908614, 0.0005644410266540945, 0.0007422886556014419, 0.0009201363427564502, 0.0010979840299114585]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 1.0, 8.0, 5.0, 8.0, 16.0, 8.0, 4.0, 20.0, 20.0, 14.0, 22.0, 19.0, 23.0, 27.0, 30.0, 29.0, 33.0, 35.0, 40.0, 47.0, 44.0, 35.0, 41.0, 43.0, 44.0, 40.0, 39.0, 27.0, 33.0, 34.0, 28.0, 22.0, 21.0, 18.0, 17.0, 23.0, 16.0, 12.0, 9.0, 7.0, 11.0, 6.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0010445117950439453, -0.0010075448080897331, -0.0009705778211355209, -0.0009336108341813087, -0.0008966438472270966, -0.0008596768602728844, -0.0008227098733186722, -0.00078574288636446, -0.0007487758994102478, -0.0007118089124560356, -0.0006748419255018234, -0.0006378749385476112, -0.000600907951593399, -0.0005639409646391869, -0.0005269739776849747, -0.0004900069907307625, -0.0004530400037765503, -0.0004160730168223381, -0.0003791060298681259, -0.0003421390429139137, -0.00030517205595970154, -0.00026820506900548935, -0.00023123808205127716, -0.00019427109509706497, -0.00015730410814285278, -0.0001203371211886406, -8.33701342344284e-05, -4.640314728021622e-05, -9.436160326004028e-06, 2.753082662820816e-05, 6.449781358242035e-05, 0.00010146480053663254, 0.00013843178749084473, 0.00017539877444505692, 0.0002123657613992691, 0.0002493327483534813, 0.0002862997353076935, 0.00032326672226190567, 0.00036023370921611786, 0.00039720069617033005, 0.00043416768312454224, 0.0004711346700787544, 0.0005081016570329666, 0.0005450686439871788, 0.000582035630941391, 0.0006190026178956032, 0.0006559696048498154, 0.0006929365918040276, 0.0007299035787582397, 0.0007668705657124519, 0.0008038375526666641, 0.0008408045396208763, 0.0008777715265750885, 0.0009147385135293007, 0.0009517055004835129, 0.000988672487437725, 0.0010256394743919373, 0.0010626064613461494, 0.0010995734483003616, 0.0011365404352545738, 0.001173507422208786, 0.0012104744091629982, 0.0012474413961172104, 0.0012844083830714226, 0.0013213753700256348]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 5.0, 11.0, 5.0, 22.0, 10.0, 22.0, 25.0, 25.0, 25.0, 28.0, 37.0, 30.0, 37.0, 47.0, 57.0, 35.0, 41.0, 35.0, 54.0, 54.0, 45.0, 37.0, 46.0, 30.0, 28.0, 34.0, 25.0, 25.0, 22.0, 15.0, 15.0, 10.0, 11.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.99609375, -6.77154541015625, -6.5469970703125, -6.32244873046875, -6.097900390625, -5.87335205078125, -5.6488037109375, -5.42425537109375, -5.19970703125, -4.97515869140625, -4.7506103515625, -4.52606201171875, -4.301513671875, -4.07696533203125, -3.8524169921875, -3.62786865234375, -3.4033203125, -3.17877197265625, -2.9542236328125, -2.72967529296875, -2.505126953125, -2.28057861328125, -2.0560302734375, -1.83148193359375, -1.60693359375, -1.38238525390625, -1.1578369140625, -0.93328857421875, -0.708740234375, -0.48419189453125, -0.2596435546875, -0.03509521484375, 0.189453125, 0.41400146484375, 0.6385498046875, 0.86309814453125, 1.087646484375, 1.31219482421875, 1.5367431640625, 1.76129150390625, 1.98583984375, 2.21038818359375, 2.4349365234375, 2.65948486328125, 2.884033203125, 3.10858154296875, 3.3331298828125, 3.55767822265625, 3.7822265625, 4.00677490234375, 4.2313232421875, 4.45587158203125, 4.680419921875, 4.90496826171875, 5.1295166015625, 5.35406494140625, 5.57861328125, 5.80316162109375, 6.0277099609375, 6.25225830078125, 6.476806640625, 6.70135498046875, 6.9259033203125, 7.15045166015625, 7.375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 6.0, 10.0, 6.0, 8.0, 9.0, 22.0, 25.0, 24.0, 49.0, 73.0, 103.0, 140.0, 215.0, 317.0, 491.0, 781.0, 1210.0, 1960.0, 3402.0, 5850.0, 10314.0, 20166.0, 44728.0, 121303.0, 368936.0, 295138.0, 96451.0, 37142.0, 17281.0, 9292.0, 5130.0, 3029.0, 1770.0, 1135.0, 666.0, 461.0, 303.0, 175.0, 126.0, 78.0, 51.0, 51.0, 33.0, 28.0, 21.0, 19.0, 8.0, 9.0, 9.0, 5.0, 1.0, 2.0, 1.0], "bins": [-5.1875, -5.04296875, -4.8984375, -4.75390625, -4.609375, -4.46484375, -4.3203125, -4.17578125, -4.03125, -3.88671875, -3.7421875, -3.59765625, -3.453125, -3.30859375, -3.1640625, -3.01953125, -2.875, -2.73046875, -2.5859375, -2.44140625, -2.296875, -2.15234375, -2.0078125, -1.86328125, -1.71875, -1.57421875, -1.4296875, -1.28515625, -1.140625, -0.99609375, -0.8515625, -0.70703125, -0.5625, -0.41796875, -0.2734375, -0.12890625, 0.015625, 0.16015625, 0.3046875, 0.44921875, 0.59375, 0.73828125, 0.8828125, 1.02734375, 1.171875, 1.31640625, 1.4609375, 1.60546875, 1.75, 1.89453125, 2.0390625, 2.18359375, 2.328125, 2.47265625, 2.6171875, 2.76171875, 2.90625, 3.05078125, 3.1953125, 3.33984375, 3.484375, 3.62890625, 3.7734375, 3.91796875, 4.0625]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 5.0, 8.0, 14.0, 13.0, 20.0, 8.0, 24.0, 33.0, 24.0, 27.0, 42.0, 33.0, 47.0, 43.0, 68.0, 100.0, 418.0, 1501.0, 124.0, 62.0, 56.0, 49.0, 45.0, 35.0, 33.0, 31.0, 20.0, 24.0, 18.0, 18.0, 20.0, 11.0, 10.0, 7.0, 11.0, 6.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0], "bins": [-23.765625, -23.087158203125, -22.40869140625, -21.730224609375, -21.0517578125, -20.373291015625, -19.69482421875, -19.016357421875, -18.337890625, -17.659423828125, -16.98095703125, -16.302490234375, -15.6240234375, -14.945556640625, -14.26708984375, -13.588623046875, -12.91015625, -12.231689453125, -11.55322265625, -10.874755859375, -10.1962890625, -9.517822265625, -8.83935546875, -8.160888671875, -7.482421875, -6.803955078125, -6.12548828125, -5.447021484375, -4.7685546875, -4.090087890625, -3.41162109375, -2.733154296875, -2.0546875, -1.376220703125, -0.69775390625, -0.019287109375, 0.6591796875, 1.337646484375, 2.01611328125, 2.694580078125, 3.373046875, 4.051513671875, 4.72998046875, 5.408447265625, 6.0869140625, 6.765380859375, 7.44384765625, 8.122314453125, 8.80078125, 9.479248046875, 10.15771484375, 10.836181640625, 11.5146484375, 12.193115234375, 12.87158203125, 13.550048828125, 14.228515625, 14.906982421875, 15.58544921875, 16.263916015625, 16.9423828125, 17.620849609375, 18.29931640625, 18.977783203125, 19.65625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 14.0, 17.0, 30.0, 32.0, 56.0, 64.0, 89.0, 146.0, 208.0, 305.0, 537.0, 3038.0, 3095564.0, 43684.0, 817.0, 365.0, 248.0, 159.0, 93.0, 69.0, 50.0, 26.0, 24.0, 17.0, 7.0, 10.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.8125, -69.314453125, -66.81640625, -64.318359375, -61.8203125, -59.322265625, -56.82421875, -54.326171875, -51.828125, -49.330078125, -46.83203125, -44.333984375, -41.8359375, -39.337890625, -36.83984375, -34.341796875, -31.84375, -29.345703125, -26.84765625, -24.349609375, -21.8515625, -19.353515625, -16.85546875, -14.357421875, -11.859375, -9.361328125, -6.86328125, -4.365234375, -1.8671875, 0.630859375, 3.12890625, 5.626953125, 8.125, 10.623046875, 13.12109375, 15.619140625, 18.1171875, 20.615234375, 23.11328125, 25.611328125, 28.109375, 30.607421875, 33.10546875, 35.603515625, 38.1015625, 40.599609375, 43.09765625, 45.595703125, 48.09375, 50.591796875, 53.08984375, 55.587890625, 58.0859375, 60.583984375, 63.08203125, 65.580078125, 68.078125, 70.576171875, 73.07421875, 75.572265625, 78.0703125, 80.568359375, 83.06640625, 85.564453125, 88.0625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 7.0, 709.0, 298.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.23029327392578, -29.586578369140625, -21.94286346435547, -14.299150466918945, -6.655435562133789, 0.9882774353027344, 8.63199234008789, 16.275707244873047, 23.919422149658203, 31.56313705444336, 39.206851959228516, 46.850563049316406, 54.49427795410156, 62.13799285888672, 69.78170776367188, 77.42542266845703, 85.06913757324219, 92.71285247802734, 100.3565673828125, 108.00028228759766, 115.64399719238281, 123.28770446777344, 130.93142700195312, 138.57513427734375, 146.21885681152344, 153.86256408691406, 161.50628662109375, 169.14999389648438, 176.79371643066406, 184.4374237060547, 192.08114624023438, 199.724853515625, 207.3685760498047, 215.0122833251953, 222.656005859375, 230.29971313476562, 237.9434356689453, 245.58714294433594, 253.23086547851562, 260.87457275390625, 268.5182800292969, 276.1619873046875, 283.8056945800781, 291.4494323730469, 299.0931396484375, 306.7368469238281, 314.38055419921875, 322.0242919921875, 329.6679992675781, 337.31170654296875, 344.9554138183594, 352.5991516113281, 360.24285888671875, 367.8865661621094, 375.5302734375, 383.17401123046875, 390.8177185058594, 398.46142578125, 406.1051330566406, 413.7488708496094, 421.392578125, 429.0362854003906, 436.67999267578125, 444.32373046875, 451.9674377441406]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 13.0, 9.0, 12.0, 15.0, 13.0, 23.0, 16.0, 19.0, 23.0, 23.0, 31.0, 38.0, 35.0, 38.0, 40.0, 39.0, 40.0, 38.0, 48.0, 33.0, 31.0, 46.0, 38.0, 38.0, 34.0, 30.0, 35.0, 22.0, 21.0, 14.0, 17.0, 18.0, 12.0, 18.0, 12.0, 12.0, 7.0, 8.0, 4.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.44548797607422, -47.808387756347656, -46.171287536621094, -44.53418731689453, -42.89708709716797, -41.259986877441406, -39.622886657714844, -37.98578643798828, -36.34868621826172, -34.711585998535156, -33.074485778808594, -31.43738555908203, -29.80028533935547, -28.163185119628906, -26.526084899902344, -24.88898468017578, -23.25188446044922, -21.614784240722656, -19.977684020996094, -18.34058380126953, -16.70348358154297, -15.066383361816406, -13.429283142089844, -11.792182922363281, -10.155082702636719, -8.517982482910156, -6.880882263183594, -5.243782043457031, -3.6066818237304688, -1.9695816040039062, -0.33248138427734375, 1.3046188354492188, 2.9417190551757812, 4.578819274902344, 6.215919494628906, 7.853019714355469, 9.490119934082031, 11.127220153808594, 12.764320373535156, 14.401420593261719, 16.03852081298828, 17.675621032714844, 19.312721252441406, 20.94982147216797, 22.58692169189453, 24.224021911621094, 25.861122131347656, 27.49822235107422, 29.13532257080078, 30.772422790527344, 32.409523010253906, 34.04662322998047, 35.68372344970703, 37.320823669433594, 38.957923889160156, 40.59502410888672, 42.23212432861328, 43.869224548339844, 45.506324768066406, 47.14342498779297, 48.78052520751953, 50.417625427246094, 52.054725646972656, 53.69182586669922, 55.32892608642578]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 4.0, 5.0, 8.0, 7.0, 8.0, 13.0, 16.0, 21.0, 25.0, 25.0, 30.0, 36.0, 33.0, 36.0, 37.0, 31.0, 45.0, 41.0, 47.0, 51.0, 41.0, 45.0, 51.0, 38.0, 36.0, 41.0, 29.0, 30.0, 27.0, 25.0, 11.0, 18.0, 18.0, 14.0, 12.0, 6.0, 11.0, 4.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.42388916015625, -7.1915283203125, -6.95916748046875, -6.726806640625, -6.49444580078125, -6.2620849609375, -6.02972412109375, -5.79736328125, -5.56500244140625, -5.3326416015625, -5.10028076171875, -4.867919921875, -4.63555908203125, -4.4031982421875, -4.17083740234375, -3.9384765625, -3.70611572265625, -3.4737548828125, -3.24139404296875, -3.009033203125, -2.77667236328125, -2.5443115234375, -2.31195068359375, -2.07958984375, -1.84722900390625, -1.6148681640625, -1.38250732421875, -1.150146484375, -0.91778564453125, -0.6854248046875, -0.45306396484375, -0.220703125, 0.01165771484375, 0.2440185546875, 0.47637939453125, 0.708740234375, 0.94110107421875, 1.1734619140625, 1.40582275390625, 1.63818359375, 1.87054443359375, 2.1029052734375, 2.33526611328125, 2.567626953125, 2.79998779296875, 3.0323486328125, 3.26470947265625, 3.4970703125, 3.72943115234375, 3.9617919921875, 4.19415283203125, 4.426513671875, 4.65887451171875, 4.8912353515625, 5.12359619140625, 5.35595703125, 5.58831787109375, 5.8206787109375, 6.05303955078125, 6.285400390625, 6.51776123046875, 6.7501220703125, 6.98248291015625, 7.21484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 3.0, 7.0, 7.0, 11.0, 9.0, 12.0, 19.0, 20.0, 36.0, 25.0, 41.0, 84.0, 108.0, 208.0, 416.0, 1025.0, 3206.0, 16757.0, 250208.0, 2602015.0, 1237472.0, 72396.0, 7118.0, 1719.0, 631.0, 263.0, 140.0, 79.0, 55.0, 33.0, 23.0, 20.0, 19.0, 24.0, 11.0, 9.0, 8.0, 10.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.984375, -18.42236328125, -17.8603515625, -17.29833984375, -16.736328125, -16.17431640625, -15.6123046875, -15.05029296875, -14.48828125, -13.92626953125, -13.3642578125, -12.80224609375, -12.240234375, -11.67822265625, -11.1162109375, -10.55419921875, -9.9921875, -9.43017578125, -8.8681640625, -8.30615234375, -7.744140625, -7.18212890625, -6.6201171875, -6.05810546875, -5.49609375, -4.93408203125, -4.3720703125, -3.81005859375, -3.248046875, -2.68603515625, -2.1240234375, -1.56201171875, -1.0, -0.43798828125, 0.1240234375, 0.68603515625, 1.248046875, 1.81005859375, 2.3720703125, 2.93408203125, 3.49609375, 4.05810546875, 4.6201171875, 5.18212890625, 5.744140625, 6.30615234375, 6.8681640625, 7.43017578125, 7.9921875, 8.55419921875, 9.1162109375, 9.67822265625, 10.240234375, 10.80224609375, 11.3642578125, 11.92626953125, 12.48828125, 13.05029296875, 13.6123046875, 14.17431640625, 14.736328125, 15.29833984375, 15.8603515625, 16.42236328125, 16.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 10.0, 5.0, 9.0, 20.0, 29.0, 40.0, 80.0, 80.0, 106.0, 165.0, 224.0, 338.0, 428.0, 493.0, 528.0, 419.0, 315.0, 226.0, 155.0, 106.0, 88.0, 56.0, 38.0, 26.0, 23.0, 12.0, 16.0, 10.0, 3.0, 7.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.78125, -16.3271484375, -15.873046875, -15.4189453125, -14.96484375, -14.5107421875, -14.056640625, -13.6025390625, -13.1484375, -12.6943359375, -12.240234375, -11.7861328125, -11.33203125, -10.8779296875, -10.423828125, -9.9697265625, -9.515625, -9.0615234375, -8.607421875, -8.1533203125, -7.69921875, -7.2451171875, -6.791015625, -6.3369140625, -5.8828125, -5.4287109375, -4.974609375, -4.5205078125, -4.06640625, -3.6123046875, -3.158203125, -2.7041015625, -2.25, -1.7958984375, -1.341796875, -0.8876953125, -0.43359375, 0.0205078125, 0.474609375, 0.9287109375, 1.3828125, 1.8369140625, 2.291015625, 2.7451171875, 3.19921875, 3.6533203125, 4.107421875, 4.5615234375, 5.015625, 5.4697265625, 5.923828125, 6.3779296875, 6.83203125, 7.2861328125, 7.740234375, 8.1943359375, 8.6484375, 9.1025390625, 9.556640625, 10.0107421875, 10.46484375, 10.9189453125, 11.373046875, 11.8271484375, 12.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 12.0, 16.0, 29.0, 31.0, 36.0, 42.0, 57.0, 75.0, 87.0, 117.0, 146.0, 200.0, 301.0, 520.0, 1257.0, 21363.0, 3603105.0, 559970.0, 4623.0, 782.0, 402.0, 258.0, 181.0, 148.0, 109.0, 101.0, 60.0, 44.0, 41.0, 34.0, 24.0, 17.0, 14.0, 12.0, 11.0, 10.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.15625, -46.5927734375, -45.029296875, -43.4658203125, -41.90234375, -40.3388671875, -38.775390625, -37.2119140625, -35.6484375, -34.0849609375, -32.521484375, -30.9580078125, -29.39453125, -27.8310546875, -26.267578125, -24.7041015625, -23.140625, -21.5771484375, -20.013671875, -18.4501953125, -16.88671875, -15.3232421875, -13.759765625, -12.1962890625, -10.6328125, -9.0693359375, -7.505859375, -5.9423828125, -4.37890625, -2.8154296875, -1.251953125, 0.3115234375, 1.875, 3.4384765625, 5.001953125, 6.5654296875, 8.12890625, 9.6923828125, 11.255859375, 12.8193359375, 14.3828125, 15.9462890625, 17.509765625, 19.0732421875, 20.63671875, 22.2001953125, 23.763671875, 25.3271484375, 26.890625, 28.4541015625, 30.017578125, 31.5810546875, 33.14453125, 34.7080078125, 36.271484375, 37.8349609375, 39.3984375, 40.9619140625, 42.525390625, 44.0888671875, 45.65234375, 47.2158203125, 48.779296875, 50.3427734375, 51.90625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 14.0, 41.0, 77.0, 124.0, 179.0, 191.0, 168.0, 110.0, 60.0, 24.0, 14.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-143.77023315429688, -140.96571350097656, -138.1612091064453, -135.356689453125, -132.55218505859375, -129.74766540527344, -126.94316101074219, -124.1386489868164, -121.33413696289062, -118.52962493896484, -115.72511291503906, -112.92060089111328, -110.1160888671875, -107.31157684326172, -104.50706481933594, -101.70255279541016, -98.89804077148438, -96.0935287475586, -93.28901672363281, -90.48450469970703, -87.67999267578125, -84.87548065185547, -82.07096862792969, -79.2664566040039, -76.4619369506836, -73.65742492675781, -70.85291290283203, -68.04840087890625, -65.24388885498047, -62.43937683105469, -59.634864807128906, -56.830352783203125, -54.02584457397461, -51.22133255004883, -48.41682052612305, -45.612308502197266, -42.807796478271484, -40.0032844543457, -37.198768615722656, -34.394256591796875, -31.589746475219727, -28.785234451293945, -25.980722427368164, -23.17620849609375, -20.37169647216797, -17.567184448242188, -14.762672424316406, -11.958160400390625, -9.153648376464844, -6.3491363525390625, -3.544623851776123, -0.7401113510131836, 2.0644006729125977, 4.868912696838379, 7.673425674438477, 10.477937698364258, 13.282449722290039, 16.08696174621582, 18.8914737701416, 21.695987701416016, 24.500499725341797, 27.305011749267578, 30.10952377319336, 32.91403579711914, 35.71854782104492]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 6.0, 6.0, 11.0, 11.0, 17.0, 11.0, 20.0, 21.0, 24.0, 23.0, 26.0, 33.0, 35.0, 42.0, 33.0, 37.0, 46.0, 37.0, 38.0, 40.0, 55.0, 40.0, 39.0, 45.0, 34.0, 34.0, 23.0, 17.0, 24.0, 23.0, 20.0, 22.0, 18.0, 12.0, 15.0, 13.0, 10.0, 4.0, 6.0, 3.0, 13.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-39.9771728515625, -38.68795394897461, -37.39873123168945, -36.10951232910156, -34.820289611816406, -33.531070709228516, -32.241851806640625, -30.9526309967041, -29.663410186767578, -28.374189376831055, -27.08496856689453, -25.79574966430664, -24.506528854370117, -23.217308044433594, -21.928089141845703, -20.63886833190918, -19.349647521972656, -18.060426712036133, -16.77120590209961, -15.481986999511719, -14.192766189575195, -12.903545379638672, -11.614325523376465, -10.325105667114258, -9.035884857177734, -7.746664524078369, -6.457444190979004, -5.168223857879639, -3.8790035247802734, -2.589783191680908, -1.300562858581543, -0.011343002319335938, 1.2778778076171875, 2.5670981407165527, 3.856318473815918, 5.145538806915283, 6.434759140014648, 7.723979473114014, 9.013199806213379, 10.302419662475586, 11.59164047241211, 12.880861282348633, 14.17008113861084, 15.459300994873047, 16.74852180480957, 18.037742614746094, 19.326961517333984, 20.616182327270508, 21.90540313720703, 23.194623947143555, 24.483844757080078, 25.77306365966797, 27.062284469604492, 28.351505279541016, 29.640724182128906, 30.92994499206543, 32.21916580200195, 33.508384704589844, 34.797607421875, 36.08682632446289, 37.37604522705078, 38.66526794433594, 39.95448684692383, 41.24370574951172, 42.532928466796875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 23.0, 17.0, 15.0, 14.0, 24.0, 27.0, 25.0, 42.0, 36.0, 34.0, 40.0, 42.0, 47.0, 39.0, 51.0, 40.0, 48.0, 47.0, 41.0, 46.0, 36.0, 32.0, 33.0, 23.0, 26.0, 22.0, 10.0, 21.0, 15.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2734375, -7.04705810546875, -6.8206787109375, -6.59429931640625, -6.367919921875, -6.14154052734375, -5.9151611328125, -5.68878173828125, -5.46240234375, -5.23602294921875, -5.0096435546875, -4.78326416015625, -4.556884765625, -4.33050537109375, -4.1041259765625, -3.87774658203125, -3.6513671875, -3.42498779296875, -3.1986083984375, -2.97222900390625, -2.745849609375, -2.51947021484375, -2.2930908203125, -2.06671142578125, -1.84033203125, -1.61395263671875, -1.3875732421875, -1.16119384765625, -0.934814453125, -0.70843505859375, -0.4820556640625, -0.25567626953125, -0.029296875, 0.19708251953125, 0.4234619140625, 0.64984130859375, 0.876220703125, 1.10260009765625, 1.3289794921875, 1.55535888671875, 1.78173828125, 2.00811767578125, 2.2344970703125, 2.46087646484375, 2.687255859375, 2.91363525390625, 3.1400146484375, 3.36639404296875, 3.5927734375, 3.81915283203125, 4.0455322265625, 4.27191162109375, 4.498291015625, 4.72467041015625, 4.9510498046875, 5.17742919921875, 5.40380859375, 5.63018798828125, 5.8565673828125, 6.08294677734375, 6.309326171875, 6.53570556640625, 6.7620849609375, 6.98846435546875, 7.21484375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 15.0, 20.0, 39.0, 47.0, 64.0, 104.0, 149.0, 227.0, 367.0, 597.0, 1016.0, 1653.0, 2657.0, 4565.0, 7797.0, 13340.0, 23410.0, 42577.0, 85791.0, 200466.0, 331554.0, 169827.0, 73874.0, 37940.0, 20965.0, 12132.0, 6989.0, 4117.0, 2376.0, 1490.0, 933.0, 532.0, 324.0, 216.0, 107.0, 89.0, 60.0, 43.0, 27.0, 17.0, 17.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.32421875, -1.284576416015625, -1.24493408203125, -1.205291748046875, -1.1656494140625, -1.126007080078125, -1.08636474609375, -1.046722412109375, -1.007080078125, -0.967437744140625, -0.92779541015625, -0.888153076171875, -0.8485107421875, -0.808868408203125, -0.76922607421875, -0.729583740234375, -0.68994140625, -0.650299072265625, -0.61065673828125, -0.571014404296875, -0.5313720703125, -0.491729736328125, -0.45208740234375, -0.412445068359375, -0.372802734375, -0.333160400390625, -0.29351806640625, -0.253875732421875, -0.2142333984375, -0.174591064453125, -0.13494873046875, -0.095306396484375, -0.0556640625, -0.016021728515625, 0.02362060546875, 0.063262939453125, 0.1029052734375, 0.142547607421875, 0.18218994140625, 0.221832275390625, 0.261474609375, 0.301116943359375, 0.34075927734375, 0.380401611328125, 0.4200439453125, 0.459686279296875, 0.49932861328125, 0.538970947265625, 0.57861328125, 0.618255615234375, 0.65789794921875, 0.697540283203125, 0.7371826171875, 0.776824951171875, 0.81646728515625, 0.856109619140625, 0.895751953125, 0.935394287109375, 0.97503662109375, 1.014678955078125, 1.0543212890625, 1.093963623046875, 1.13360595703125, 1.173248291015625, 1.212890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 4.0, 8.0, 10.0, 17.0, 13.0, 17.0, 26.0, 23.0, 30.0, 29.0, 35.0, 39.0, 44.0, 58.0, 44.0, 57.0, 1071.0, 63.0, 30.0, 45.0, 49.0, 35.0, 44.0, 27.0, 30.0, 32.0, 31.0, 21.0, 14.0, 14.0, 17.0, 12.0, 6.0, 4.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.1788330078125, -5.025634765625, -4.8724365234375, -4.71923828125, -4.5660400390625, -4.412841796875, -4.2596435546875, -4.1064453125, -3.9532470703125, -3.800048828125, -3.6468505859375, -3.49365234375, -3.3404541015625, -3.187255859375, -3.0340576171875, -2.880859375, -2.7276611328125, -2.574462890625, -2.4212646484375, -2.26806640625, -2.1148681640625, -1.961669921875, -1.8084716796875, -1.6552734375, -1.5020751953125, -1.348876953125, -1.1956787109375, -1.04248046875, -0.8892822265625, -0.736083984375, -0.5828857421875, -0.4296875, -0.2764892578125, -0.123291015625, 0.0299072265625, 0.18310546875, 0.3363037109375, 0.489501953125, 0.6427001953125, 0.7958984375, 0.9490966796875, 1.102294921875, 1.2554931640625, 1.40869140625, 1.5618896484375, 1.715087890625, 1.8682861328125, 2.021484375, 2.1746826171875, 2.327880859375, 2.4810791015625, 2.63427734375, 2.7874755859375, 2.940673828125, 3.0938720703125, 3.2470703125, 3.4002685546875, 3.553466796875, 3.7066650390625, 3.85986328125, 4.0130615234375, 4.166259765625, 4.3194580078125, 4.47265625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 9.0, 18.0, 13.0, 20.0, 38.0, 57.0, 97.0, 131.0, 210.0, 293.0, 406.0, 636.0, 859.0, 1225.0, 1899.0, 2701.0, 3960.0, 5985.0, 8940.0, 13788.0, 21232.0, 33347.0, 54337.0, 92945.0, 166896.0, 1286126.0, 163465.0, 90705.0, 52642.0, 32753.0, 20920.0, 13602.0, 8762.0, 5767.0, 3841.0, 2620.0, 1815.0, 1264.0, 826.0, 649.0, 426.0, 284.0, 207.0, 126.0, 105.0, 51.0, 40.0, 26.0, 29.0, 17.0, 7.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.75244140625, -0.7285385131835938, -0.7046356201171875, -0.6807327270507812, -0.656829833984375, -0.6329269409179688, -0.6090240478515625, -0.5851211547851562, -0.56121826171875, -0.5373153686523438, -0.5134124755859375, -0.48950958251953125, -0.465606689453125, -0.44170379638671875, -0.4178009033203125, -0.39389801025390625, -0.3699951171875, -0.34609222412109375, -0.3221893310546875, -0.29828643798828125, -0.274383544921875, -0.25048065185546875, -0.2265777587890625, -0.20267486572265625, -0.17877197265625, -0.15486907958984375, -0.1309661865234375, -0.10706329345703125, -0.083160400390625, -0.05925750732421875, -0.0353546142578125, -0.01145172119140625, 0.012451171875, 0.03635406494140625, 0.0602569580078125, 0.08415985107421875, 0.108062744140625, 0.13196563720703125, 0.1558685302734375, 0.17977142333984375, 0.20367431640625, 0.22757720947265625, 0.2514801025390625, 0.27538299560546875, 0.299285888671875, 0.32318878173828125, 0.3470916748046875, 0.37099456787109375, 0.3948974609375, 0.41880035400390625, 0.4427032470703125, 0.46660614013671875, 0.490509033203125, 0.5144119262695312, 0.5383148193359375, 0.5622177124023438, 0.58612060546875, 0.6100234985351562, 0.6339263916015625, 0.6578292846679688, 0.681732177734375, 0.7056350708007812, 0.7295379638671875, 0.7534408569335938, 0.77734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 4.0, 16.0, 10.0, 14.0, 23.0, 24.0, 27.0, 29.0, 34.0, 29.0, 34.0, 50.0, 54.0, 51.0, 62.0, 62.0, 58.0, 63.0, 45.0, 40.0, 48.0, 33.0, 27.0, 28.0, 28.0, 22.0, 11.0, 8.0, 6.0, 16.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0022449493408203125, -0.0021731555461883545, -0.0021013617515563965, -0.0020295679569244385, -0.0019577741622924805, -0.0018859803676605225, -0.0018141865730285645, -0.0017423927783966064, -0.0016705989837646484, -0.0015988051891326904, -0.0015270113945007324, -0.0014552175998687744, -0.0013834238052368164, -0.0013116300106048584, -0.0012398362159729004, -0.0011680424213409424, -0.0010962486267089844, -0.0010244548320770264, -0.0009526610374450684, -0.0008808672428131104, -0.0008090734481811523, -0.0007372796535491943, -0.0006654858589172363, -0.0005936920642852783, -0.0005218982696533203, -0.0004501044750213623, -0.0003783106803894043, -0.0003065168857574463, -0.00023472309112548828, -0.00016292929649353027, -9.113550186157227e-05, -1.9341707229614258e-05, 5.245208740234375e-05, 0.00012424588203430176, 0.00019603967666625977, 0.0002678334712982178, 0.0003396272659301758, 0.0004114210605621338, 0.0004832148551940918, 0.0005550086498260498, 0.0006268024444580078, 0.0006985962390899658, 0.0007703900337219238, 0.0008421838283538818, 0.0009139776229858398, 0.0009857714176177979, 0.0010575652122497559, 0.0011293590068817139, 0.0012011528015136719, 0.0012729465961456299, 0.0013447403907775879, 0.001416534185409546, 0.001488327980041504, 0.001560121774673462, 0.00163191556930542, 0.001703709363937378, 0.001775503158569336, 0.001847296953201294, 0.001919090747833252, 0.00199088454246521, 0.002062678337097168, 0.002134472131729126, 0.002206265926361084, 0.002278059720993042, 0.002349853515625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 14.0, 13.0, 7.0, 20.0, 23.0, 24.0, 22.0, 51.0, 54.0, 87.0, 102.0, 182.0, 443.0, 2359.0, 1002963.0, 40532.0, 899.0, 242.0, 114.0, 93.0, 63.0, 50.0, 41.0, 31.0, 21.0, 20.0, 16.0, 11.0, 9.0, 8.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05712890625, -0.055384159088134766, -0.05363941192626953, -0.0518946647644043, -0.05014991760253906, -0.04840517044067383, -0.046660423278808594, -0.04491567611694336, -0.043170928955078125, -0.04142618179321289, -0.039681434631347656, -0.03793668746948242, -0.03619194030761719, -0.03444719314575195, -0.03270244598388672, -0.030957698822021484, -0.02921295166015625, -0.027468204498291016, -0.02572345733642578, -0.023978710174560547, -0.022233963012695312, -0.020489215850830078, -0.018744468688964844, -0.01699972152709961, -0.015254974365234375, -0.01351022720336914, -0.011765480041503906, -0.010020732879638672, -0.008275985717773438, -0.006531238555908203, -0.004786491394042969, -0.0030417442321777344, -0.0012969970703125, 0.0004477500915527344, 0.0021924972534179688, 0.003937244415283203, 0.0056819915771484375, 0.007426738739013672, 0.009171485900878906, 0.01091623306274414, 0.012660980224609375, 0.01440572738647461, 0.016150474548339844, 0.017895221710205078, 0.019639968872070312, 0.021384716033935547, 0.02312946319580078, 0.024874210357666016, 0.02661895751953125, 0.028363704681396484, 0.03010845184326172, 0.03185319900512695, 0.03359794616699219, 0.03534269332885742, 0.037087440490722656, 0.03883218765258789, 0.040576934814453125, 0.04232168197631836, 0.044066429138183594, 0.04581117630004883, 0.04755592346191406, 0.0493006706237793, 0.05104541778564453, 0.052790164947509766, 0.054534912109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 19.0, 154.0, 387.0, 339.0, 91.0, 18.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008039196953177452, -0.007878146134316921, -0.00771709531545639, -0.0075560444965958595, -0.007394993677735329, -0.0072339423932135105, -0.00707289157435298, -0.006911840755492449, -0.006750789936631918, -0.006589739117771387, -0.006428688298910856, -0.006267637480050325, -0.006106586195528507, -0.005945535376667976, -0.0057844845578074455, -0.005623433738946915, -0.005462382920086384, -0.005301332101225853, -0.005140281282365322, -0.004979230463504791, -0.00481817964464426, -0.004657128360122442, -0.004496077541261911, -0.0043350267224013805, -0.00417397590354085, -0.004012925084680319, -0.003851874265819788, -0.0036908232141286135, -0.0035297723952680826, -0.0033687215764075518, -0.0032076705247163773, -0.0030466197058558464, -0.002885569352656603, -0.002724518533796072, -0.002563467714935541, -0.0024024166632443666, -0.002241365844383836, -0.002080315025523305, -0.0019192640902474523, -0.0017582131549715996, -0.0015971623361110687, -0.0014361115172505379, -0.0012750605819746852, -0.0011140096466988325, -0.0009529588278383017, -0.0007919079507701099, -0.0006308570737019181, -0.00046980613842606544, -0.0003087553195655346, -0.00014770444249734282, 1.3346434570848942e-05, 0.0001743973116390407, 0.0003354481887072325, 0.0004964990657754242, 0.000657549942843616, 0.0008186008781194687, 0.0009796516969799995, 0.0011407025158405304, 0.001301753451116383, 0.0014628043863922358, 0.0016238552052527666, 0.0017849060241132975, 0.0019459569593891501, 0.002107007894665003, 0.0022680587135255337]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 6.0, 10.0, 7.0, 7.0, 6.0, 6.0, 9.0, 24.0, 16.0, 23.0, 21.0, 19.0, 22.0, 24.0, 28.0, 40.0, 42.0, 28.0, 33.0, 26.0, 44.0, 28.0, 39.0, 45.0, 30.0, 48.0, 39.0, 38.0, 46.0, 36.0, 24.0, 21.0, 26.0, 20.0, 27.0, 16.0, 17.0, 7.0, 17.0, 5.0, 6.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0011587142944335938, -0.0011224783957004547, -0.0010862424969673157, -0.0010500065982341766, -0.0010137706995010376, -0.0009775348007678986, -0.0009412989020347595, -0.0009050630033016205, -0.0008688271045684814, -0.0008325912058353424, -0.0007963553071022034, -0.0007601194083690643, -0.0007238835096359253, -0.0006876476109027863, -0.0006514117121696472, -0.0006151758134365082, -0.0005789399147033691, -0.0005427040159702301, -0.0005064681172370911, -0.000470232218503952, -0.000433996319770813, -0.00039776042103767395, -0.0003615245223045349, -0.0003252886235713959, -0.00028905272483825684, -0.0002528168261051178, -0.00021658092737197876, -0.00018034502863883972, -0.00014410912990570068, -0.00010787323117256165, -7.163733243942261e-05, -3.540143370628357e-05, 8.344650268554688e-07, 3.707036375999451e-05, 7.330626249313354e-05, 0.00010954216122627258, 0.00014577805995941162, 0.00018201395869255066, 0.0002182498574256897, 0.00025448575615882874, 0.0002907216548919678, 0.0003269575536251068, 0.00036319345235824585, 0.0003994293510913849, 0.0004356652498245239, 0.00047190114855766296, 0.000508137047290802, 0.000544372946023941, 0.0005806088447570801, 0.0006168447434902191, 0.0006530806422233582, 0.0006893165409564972, 0.0007255524396896362, 0.0007617883384227753, 0.0007980242371559143, 0.0008342601358890533, 0.0008704960346221924, 0.0009067319333553314, 0.0009429678320884705, 0.0009792037308216095, 0.0010154396295547485, 0.0010516755282878876, 0.0010879114270210266, 0.0011241473257541656, 0.0011603832244873047]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 23.0, 17.0, 15.0, 14.0, 24.0, 27.0, 25.0, 42.0, 36.0, 34.0, 40.0, 42.0, 47.0, 39.0, 51.0, 40.0, 48.0, 47.0, 41.0, 46.0, 36.0, 32.0, 33.0, 23.0, 26.0, 22.0, 10.0, 21.0, 15.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.2734375, -7.04705810546875, -6.8206787109375, -6.59429931640625, -6.367919921875, -6.14154052734375, -5.9151611328125, -5.68878173828125, -5.46240234375, -5.23602294921875, -5.0096435546875, -4.78326416015625, -4.556884765625, -4.33050537109375, -4.1041259765625, -3.87774658203125, -3.6513671875, -3.42498779296875, -3.1986083984375, -2.97222900390625, -2.745849609375, -2.51947021484375, -2.2930908203125, -2.06671142578125, -1.84033203125, -1.61395263671875, -1.3875732421875, -1.16119384765625, -0.934814453125, -0.70843505859375, -0.4820556640625, -0.25567626953125, -0.029296875, 0.19708251953125, 0.4234619140625, 0.64984130859375, 0.876220703125, 1.10260009765625, 1.3289794921875, 1.55535888671875, 1.78173828125, 2.00811767578125, 2.2344970703125, 2.46087646484375, 2.687255859375, 2.91363525390625, 3.1400146484375, 3.36639404296875, 3.5927734375, 3.81915283203125, 4.0455322265625, 4.27191162109375, 4.498291015625, 4.72467041015625, 4.9510498046875, 5.17742919921875, 5.40380859375, 5.63018798828125, 5.8565673828125, 6.08294677734375, 6.309326171875, 6.53570556640625, 6.7620849609375, 6.98846435546875, 7.21484375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 11.0, 11.0, 15.0, 18.0, 36.0, 34.0, 42.0, 78.0, 118.0, 203.0, 328.0, 690.0, 1236.0, 2507.0, 5625.0, 14856.0, 56201.0, 326771.0, 522375.0, 84228.0, 19846.0, 6907.0, 3033.0, 1464.0, 775.0, 415.0, 261.0, 154.0, 102.0, 50.0, 35.0, 40.0, 25.0, 17.0, 12.0, 4.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.03515625, -6.816162109375, -6.59716796875, -6.378173828125, -6.1591796875, -5.940185546875, -5.72119140625, -5.502197265625, -5.283203125, -5.064208984375, -4.84521484375, -4.626220703125, -4.4072265625, -4.188232421875, -3.96923828125, -3.750244140625, -3.53125, -3.312255859375, -3.09326171875, -2.874267578125, -2.6552734375, -2.436279296875, -2.21728515625, -1.998291015625, -1.779296875, -1.560302734375, -1.34130859375, -1.122314453125, -0.9033203125, -0.684326171875, -0.46533203125, -0.246337890625, -0.02734375, 0.191650390625, 0.41064453125, 0.629638671875, 0.8486328125, 1.067626953125, 1.28662109375, 1.505615234375, 1.724609375, 1.943603515625, 2.16259765625, 2.381591796875, 2.6005859375, 2.819580078125, 3.03857421875, 3.257568359375, 3.4765625, 3.695556640625, 3.91455078125, 4.133544921875, 4.3525390625, 4.571533203125, 4.79052734375, 5.009521484375, 5.228515625, 5.447509765625, 5.66650390625, 5.885498046875, 6.1044921875, 6.323486328125, 6.54248046875, 6.761474609375, 6.98046875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 6.0, 6.0, 5.0, 7.0, 10.0, 14.0, 9.0, 11.0, 22.0, 28.0, 18.0, 28.0, 30.0, 43.0, 31.0, 35.0, 33.0, 63.0, 56.0, 156.0, 1752.0, 205.0, 62.0, 48.0, 50.0, 36.0, 44.0, 32.0, 30.0, 36.0, 25.0, 21.0, 20.0, 18.0, 15.0, 10.0, 6.0, 7.0, 6.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-24.375, -23.66943359375, -22.9638671875, -22.25830078125, -21.552734375, -20.84716796875, -20.1416015625, -19.43603515625, -18.73046875, -18.02490234375, -17.3193359375, -16.61376953125, -15.908203125, -15.20263671875, -14.4970703125, -13.79150390625, -13.0859375, -12.38037109375, -11.6748046875, -10.96923828125, -10.263671875, -9.55810546875, -8.8525390625, -8.14697265625, -7.44140625, -6.73583984375, -6.0302734375, -5.32470703125, -4.619140625, -3.91357421875, -3.2080078125, -2.50244140625, -1.796875, -1.09130859375, -0.3857421875, 0.31982421875, 1.025390625, 1.73095703125, 2.4365234375, 3.14208984375, 3.84765625, 4.55322265625, 5.2587890625, 5.96435546875, 6.669921875, 7.37548828125, 8.0810546875, 8.78662109375, 9.4921875, 10.19775390625, 10.9033203125, 11.60888671875, 12.314453125, 13.02001953125, 13.7255859375, 14.43115234375, 15.13671875, 15.84228515625, 16.5478515625, 17.25341796875, 17.958984375, 18.66455078125, 19.3701171875, 20.07568359375, 20.78125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 11.0, 7.0, 14.0, 11.0, 15.0, 23.0, 28.0, 48.0, 49.0, 76.0, 109.0, 163.0, 228.0, 365.0, 807.0, 8967.0, 3119899.0, 12804.0, 912.0, 390.0, 230.0, 150.0, 106.0, 75.0, 49.0, 54.0, 21.0, 17.0, 18.0, 16.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.8125, -69.84716796875, -67.8818359375, -65.91650390625, -63.951171875, -61.98583984375, -60.0205078125, -58.05517578125, -56.08984375, -54.12451171875, -52.1591796875, -50.19384765625, -48.228515625, -46.26318359375, -44.2978515625, -42.33251953125, -40.3671875, -38.40185546875, -36.4365234375, -34.47119140625, -32.505859375, -30.54052734375, -28.5751953125, -26.60986328125, -24.64453125, -22.67919921875, -20.7138671875, -18.74853515625, -16.783203125, -14.81787109375, -12.8525390625, -10.88720703125, -8.921875, -6.95654296875, -4.9912109375, -3.02587890625, -1.060546875, 0.90478515625, 2.8701171875, 4.83544921875, 6.80078125, 8.76611328125, 10.7314453125, 12.69677734375, 14.662109375, 16.62744140625, 18.5927734375, 20.55810546875, 22.5234375, 24.48876953125, 26.4541015625, 28.41943359375, 30.384765625, 32.35009765625, 34.3154296875, 36.28076171875, 38.24609375, 40.21142578125, 42.1767578125, 44.14208984375, 46.107421875, 48.07275390625, 50.0380859375, 52.00341796875, 53.96875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 114.0, 410.0, 370.0, 98.0, 12.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.324606895446777, -10.261812210083008, -8.199018478393555, -6.136223793029785, -4.073429107666016, -2.010634422302246, 0.05215930938720703, 2.1149539947509766, 4.177748680114746, 6.240543365478516, 8.303337097167969, 10.366131782531738, 12.428926467895508, 14.491721153259277, 16.554515838623047, 18.6173095703125, 20.680103302001953, 22.742897033691406, 24.805692672729492, 26.868486404418945, 28.93128204345703, 30.994075775146484, 33.05686950683594, 35.11966323852539, 37.18246078491211, 39.24525451660156, 41.308048248291016, 43.37084197998047, 45.43363952636719, 47.49643325805664, 49.559226989746094, 51.62202072143555, 53.68482208251953, 55.747615814208984, 57.81040954589844, 59.873207092285156, 61.93600082397461, 63.99879455566406, 66.06158447265625, 68.12438201904297, 70.18717956542969, 72.2499771118164, 74.3127670288086, 76.37556457519531, 78.4383544921875, 80.50115203857422, 82.56394958496094, 84.62673950195312, 86.68952941894531, 88.75232696533203, 90.81511688232422, 92.87791442871094, 94.94070434570312, 97.00350189208984, 99.06629943847656, 101.12908935546875, 103.19188690185547, 105.25468444824219, 107.31747436523438, 109.3802719116211, 111.44306182861328, 113.505859375, 115.56864929199219, 117.6314468383789, 119.69424438476562]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 11.0, 4.0, 9.0, 8.0, 20.0, 15.0, 16.0, 26.0, 22.0, 24.0, 27.0, 33.0, 35.0, 35.0, 31.0, 32.0, 46.0, 38.0, 44.0, 41.0, 37.0, 44.0, 39.0, 34.0, 38.0, 30.0, 27.0, 35.0, 28.0, 19.0, 23.0, 15.0, 16.0, 18.0, 13.0, 8.0, 9.0, 6.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 3.0], "bins": [-56.34214782714844, -54.72157669067383, -53.10100173950195, -51.480430603027344, -49.85985565185547, -48.23928451538086, -46.61871337890625, -44.998138427734375, -43.3775634765625, -41.75699234008789, -40.136417388916016, -38.515846252441406, -36.89527130126953, -35.27470016479492, -33.65412902832031, -32.03355407714844, -30.412982940673828, -28.792409896850586, -27.171836853027344, -25.551265716552734, -23.93069076538086, -22.31011962890625, -20.689546585083008, -19.068973541259766, -17.448400497436523, -15.827827453613281, -14.207254409790039, -12.586682319641113, -10.966109275817871, -9.345536231994629, -7.724964141845703, -6.104391098022461, -4.483818054199219, -2.8632452487945557, -1.2426724433898926, 0.3779001235961914, 1.9984731674194336, 3.619046211242676, 5.239618301391602, 6.860191345214844, 8.480764389038086, 10.101337432861328, 11.72191047668457, 13.342482566833496, 14.963055610656738, 16.583629608154297, 18.204200744628906, 19.82477378845215, 21.44534683227539, 23.065919876098633, 24.686492919921875, 26.307064056396484, 27.92763900756836, 29.54821014404297, 31.16878318786621, 32.78935623168945, 34.40992736816406, 36.03049850463867, 37.65107345581055, 39.271644592285156, 40.89221954345703, 42.51279067993164, 44.13336181640625, 45.753936767578125, 47.37451171875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 7.0, 12.0, 21.0, 15.0, 18.0, 18.0, 18.0, 24.0, 30.0, 35.0, 38.0, 38.0, 47.0, 45.0, 44.0, 36.0, 45.0, 48.0, 51.0, 46.0, 46.0, 40.0, 41.0, 39.0, 31.0, 24.0, 22.0, 27.0, 14.0, 15.0, 15.0, 9.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.015625, -7.775146484375, -7.53466796875, -7.294189453125, -7.0537109375, -6.813232421875, -6.57275390625, -6.332275390625, -6.091796875, -5.851318359375, -5.61083984375, -5.370361328125, -5.1298828125, -4.889404296875, -4.64892578125, -4.408447265625, -4.16796875, -3.927490234375, -3.68701171875, -3.446533203125, -3.2060546875, -2.965576171875, -2.72509765625, -2.484619140625, -2.244140625, -2.003662109375, -1.76318359375, -1.522705078125, -1.2822265625, -1.041748046875, -0.80126953125, -0.560791015625, -0.3203125, -0.079833984375, 0.16064453125, 0.401123046875, 0.6416015625, 0.882080078125, 1.12255859375, 1.363037109375, 1.603515625, 1.843994140625, 2.08447265625, 2.324951171875, 2.5654296875, 2.805908203125, 3.04638671875, 3.286865234375, 3.52734375, 3.767822265625, 4.00830078125, 4.248779296875, 4.4892578125, 4.729736328125, 4.97021484375, 5.210693359375, 5.451171875, 5.691650390625, 5.93212890625, 6.172607421875, 6.4130859375, 6.653564453125, 6.89404296875, 7.134521484375, 7.375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 9.0, 7.0, 10.0, 18.0, 19.0, 24.0, 37.0, 34.0, 43.0, 51.0, 77.0, 109.0, 150.0, 235.0, 398.0, 974.0, 3040.0, 15620.0, 230531.0, 2642983.0, 1226068.0, 63813.0, 6686.0, 1699.0, 662.0, 294.0, 177.0, 107.0, 82.0, 64.0, 51.0, 49.0, 31.0, 23.0, 30.0, 15.0, 9.0, 10.0, 5.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.158203125, -16.58203125, -16.005859375, -15.4296875, -14.853515625, -14.27734375, -13.701171875, -13.125, -12.548828125, -11.97265625, -11.396484375, -10.8203125, -10.244140625, -9.66796875, -9.091796875, -8.515625, -7.939453125, -7.36328125, -6.787109375, -6.2109375, -5.634765625, -5.05859375, -4.482421875, -3.90625, -3.330078125, -2.75390625, -2.177734375, -1.6015625, -1.025390625, -0.44921875, 0.126953125, 0.703125, 1.279296875, 1.85546875, 2.431640625, 3.0078125, 3.583984375, 4.16015625, 4.736328125, 5.3125, 5.888671875, 6.46484375, 7.041015625, 7.6171875, 8.193359375, 8.76953125, 9.345703125, 9.921875, 10.498046875, 11.07421875, 11.650390625, 12.2265625, 12.802734375, 13.37890625, 13.955078125, 14.53125, 15.107421875, 15.68359375, 16.259765625, 16.8359375, 17.412109375, 17.98828125, 18.564453125, 19.140625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 7.0, 14.0, 19.0, 11.0, 37.0, 36.0, 64.0, 78.0, 98.0, 137.0, 205.0, 274.0, 406.0, 453.0, 504.0, 454.0, 379.0, 254.0, 176.0, 131.0, 94.0, 65.0, 43.0, 41.0, 23.0, 22.0, 14.0, 10.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.09375, -16.648193359375, -16.20263671875, -15.757080078125, -15.3115234375, -14.865966796875, -14.42041015625, -13.974853515625, -13.529296875, -13.083740234375, -12.63818359375, -12.192626953125, -11.7470703125, -11.301513671875, -10.85595703125, -10.410400390625, -9.96484375, -9.519287109375, -9.07373046875, -8.628173828125, -8.1826171875, -7.737060546875, -7.29150390625, -6.845947265625, -6.400390625, -5.954833984375, -5.50927734375, -5.063720703125, -4.6181640625, -4.172607421875, -3.72705078125, -3.281494140625, -2.8359375, -2.390380859375, -1.94482421875, -1.499267578125, -1.0537109375, -0.608154296875, -0.16259765625, 0.282958984375, 0.728515625, 1.174072265625, 1.61962890625, 2.065185546875, 2.5107421875, 2.956298828125, 3.40185546875, 3.847412109375, 4.29296875, 4.738525390625, 5.18408203125, 5.629638671875, 6.0751953125, 6.520751953125, 6.96630859375, 7.411865234375, 7.857421875, 8.302978515625, 8.74853515625, 9.194091796875, 9.6396484375, 10.085205078125, 10.53076171875, 10.976318359375, 11.421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 22.0, 24.0, 31.0, 39.0, 53.0, 59.0, 87.0, 119.0, 131.0, 216.0, 258.0, 397.0, 746.0, 3867.0, 1024166.0, 3154203.0, 7396.0, 873.0, 443.0, 278.0, 191.0, 155.0, 114.0, 84.0, 63.0, 59.0, 44.0, 23.0, 31.0, 31.0, 9.0, 14.0, 5.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40625, -50.54052734375, -48.6748046875, -46.80908203125, -44.943359375, -43.07763671875, -41.2119140625, -39.34619140625, -37.48046875, -35.61474609375, -33.7490234375, -31.88330078125, -30.017578125, -28.15185546875, -26.2861328125, -24.42041015625, -22.5546875, -20.68896484375, -18.8232421875, -16.95751953125, -15.091796875, -13.22607421875, -11.3603515625, -9.49462890625, -7.62890625, -5.76318359375, -3.8974609375, -2.03173828125, -0.166015625, 1.69970703125, 3.5654296875, 5.43115234375, 7.296875, 9.16259765625, 11.0283203125, 12.89404296875, 14.759765625, 16.62548828125, 18.4912109375, 20.35693359375, 22.22265625, 24.08837890625, 25.9541015625, 27.81982421875, 29.685546875, 31.55126953125, 33.4169921875, 35.28271484375, 37.1484375, 39.01416015625, 40.8798828125, 42.74560546875, 44.611328125, 46.47705078125, 48.3427734375, 50.20849609375, 52.07421875, 53.93994140625, 55.8056640625, 57.67138671875, 59.537109375, 61.40283203125, 63.2685546875, 65.13427734375, 67.0]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 10.0, 13.0, 31.0, 48.0, 62.0, 108.0, 123.0, 123.0, 128.0, 115.0, 93.0, 64.0, 39.0, 30.0, 8.0, 3.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-72.71900177001953, -70.8021469116211, -68.88528442382812, -66.96842956542969, -65.05157470703125, -63.13471221923828, -61.217857360839844, -59.30099868774414, -57.38414001464844, -55.467281341552734, -53.55042266845703, -51.633567810058594, -49.71670913696289, -47.79985046386719, -45.88299560546875, -43.96613693237305, -42.049278259277344, -40.13241958618164, -38.21556091308594, -36.2987060546875, -34.3818473815918, -32.464988708496094, -30.548131942749023, -28.631275177001953, -26.71441650390625, -24.797557830810547, -22.880701065063477, -20.963844299316406, -19.046985626220703, -17.130126953125, -15.21327018737793, -13.296412467956543, -11.379558563232422, -9.462700843811035, -7.545843124389648, -5.628985404968262, -3.712127685546875, -1.7952699661254883, 0.12158775329589844, 2.038445472717285, 3.955303192138672, 5.872160911560059, 7.789018630981445, 9.705876350402832, 11.622734069824219, 13.539591789245605, 15.456449508666992, 17.373306274414062, 19.290164947509766, 21.20702362060547, 23.12388038635254, 25.04073715209961, 26.957595825195312, 28.874454498291016, 30.791311264038086, 32.708168029785156, 34.62502670288086, 36.54188537597656, 38.458740234375, 40.3755989074707, 42.292457580566406, 44.20931625366211, 46.12617492675781, 48.04302978515625, 49.95988845825195]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 9.0, 4.0, 20.0, 14.0, 18.0, 15.0, 22.0, 26.0, 17.0, 26.0, 25.0, 28.0, 31.0, 42.0, 21.0, 25.0, 42.0, 39.0, 43.0, 34.0, 44.0, 45.0, 42.0, 32.0, 29.0, 34.0, 34.0, 26.0, 19.0, 26.0, 21.0, 21.0, 9.0, 22.0, 23.0, 16.0, 7.0, 10.0, 9.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0], "bins": [-41.55791473388672, -40.33024978637695, -39.10258102416992, -37.874916076660156, -36.647247314453125, -35.41958236694336, -34.19191360473633, -32.96424865722656, -31.73657989501953, -30.508913040161133, -29.281246185302734, -28.053579330444336, -26.825912475585938, -25.59824562072754, -24.37057876586914, -23.142913818359375, -21.915246963500977, -20.687580108642578, -19.45991325378418, -18.23224639892578, -17.004579544067383, -15.776912689208984, -14.549246788024902, -13.321579933166504, -12.093913078308105, -10.866246223449707, -9.638579368591309, -8.410913467407227, -7.18324613571167, -5.9555792808532715, -4.727912902832031, -3.500246047973633, -2.2725791931152344, -1.0449124574661255, 0.1827542781829834, 1.4104208946228027, 2.638087749481201, 3.8657546043395996, 5.09342098236084, 6.321087837219238, 7.548754692077637, 8.776421546936035, 10.004088401794434, 11.231754302978516, 12.459421157836914, 13.687088012695312, 14.914754867553711, 16.14242172241211, 17.370088577270508, 18.597755432128906, 19.825422286987305, 21.053089141845703, 22.2807559967041, 23.5084228515625, 24.736087799072266, 25.963756561279297, 27.191421508789062, 28.41908836364746, 29.64675521850586, 30.874422073364258, 32.102088928222656, 33.32975387573242, 34.55742263793945, 35.78508758544922, 37.01275634765625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 9.0, 9.0, 9.0, 14.0, 25.0, 22.0, 18.0, 22.0, 27.0, 26.0, 33.0, 30.0, 35.0, 35.0, 40.0, 42.0, 58.0, 55.0, 46.0, 56.0, 44.0, 30.0, 41.0, 34.0, 39.0, 30.0, 30.0, 22.0, 23.0, 21.0, 15.0, 11.0, 9.0, 7.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.74609375, -7.51507568359375, -7.2840576171875, -7.05303955078125, -6.822021484375, -6.59100341796875, -6.3599853515625, -6.12896728515625, -5.89794921875, -5.66693115234375, -5.4359130859375, -5.20489501953125, -4.973876953125, -4.74285888671875, -4.5118408203125, -4.28082275390625, -4.0498046875, -3.81878662109375, -3.5877685546875, -3.35675048828125, -3.125732421875, -2.89471435546875, -2.6636962890625, -2.43267822265625, -2.20166015625, -1.97064208984375, -1.7396240234375, -1.50860595703125, -1.277587890625, -1.04656982421875, -0.8155517578125, -0.58453369140625, -0.353515625, -0.12249755859375, 0.1085205078125, 0.33953857421875, 0.570556640625, 0.80157470703125, 1.0325927734375, 1.26361083984375, 1.49462890625, 1.72564697265625, 1.9566650390625, 2.18768310546875, 2.418701171875, 2.64971923828125, 2.8807373046875, 3.11175537109375, 3.3427734375, 3.57379150390625, 3.8048095703125, 4.03582763671875, 4.266845703125, 4.49786376953125, 4.7288818359375, 4.95989990234375, 5.19091796875, 5.42193603515625, 5.6529541015625, 5.88397216796875, 6.114990234375, 6.34600830078125, 6.5770263671875, 6.80804443359375, 7.0390625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 14.0, 19.0, 22.0, 21.0, 38.0, 57.0, 76.0, 111.0, 194.0, 282.0, 410.0, 568.0, 869.0, 1433.0, 2236.0, 3437.0, 5385.0, 8643.0, 14493.0, 24841.0, 44640.0, 84580.0, 170664.0, 291179.0, 186523.0, 92193.0, 48125.0, 26604.0, 15457.0, 9315.0, 5797.0, 3691.0, 2255.0, 1458.0, 975.0, 658.0, 448.0, 283.0, 166.0, 134.0, 87.0, 52.0, 43.0, 26.0, 19.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.1220703125, -1.0886383056640625, -1.055206298828125, -1.0217742919921875, -0.98834228515625, -0.9549102783203125, -0.921478271484375, -0.8880462646484375, -0.8546142578125, -0.8211822509765625, -0.787750244140625, -0.7543182373046875, -0.72088623046875, -0.6874542236328125, -0.654022216796875, -0.6205902099609375, -0.587158203125, -0.5537261962890625, -0.520294189453125, -0.4868621826171875, -0.45343017578125, -0.4199981689453125, -0.386566162109375, -0.3531341552734375, -0.3197021484375, -0.2862701416015625, -0.252838134765625, -0.2194061279296875, -0.18597412109375, -0.1525421142578125, -0.119110107421875, -0.0856781005859375, -0.05224609375, -0.0188140869140625, 0.014617919921875, 0.0480499267578125, 0.08148193359375, 0.1149139404296875, 0.148345947265625, 0.1817779541015625, 0.2152099609375, 0.2486419677734375, 0.282073974609375, 0.3155059814453125, 0.34893798828125, 0.3823699951171875, 0.415802001953125, 0.4492340087890625, 0.482666015625, 0.5160980224609375, 0.549530029296875, 0.5829620361328125, 0.61639404296875, 0.6498260498046875, 0.683258056640625, 0.7166900634765625, 0.7501220703125, 0.7835540771484375, 0.816986083984375, 0.8504180908203125, 0.88385009765625, 0.9172821044921875, 0.950714111328125, 0.9841461181640625, 1.017578125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 6.0, 1.0, 2.0, 9.0, 8.0, 9.0, 8.0, 16.0, 10.0, 13.0, 21.0, 27.0, 32.0, 29.0, 27.0, 20.0, 32.0, 37.0, 42.0, 44.0, 30.0, 45.0, 1064.0, 44.0, 35.0, 28.0, 47.0, 34.0, 38.0, 28.0, 25.0, 30.0, 22.0, 30.0, 16.0, 21.0, 18.0, 17.0, 12.0, 6.0, 7.0, 12.0, 4.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.03125, -3.90496826171875, -3.7786865234375, -3.65240478515625, -3.526123046875, -3.39984130859375, -3.2735595703125, -3.14727783203125, -3.02099609375, -2.89471435546875, -2.7684326171875, -2.64215087890625, -2.515869140625, -2.38958740234375, -2.2633056640625, -2.13702392578125, -2.0107421875, -1.88446044921875, -1.7581787109375, -1.63189697265625, -1.505615234375, -1.37933349609375, -1.2530517578125, -1.12677001953125, -1.00048828125, -0.87420654296875, -0.7479248046875, -0.62164306640625, -0.495361328125, -0.36907958984375, -0.2427978515625, -0.11651611328125, 0.009765625, 0.13604736328125, 0.2623291015625, 0.38861083984375, 0.514892578125, 0.64117431640625, 0.7674560546875, 0.89373779296875, 1.02001953125, 1.14630126953125, 1.2725830078125, 1.39886474609375, 1.525146484375, 1.65142822265625, 1.7777099609375, 1.90399169921875, 2.0302734375, 2.15655517578125, 2.2828369140625, 2.40911865234375, 2.535400390625, 2.66168212890625, 2.7879638671875, 2.91424560546875, 3.04052734375, 3.16680908203125, 3.2930908203125, 3.41937255859375, 3.545654296875, 3.67193603515625, 3.7982177734375, 3.92449951171875, 4.05078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 10.0, 13.0, 17.0, 25.0, 35.0, 47.0, 86.0, 107.0, 137.0, 187.0, 281.0, 401.0, 506.0, 710.0, 1007.0, 1494.0, 2060.0, 3047.0, 4352.0, 6494.0, 10115.0, 14822.0, 23880.0, 37974.0, 63292.0, 110948.0, 196398.0, 1275546.0, 138147.0, 76685.0, 45870.0, 28236.0, 17791.0, 11792.0, 7757.0, 5219.0, 3483.0, 2401.0, 1717.0, 1187.0, 834.0, 596.0, 407.0, 311.0, 208.0, 156.0, 115.0, 65.0, 54.0, 39.0, 22.0, 20.0, 15.0, 8.0, 6.0, 3.0, 4.0, 1.0], "bins": [-0.79052734375, -0.7667083740234375, -0.742889404296875, -0.7190704345703125, -0.69525146484375, -0.6714324951171875, -0.647613525390625, -0.6237945556640625, -0.5999755859375, -0.5761566162109375, -0.552337646484375, -0.5285186767578125, -0.50469970703125, -0.4808807373046875, -0.457061767578125, -0.4332427978515625, -0.409423828125, -0.3856048583984375, -0.361785888671875, -0.3379669189453125, -0.31414794921875, -0.2903289794921875, -0.266510009765625, -0.2426910400390625, -0.2188720703125, -0.1950531005859375, -0.171234130859375, -0.1474151611328125, -0.12359619140625, -0.0997772216796875, -0.075958251953125, -0.0521392822265625, -0.0283203125, -0.0045013427734375, 0.019317626953125, 0.0431365966796875, 0.06695556640625, 0.0907745361328125, 0.114593505859375, 0.1384124755859375, 0.1622314453125, 0.1860504150390625, 0.209869384765625, 0.2336883544921875, 0.25750732421875, 0.2813262939453125, 0.305145263671875, 0.3289642333984375, 0.352783203125, 0.3766021728515625, 0.400421142578125, 0.4242401123046875, 0.44805908203125, 0.4718780517578125, 0.495697021484375, 0.5195159912109375, 0.5433349609375, 0.5671539306640625, 0.590972900390625, 0.6147918701171875, 0.63861083984375, 0.6624298095703125, 0.686248779296875, 0.7100677490234375, 0.73388671875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 2.0, 5.0, 3.0, 5.0, 5.0, 10.0, 5.0, 13.0, 11.0, 17.0, 19.0, 19.0, 29.0, 27.0, 23.0, 30.0, 26.0, 42.0, 33.0, 52.0, 55.0, 55.0, 47.0, 58.0, 51.0, 38.0, 44.0, 37.0, 27.0, 38.0, 25.0, 19.0, 23.0, 14.0, 15.0, 11.0, 7.0, 5.0, 14.0, 9.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0017375946044921875, -0.0016822516918182373, -0.0016269087791442871, -0.001571565866470337, -0.0015162229537963867, -0.0014608800411224365, -0.0014055371284484863, -0.0013501942157745361, -0.001294851303100586, -0.0012395083904266357, -0.0011841654777526855, -0.0011288225650787354, -0.0010734796524047852, -0.001018136739730835, -0.0009627938270568848, -0.0009074509143829346, -0.0008521080017089844, -0.0007967650890350342, -0.000741422176361084, -0.0006860792636871338, -0.0006307363510131836, -0.0005753934383392334, -0.0005200505256652832, -0.000464707612991333, -0.0004093647003173828, -0.0003540217876434326, -0.0002986788749694824, -0.00024333596229553223, -0.00018799304962158203, -0.00013265013694763184, -7.730722427368164e-05, -2.1964311599731445e-05, 3.337860107421875e-05, 8.872151374816895e-05, 0.00014406442642211914, 0.00019940733909606934, 0.00025475025177001953, 0.0003100931644439697, 0.0003654360771179199, 0.0004207789897918701, 0.0004761219024658203, 0.0005314648151397705, 0.0005868077278137207, 0.0006421506404876709, 0.0006974935531616211, 0.0007528364658355713, 0.0008081793785095215, 0.0008635222911834717, 0.0009188652038574219, 0.0009742081165313721, 0.0010295510292053223, 0.0010848939418792725, 0.0011402368545532227, 0.0011955797672271729, 0.001250922679901123, 0.0013062655925750732, 0.0013616085052490234, 0.0014169514179229736, 0.0014722943305969238, 0.001527637243270874, 0.0015829801559448242, 0.0016383230686187744, 0.0016936659812927246, 0.0017490088939666748, 0.001804351806640625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 10.0, 8.0, 10.0, 20.0, 14.0, 20.0, 21.0, 33.0, 36.0, 56.0, 55.0, 82.0, 101.0, 221.0, 527.0, 2313.0, 999491.0, 43670.0, 911.0, 333.0, 158.0, 88.0, 71.0, 58.0, 46.0, 36.0, 37.0, 22.0, 16.0, 19.0, 12.0, 11.0, 9.0, 2.0, 4.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044525146484375, -0.043076515197753906, -0.04162788391113281, -0.04017925262451172, -0.038730621337890625, -0.03728199005126953, -0.03583335876464844, -0.034384727478027344, -0.03293609619140625, -0.031487464904785156, -0.030038833618164062, -0.02859020233154297, -0.027141571044921875, -0.02569293975830078, -0.024244308471679688, -0.022795677185058594, -0.0213470458984375, -0.019898414611816406, -0.018449783325195312, -0.01700115203857422, -0.015552520751953125, -0.014103889465332031, -0.012655258178710938, -0.011206626892089844, -0.00975799560546875, -0.008309364318847656, -0.0068607330322265625, -0.005412101745605469, -0.003963470458984375, -0.0025148391723632812, -0.0010662078857421875, 0.00038242340087890625, 0.0018310546875, 0.0032796859741210938, 0.0047283172607421875, 0.006176948547363281, 0.007625579833984375, 0.009074211120605469, 0.010522842407226562, 0.011971473693847656, 0.01342010498046875, 0.014868736267089844, 0.016317367553710938, 0.01776599884033203, 0.019214630126953125, 0.02066326141357422, 0.022111892700195312, 0.023560523986816406, 0.0250091552734375, 0.026457786560058594, 0.027906417846679688, 0.02935504913330078, 0.030803680419921875, 0.03225231170654297, 0.03370094299316406, 0.035149574279785156, 0.03659820556640625, 0.038046836853027344, 0.03949546813964844, 0.04094409942626953, 0.042392730712890625, 0.04384136199951172, 0.04528999328613281, 0.046738624572753906, 0.048187255859375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [4.0, 49.0, 532.0, 409.0, 24.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007347395294345915, -0.0004809266538359225, -0.00022711377823725343, 2.6699097361415625e-05, 0.0002805119729600847, 0.0005343248485587537, 0.0007881377241574228, 0.0010419506579637527, 0.0012957635335624218, 0.0015495764091610909, 0.00180338928475976, 0.002057202160358429, 0.002311015035957098, 0.002564827911555767, 0.002818640787154436, 0.003072453662753105, 0.003326266538351774, 0.0035800794139504433, 0.0038338922895491123, 0.004087705165147781, 0.00434151804074645, 0.0045953309163451195, 0.0048491437919437885, 0.005102956667542458, 0.005356769543141127, 0.005610582418739796, 0.005864395294338465, 0.006118208169937134, 0.006372021045535803, 0.006625833921134472, 0.006879646796733141, 0.00713345967233181, 0.007387273013591766, 0.007641085889190435, 0.007894898764789104, 0.008148711174726486, 0.008402524515986443, 0.008656337857246399, 0.00891015026718378, 0.009163962677121162, 0.009417776018381119, 0.009671589359641075, 0.009925401769578457, 0.010179214179515839, 0.010433027520775795, 0.010686840862035751, 0.010940653271973133, 0.011194465681910515, 0.011448279023170471, 0.011702092364430428, 0.01195590477436781, 0.012209717184305191, 0.012463530525565147, 0.012717343866825104, 0.012971156276762486, 0.013224968686699867, 0.013478782027959824, 0.01373259536921978, 0.013986407779157162, 0.014240220189094543, 0.0144940335303545, 0.014747846871614456, 0.015001659281551838, 0.01525547169148922, 0.015509285032749176]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 3.0, 4.0, 6.0, 13.0, 9.0, 13.0, 13.0, 8.0, 16.0, 16.0, 25.0, 21.0, 29.0, 22.0, 35.0, 22.0, 30.0, 37.0, 38.0, 50.0, 55.0, 38.0, 33.0, 44.0, 39.0, 41.0, 44.0, 25.0, 28.0, 35.0, 33.0, 35.0, 26.0, 20.0, 19.0, 15.0, 6.0, 11.0, 9.0, 9.0, 4.0, 8.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011382102966308594, -0.0011033406481146812, -0.0010684709995985031, -0.001033601351082325, -0.0009987317025661469, -0.0009638620540499687, -0.0009289924055337906, -0.0008941227570176125, -0.0008592531085014343, -0.0008243834599852562, -0.0007895138114690781, -0.0007546441629528999, -0.0007197745144367218, -0.0006849048659205437, -0.0006500352174043655, -0.0006151655688881874, -0.0005802959203720093, -0.0005454262718558311, -0.000510556623339653, -0.0004756869748234749, -0.00044081732630729675, -0.0004059476777911186, -0.0003710780292749405, -0.00033620838075876236, -0.00030133873224258423, -0.0002664690837264061, -0.00023159943521022797, -0.00019672978669404984, -0.0001618601381778717, -0.00012699048966169357, -9.212084114551544e-05, -5.725119262933731e-05, -2.238154411315918e-05, 1.2488104403018951e-05, 4.735775291919708e-05, 8.222740143537521e-05, 0.00011709704995155334, 0.00015196669846773148, 0.0001868363469839096, 0.00022170599550008774, 0.00025657564401626587, 0.000291445292532444, 0.00032631494104862213, 0.00036118458956480026, 0.0003960542380809784, 0.0004309238865971565, 0.00046579353511333466, 0.0005006631836295128, 0.0005355328321456909, 0.000570402480661869, 0.0006052721291780472, 0.0006401417776942253, 0.0006750114262104034, 0.0007098810747265816, 0.0007447507232427597, 0.0007796203717589378, 0.000814490020275116, 0.0008493596687912941, 0.0008842293173074722, 0.0009190989658236504, 0.0009539686143398285, 0.0009888382628560066, 0.0010237079113721848, 0.0010585775598883629, 0.001093447208404541]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 9.0, 9.0, 9.0, 14.0, 25.0, 22.0, 18.0, 22.0, 27.0, 26.0, 33.0, 30.0, 35.0, 35.0, 40.0, 42.0, 58.0, 55.0, 46.0, 56.0, 44.0, 30.0, 41.0, 34.0, 39.0, 30.0, 30.0, 22.0, 22.0, 22.0, 15.0, 11.0, 9.0, 7.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.74609375, -7.51507568359375, -7.2840576171875, -7.05303955078125, -6.822021484375, -6.59100341796875, -6.3599853515625, -6.12896728515625, -5.89794921875, -5.66693115234375, -5.4359130859375, -5.20489501953125, -4.973876953125, -4.74285888671875, -4.5118408203125, -4.28082275390625, -4.0498046875, -3.81878662109375, -3.5877685546875, -3.35675048828125, -3.125732421875, -2.89471435546875, -2.6636962890625, -2.43267822265625, -2.20166015625, -1.97064208984375, -1.7396240234375, -1.50860595703125, -1.277587890625, -1.04656982421875, -0.8155517578125, -0.58453369140625, -0.353515625, -0.12249755859375, 0.1085205078125, 0.33953857421875, 0.570556640625, 0.80157470703125, 1.0325927734375, 1.26361083984375, 1.49462890625, 1.72564697265625, 1.9566650390625, 2.18768310546875, 2.418701171875, 2.64971923828125, 2.8807373046875, 3.11175537109375, 3.3427734375, 3.57379150390625, 3.8048095703125, 4.03582763671875, 4.266845703125, 4.49786376953125, 4.7288818359375, 4.95989990234375, 5.19091796875, 5.42193603515625, 5.6529541015625, 5.88397216796875, 6.114990234375, 6.34600830078125, 6.5770263671875, 6.80804443359375, 7.0390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 10.0, 19.0, 26.0, 49.0, 67.0, 92.0, 146.0, 215.0, 320.0, 561.0, 1019.0, 1716.0, 3199.0, 6357.0, 12710.0, 27131.0, 61645.0, 159639.0, 410556.0, 217347.0, 79261.0, 34139.0, 15687.0, 7683.0, 4015.0, 2014.0, 1126.0, 659.0, 388.0, 272.0, 150.0, 102.0, 70.0, 47.0, 43.0, 19.0, 14.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.3515625, -5.201416015625, -5.05126953125, -4.901123046875, -4.7509765625, -4.600830078125, -4.45068359375, -4.300537109375, -4.150390625, -4.000244140625, -3.85009765625, -3.699951171875, -3.5498046875, -3.399658203125, -3.24951171875, -3.099365234375, -2.94921875, -2.799072265625, -2.64892578125, -2.498779296875, -2.3486328125, -2.198486328125, -2.04833984375, -1.898193359375, -1.748046875, -1.597900390625, -1.44775390625, -1.297607421875, -1.1474609375, -0.997314453125, -0.84716796875, -0.697021484375, -0.546875, -0.396728515625, -0.24658203125, -0.096435546875, 0.0537109375, 0.203857421875, 0.35400390625, 0.504150390625, 0.654296875, 0.804443359375, 0.95458984375, 1.104736328125, 1.2548828125, 1.405029296875, 1.55517578125, 1.705322265625, 1.85546875, 2.005615234375, 2.15576171875, 2.305908203125, 2.4560546875, 2.606201171875, 2.75634765625, 2.906494140625, 3.056640625, 3.206787109375, 3.35693359375, 3.507080078125, 3.6572265625, 3.807373046875, 3.95751953125, 4.107666015625, 4.2578125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 10.0, 4.0, 12.0, 12.0, 13.0, 16.0, 12.0, 16.0, 22.0, 26.0, 27.0, 35.0, 28.0, 35.0, 51.0, 43.0, 63.0, 98.0, 262.0, 1576.0, 170.0, 91.0, 56.0, 42.0, 44.0, 39.0, 37.0, 26.0, 27.0, 17.0, 21.0, 20.0, 28.0, 13.0, 12.0, 9.0, 8.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.34375, -24.62646484375, -23.9091796875, -23.19189453125, -22.474609375, -21.75732421875, -21.0400390625, -20.32275390625, -19.60546875, -18.88818359375, -18.1708984375, -17.45361328125, -16.736328125, -16.01904296875, -15.3017578125, -14.58447265625, -13.8671875, -13.14990234375, -12.4326171875, -11.71533203125, -10.998046875, -10.28076171875, -9.5634765625, -8.84619140625, -8.12890625, -7.41162109375, -6.6943359375, -5.97705078125, -5.259765625, -4.54248046875, -3.8251953125, -3.10791015625, -2.390625, -1.67333984375, -0.9560546875, -0.23876953125, 0.478515625, 1.19580078125, 1.9130859375, 2.63037109375, 3.34765625, 4.06494140625, 4.7822265625, 5.49951171875, 6.216796875, 6.93408203125, 7.6513671875, 8.36865234375, 9.0859375, 9.80322265625, 10.5205078125, 11.23779296875, 11.955078125, 12.67236328125, 13.3896484375, 14.10693359375, 14.82421875, 15.54150390625, 16.2587890625, 16.97607421875, 17.693359375, 18.41064453125, 19.1279296875, 19.84521484375, 20.5625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 8.0, 16.0, 7.0, 20.0, 27.0, 46.0, 52.0, 77.0, 94.0, 169.0, 258.0, 429.0, 1117.0, 73115.0, 3066024.0, 2788.0, 554.0, 295.0, 189.0, 138.0, 75.0, 56.0, 43.0, 30.0, 28.0, 18.0, 9.0, 8.0, 6.0, 6.0, 1.0, 0.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.3125, -81.7734375, -79.234375, -76.6953125, -74.15625, -71.6171875, -69.078125, -66.5390625, -64.0, -61.4609375, -58.921875, -56.3828125, -53.84375, -51.3046875, -48.765625, -46.2265625, -43.6875, -41.1484375, -38.609375, -36.0703125, -33.53125, -30.9921875, -28.453125, -25.9140625, -23.375, -20.8359375, -18.296875, -15.7578125, -13.21875, -10.6796875, -8.140625, -5.6015625, -3.0625, -0.5234375, 2.015625, 4.5546875, 7.09375, 9.6328125, 12.171875, 14.7109375, 17.25, 19.7890625, 22.328125, 24.8671875, 27.40625, 29.9453125, 32.484375, 35.0234375, 37.5625, 40.1015625, 42.640625, 45.1796875, 47.71875, 50.2578125, 52.796875, 55.3359375, 57.875, 60.4140625, 62.953125, 65.4921875, 68.03125, 70.5703125, 73.109375, 75.6484375, 78.1875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 94.0, 917.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.50545120239258, -31.873199462890625, -22.240949630737305, -12.608699798583984, -2.9764480590820312, 6.655803680419922, 16.28805160522461, 25.920307159423828, 35.552555084228516, 45.18480682373047, 54.817054748535156, 64.44931030273438, 74.08155822753906, 83.71380615234375, 93.34605407714844, 102.97831726074219, 112.61056518554688, 122.24281311035156, 131.87506103515625, 141.50732421875, 151.1395721435547, 160.77182006835938, 170.40406799316406, 180.03631591796875, 189.66856384277344, 199.30081176757812, 208.9330596923828, 218.5653076171875, 228.19757080078125, 237.82981872558594, 247.46206665039062, 257.0943298339844, 266.7265930175781, 276.3588562011719, 285.9910888671875, 295.62335205078125, 305.2555847167969, 314.8878479003906, 324.52008056640625, 334.15234375, 343.78460693359375, 353.4168701171875, 363.0491027832031, 372.6813659667969, 382.3135986328125, 391.94586181640625, 401.578125, 411.2103576660156, 420.84259033203125, 430.474853515625, 440.1070861816406, 449.7393493652344, 459.37158203125, 469.00384521484375, 478.6361083984375, 488.2683410644531, 497.9006042480469, 507.5328674316406, 517.1651000976562, 526.79736328125, 536.4296264648438, 546.0618896484375, 555.694091796875, 565.3263549804688, 574.9586181640625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 6.0, 5.0, 9.0, 13.0, 14.0, 18.0, 19.0, 23.0, 35.0, 23.0, 40.0, 24.0, 32.0, 34.0, 39.0, 38.0, 49.0, 39.0, 45.0, 45.0, 51.0, 37.0, 35.0, 33.0, 31.0, 39.0, 25.0, 35.0, 33.0, 16.0, 15.0, 12.0, 15.0, 9.0, 12.0, 9.0, 11.0, 10.0, 1.0, 3.0, 9.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-57.825531005859375, -56.14991760253906, -54.474308013916016, -52.7986946105957, -51.12308120727539, -49.447471618652344, -47.77185821533203, -46.09624481201172, -44.420631408691406, -42.745018005371094, -41.06940841674805, -39.393795013427734, -37.71818161010742, -36.042572021484375, -34.36695861816406, -32.69134521484375, -31.015735626220703, -29.340124130249023, -27.66451072692871, -25.98889923095703, -24.31328582763672, -22.63767433166504, -20.96206283569336, -19.286449432373047, -17.610837936401367, -15.935225486755371, -14.259613037109375, -12.584001541137695, -10.9083890914917, -9.232776641845703, -7.557165145874023, -5.881552696228027, -4.205944061279297, -2.53033185005188, -0.8547196388244629, 0.820892333984375, 2.496504783630371, 4.172117233276367, 5.847728729248047, 7.523341178894043, 9.198953628540039, 10.874566078186035, 12.550178527832031, 14.225790023803711, 15.901402473449707, 17.577014923095703, 19.252626419067383, 20.928237915039062, 22.603851318359375, 24.279462814331055, 25.955076217651367, 27.630687713623047, 29.30630111694336, 30.98191261291504, 32.65752410888672, 34.33313751220703, 36.008750915527344, 37.684364318847656, 39.3599739074707, 41.035587310791016, 42.71120071411133, 44.386810302734375, 46.06242370605469, 47.738037109375, 49.41364669799805]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 15.0, 17.0, 19.0, 24.0, 24.0, 25.0, 22.0, 26.0, 31.0, 37.0, 27.0, 36.0, 51.0, 50.0, 52.0, 49.0, 44.0, 47.0, 42.0, 41.0, 25.0, 38.0, 39.0, 36.0, 24.0, 29.0, 20.0, 18.0, 15.0, 15.0, 7.0, 7.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-8.4609375, -8.22119140625, -7.9814453125, -7.74169921875, -7.501953125, -7.26220703125, -7.0224609375, -6.78271484375, -6.54296875, -6.30322265625, -6.0634765625, -5.82373046875, -5.583984375, -5.34423828125, -5.1044921875, -4.86474609375, -4.625, -4.38525390625, -4.1455078125, -3.90576171875, -3.666015625, -3.42626953125, -3.1865234375, -2.94677734375, -2.70703125, -2.46728515625, -2.2275390625, -1.98779296875, -1.748046875, -1.50830078125, -1.2685546875, -1.02880859375, -0.7890625, -0.54931640625, -0.3095703125, -0.06982421875, 0.169921875, 0.40966796875, 0.6494140625, 0.88916015625, 1.12890625, 1.36865234375, 1.6083984375, 1.84814453125, 2.087890625, 2.32763671875, 2.5673828125, 2.80712890625, 3.046875, 3.28662109375, 3.5263671875, 3.76611328125, 4.005859375, 4.24560546875, 4.4853515625, 4.72509765625, 4.96484375, 5.20458984375, 5.4443359375, 5.68408203125, 5.923828125, 6.16357421875, 6.4033203125, 6.64306640625, 6.8828125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 7.0, 9.0, 11.0, 16.0, 16.0, 19.0, 15.0, 23.0, 33.0, 36.0, 55.0, 109.0, 154.0, 378.0, 1043.0, 3665.0, 25887.0, 994601.0, 3017218.0, 139627.0, 8278.0, 1807.0, 604.0, 229.0, 109.0, 64.0, 51.0, 33.0, 34.0, 22.0, 13.0, 13.0, 19.0, 12.0, 11.0, 4.0, 8.0, 5.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.625, -22.892333984375, -22.15966796875, -21.427001953125, -20.6943359375, -19.961669921875, -19.22900390625, -18.496337890625, -17.763671875, -17.031005859375, -16.29833984375, -15.565673828125, -14.8330078125, -14.100341796875, -13.36767578125, -12.635009765625, -11.90234375, -11.169677734375, -10.43701171875, -9.704345703125, -8.9716796875, -8.239013671875, -7.50634765625, -6.773681640625, -6.041015625, -5.308349609375, -4.57568359375, -3.843017578125, -3.1103515625, -2.377685546875, -1.64501953125, -0.912353515625, -0.1796875, 0.552978515625, 1.28564453125, 2.018310546875, 2.7509765625, 3.483642578125, 4.21630859375, 4.948974609375, 5.681640625, 6.414306640625, 7.14697265625, 7.879638671875, 8.6123046875, 9.344970703125, 10.07763671875, 10.810302734375, 11.54296875, 12.275634765625, 13.00830078125, 13.740966796875, 14.4736328125, 15.206298828125, 15.93896484375, 16.671630859375, 17.404296875, 18.136962890625, 18.86962890625, 19.602294921875, 20.3349609375, 21.067626953125, 21.80029296875, 22.532958984375, 23.265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 8.0, 9.0, 7.0, 19.0, 19.0, 26.0, 65.0, 112.0, 183.0, 320.0, 538.0, 733.0, 740.0, 514.0, 308.0, 182.0, 116.0, 84.0, 45.0, 21.0, 14.0, 6.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.71875, -23.041259765625, -22.36376953125, -21.686279296875, -21.0087890625, -20.331298828125, -19.65380859375, -18.976318359375, -18.298828125, -17.621337890625, -16.94384765625, -16.266357421875, -15.5888671875, -14.911376953125, -14.23388671875, -13.556396484375, -12.87890625, -12.201416015625, -11.52392578125, -10.846435546875, -10.1689453125, -9.491455078125, -8.81396484375, -8.136474609375, -7.458984375, -6.781494140625, -6.10400390625, -5.426513671875, -4.7490234375, -4.071533203125, -3.39404296875, -2.716552734375, -2.0390625, -1.361572265625, -0.68408203125, -0.006591796875, 0.6708984375, 1.348388671875, 2.02587890625, 2.703369140625, 3.380859375, 4.058349609375, 4.73583984375, 5.413330078125, 6.0908203125, 6.768310546875, 7.44580078125, 8.123291015625, 8.80078125, 9.478271484375, 10.15576171875, 10.833251953125, 11.5107421875, 12.188232421875, 12.86572265625, 13.543212890625, 14.220703125, 14.898193359375, 15.57568359375, 16.253173828125, 16.9306640625, 17.608154296875, 18.28564453125, 18.963134765625, 19.640625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 13.0, 20.0, 35.0, 44.0, 59.0, 109.0, 134.0, 201.0, 325.0, 558.0, 1591.0, 329494.0, 3856412.0, 3511.0, 724.0, 359.0, 253.0, 153.0, 93.0, 68.0, 45.0, 32.0, 15.0, 13.0, 12.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.5, -84.69140625, -81.8828125, -79.07421875, -76.265625, -73.45703125, -70.6484375, -67.83984375, -65.03125, -62.22265625, -59.4140625, -56.60546875, -53.796875, -50.98828125, -48.1796875, -45.37109375, -42.5625, -39.75390625, -36.9453125, -34.13671875, -31.328125, -28.51953125, -25.7109375, -22.90234375, -20.09375, -17.28515625, -14.4765625, -11.66796875, -8.859375, -6.05078125, -3.2421875, -0.43359375, 2.375, 5.18359375, 7.9921875, 10.80078125, 13.609375, 16.41796875, 19.2265625, 22.03515625, 24.84375, 27.65234375, 30.4609375, 33.26953125, 36.078125, 38.88671875, 41.6953125, 44.50390625, 47.3125, 50.12109375, 52.9296875, 55.73828125, 58.546875, 61.35546875, 64.1640625, 66.97265625, 69.78125, 72.58984375, 75.3984375, 78.20703125, 81.015625, 83.82421875, 86.6328125, 89.44140625, 92.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 73.0, 559.0, 359.0, 19.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.29222106933594, -91.90959167480469, -82.5269546508789, -73.14432525634766, -63.76169204711914, -54.379058837890625, -44.996429443359375, -35.613792419433594, -26.231163024902344, -16.848529815673828, -7.465898513793945, 1.9167327880859375, 11.299365997314453, 20.68199920654297, 30.06462860107422, 39.447265625, 48.82989501953125, 58.212528228759766, 67.59516143798828, 76.97779083251953, 86.36042785644531, 95.74305725097656, 105.12568664550781, 114.5083236694336, 123.89095306396484, 133.27359008789062, 142.65621948242188, 152.03884887695312, 161.42147827148438, 170.80410766601562, 180.18673706054688, 189.5693817138672, 198.95199584960938, 208.33462524414062, 217.71725463867188, 227.09988403320312, 236.48252868652344, 245.8651580810547, 255.24778747558594, 264.63043212890625, 274.0130615234375, 283.39569091796875, 292.7783203125, 302.16094970703125, 311.5435791015625, 320.92620849609375, 330.308837890625, 339.6914978027344, 349.0740966796875, 358.45672607421875, 367.83935546875, 377.22198486328125, 386.6046142578125, 395.98724365234375, 405.369873046875, 414.7525329589844, 424.1351623535156, 433.5177917480469, 442.9004211425781, 452.2830505371094, 461.6656799316406, 471.04833984375, 480.43096923828125, 489.8135986328125, 499.19622802734375]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 6.0, 9.0, 8.0, 11.0, 16.0, 18.0, 16.0, 21.0, 25.0, 22.0, 31.0, 28.0, 40.0, 31.0, 49.0, 28.0, 39.0, 45.0, 45.0, 55.0, 45.0, 44.0, 35.0, 45.0, 31.0, 40.0, 25.0, 27.0, 24.0, 24.0, 21.0, 17.0, 9.0, 10.0, 9.0, 6.0, 10.0, 5.0, 9.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.98966979980469, -41.68730545043945, -40.38494110107422, -39.082576751708984, -37.78021240234375, -36.477848052978516, -35.17548370361328, -33.87312316894531, -32.57075500488281, -31.268390655517578, -29.966026306152344, -28.66366195678711, -27.361297607421875, -26.05893325805664, -24.75657081604004, -23.454206466674805, -22.151844024658203, -20.84947967529297, -19.547115325927734, -18.2447509765625, -16.942386627197266, -15.640023231506348, -14.33765983581543, -13.035295486450195, -11.732931137084961, -10.430566787719727, -9.128202438354492, -7.825839042663574, -6.52347469329834, -5.2211103439331055, -3.9187464714050293, -2.616382598876953, -1.3140182495117188, -0.011654138565063477, 1.2907099723815918, 2.593074083328247, 3.8954381942749023, 5.197802543640137, 6.500166416168213, 7.802530288696289, 9.104894638061523, 10.407258987426758, 11.709623336791992, 13.01198673248291, 14.314351081848145, 15.616715431213379, 16.919078826904297, 18.22144317626953, 19.523807525634766, 20.826171875, 22.128536224365234, 23.43090057373047, 24.733264923095703, 26.035629272460938, 27.33799171447754, 28.640356063842773, 29.942720413208008, 31.245084762573242, 32.547447204589844, 33.84981155395508, 35.15217590332031, 36.45454025268555, 37.75690460205078, 39.059268951416016, 40.36163330078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 5.0, 7.0, 6.0, 11.0, 10.0, 11.0, 18.0, 16.0, 10.0, 25.0, 26.0, 27.0, 24.0, 24.0, 35.0, 34.0, 45.0, 34.0, 47.0, 38.0, 46.0, 40.0, 50.0, 36.0, 44.0, 35.0, 39.0, 32.0, 32.0, 22.0, 26.0, 12.0, 18.0, 29.0, 12.0, 17.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0703125, -7.85040283203125, -7.6304931640625, -7.41058349609375, -7.190673828125, -6.97076416015625, -6.7508544921875, -6.53094482421875, -6.31103515625, -6.09112548828125, -5.8712158203125, -5.65130615234375, -5.431396484375, -5.21148681640625, -4.9915771484375, -4.77166748046875, -4.5517578125, -4.33184814453125, -4.1119384765625, -3.89202880859375, -3.672119140625, -3.45220947265625, -3.2322998046875, -3.01239013671875, -2.79248046875, -2.57257080078125, -2.3526611328125, -2.13275146484375, -1.912841796875, -1.69293212890625, -1.4730224609375, -1.25311279296875, -1.033203125, -0.81329345703125, -0.5933837890625, -0.37347412109375, -0.153564453125, 0.06634521484375, 0.2862548828125, 0.50616455078125, 0.72607421875, 0.94598388671875, 1.1658935546875, 1.38580322265625, 1.605712890625, 1.82562255859375, 2.0455322265625, 2.26544189453125, 2.4853515625, 2.70526123046875, 2.9251708984375, 3.14508056640625, 3.364990234375, 3.58489990234375, 3.8048095703125, 4.02471923828125, 4.24462890625, 4.46453857421875, 4.6844482421875, 4.90435791015625, 5.124267578125, 5.34417724609375, 5.5640869140625, 5.78399658203125, 6.00390625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 12.0, 18.0, 13.0, 32.0, 38.0, 57.0, 83.0, 137.0, 181.0, 311.0, 438.0, 691.0, 1202.0, 1826.0, 2794.0, 4257.0, 6622.0, 10568.0, 16768.0, 27485.0, 46293.0, 81158.0, 153561.0, 271272.0, 187902.0, 96606.0, 53858.0, 31800.0, 19160.0, 12017.0, 7724.0, 4924.0, 3038.0, 2020.0, 1272.0, 810.0, 544.0, 379.0, 237.0, 157.0, 101.0, 68.0, 49.0, 30.0, 8.0, 15.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9814453125, -0.9494171142578125, -0.917388916015625, -0.8853607177734375, -0.85333251953125, -0.8213043212890625, -0.789276123046875, -0.7572479248046875, -0.7252197265625, -0.6931915283203125, -0.661163330078125, -0.6291351318359375, -0.59710693359375, -0.5650787353515625, -0.533050537109375, -0.5010223388671875, -0.468994140625, -0.4369659423828125, -0.404937744140625, -0.3729095458984375, -0.34088134765625, -0.3088531494140625, -0.276824951171875, -0.2447967529296875, -0.2127685546875, -0.1807403564453125, -0.148712158203125, -0.1166839599609375, -0.08465576171875, -0.0526275634765625, -0.020599365234375, 0.0114288330078125, 0.04345703125, 0.0754852294921875, 0.107513427734375, 0.1395416259765625, 0.17156982421875, 0.2035980224609375, 0.235626220703125, 0.2676544189453125, 0.2996826171875, 0.3317108154296875, 0.363739013671875, 0.3957672119140625, 0.42779541015625, 0.4598236083984375, 0.491851806640625, 0.5238800048828125, 0.555908203125, 0.5879364013671875, 0.619964599609375, 0.6519927978515625, 0.68402099609375, 0.7160491943359375, 0.748077392578125, 0.7801055908203125, 0.8121337890625, 0.8441619873046875, 0.876190185546875, 0.9082183837890625, 0.94024658203125, 0.9722747802734375, 1.004302978515625, 1.0363311767578125, 1.068359375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 4.0, 8.0, 11.0, 8.0, 18.0, 12.0, 15.0, 14.0, 27.0, 28.0, 23.0, 22.0, 28.0, 39.0, 39.0, 37.0, 32.0, 28.0, 36.0, 1068.0, 56.0, 30.0, 40.0, 39.0, 38.0, 27.0, 47.0, 39.0, 16.0, 23.0, 23.0, 18.0, 23.0, 12.0, 17.0, 10.0, 10.0, 10.0, 15.0, 5.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.5, -4.365966796875, -4.23193359375, -4.097900390625, -3.9638671875, -3.829833984375, -3.69580078125, -3.561767578125, -3.427734375, -3.293701171875, -3.15966796875, -3.025634765625, -2.8916015625, -2.757568359375, -2.62353515625, -2.489501953125, -2.35546875, -2.221435546875, -2.08740234375, -1.953369140625, -1.8193359375, -1.685302734375, -1.55126953125, -1.417236328125, -1.283203125, -1.149169921875, -1.01513671875, -0.881103515625, -0.7470703125, -0.613037109375, -0.47900390625, -0.344970703125, -0.2109375, -0.076904296875, 0.05712890625, 0.191162109375, 0.3251953125, 0.459228515625, 0.59326171875, 0.727294921875, 0.861328125, 0.995361328125, 1.12939453125, 1.263427734375, 1.3974609375, 1.531494140625, 1.66552734375, 1.799560546875, 1.93359375, 2.067626953125, 2.20166015625, 2.335693359375, 2.4697265625, 2.603759765625, 2.73779296875, 2.871826171875, 3.005859375, 3.139892578125, 3.27392578125, 3.407958984375, 3.5419921875, 3.676025390625, 3.81005859375, 3.944091796875, 4.078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 1.0, 3.0, 6.0, 12.0, 14.0, 22.0, 27.0, 49.0, 53.0, 85.0, 156.0, 221.0, 277.0, 484.0, 704.0, 1002.0, 1466.0, 2045.0, 2958.0, 4496.0, 6990.0, 10623.0, 16256.0, 25742.0, 40777.0, 67166.0, 116804.0, 203490.0, 1264490.0, 130907.0, 74756.0, 44905.0, 27828.0, 17872.0, 11430.0, 7526.0, 5010.0, 3273.0, 2236.0, 1544.0, 1062.0, 737.0, 536.0, 323.0, 272.0, 160.0, 103.0, 80.0, 54.0, 36.0, 21.0, 15.0, 12.0, 9.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.78564453125, -0.7603836059570312, -0.7351226806640625, -0.7098617553710938, -0.684600830078125, -0.6593399047851562, -0.6340789794921875, -0.6088180541992188, -0.58355712890625, -0.5582962036132812, -0.5330352783203125, -0.5077743530273438, -0.482513427734375, -0.45725250244140625, -0.4319915771484375, -0.40673065185546875, -0.3814697265625, -0.35620880126953125, -0.3309478759765625, -0.30568695068359375, -0.280426025390625, -0.25516510009765625, -0.2299041748046875, -0.20464324951171875, -0.17938232421875, -0.15412139892578125, -0.1288604736328125, -0.10359954833984375, -0.078338623046875, -0.05307769775390625, -0.0278167724609375, -0.00255584716796875, 0.022705078125, 0.04796600341796875, 0.0732269287109375, 0.09848785400390625, 0.123748779296875, 0.14900970458984375, 0.1742706298828125, 0.19953155517578125, 0.22479248046875, 0.25005340576171875, 0.2753143310546875, 0.30057525634765625, 0.325836181640625, 0.35109710693359375, 0.3763580322265625, 0.40161895751953125, 0.4268798828125, 0.45214080810546875, 0.4774017333984375, 0.5026626586914062, 0.527923583984375, 0.5531845092773438, 0.5784454345703125, 0.6037063598632812, 0.62896728515625, 0.6542282104492188, 0.6794891357421875, 0.7047500610351562, 0.730010986328125, 0.7552719116210938, 0.7805328369140625, 0.8057937622070312, 0.8310546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 10.0, 13.0, 11.0, 16.0, 17.0, 32.0, 33.0, 34.0, 38.0, 41.0, 35.0, 49.0, 64.0, 54.0, 57.0, 73.0, 47.0, 56.0, 52.0, 31.0, 38.0, 44.0, 29.0, 24.0, 19.0, 12.0, 10.0, 9.0, 10.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0027980804443359375, -0.002721160650253296, -0.0026442408561706543, -0.0025673210620880127, -0.002490401268005371, -0.0024134814739227295, -0.002336561679840088, -0.0022596418857574463, -0.0021827220916748047, -0.002105802297592163, -0.0020288825035095215, -0.0019519627094268799, -0.0018750429153442383, -0.0017981231212615967, -0.001721203327178955, -0.0016442835330963135, -0.0015673637390136719, -0.0014904439449310303, -0.0014135241508483887, -0.001336604356765747, -0.0012596845626831055, -0.0011827647686004639, -0.0011058449745178223, -0.0010289251804351807, -0.0009520053863525391, -0.0008750855922698975, -0.0007981657981872559, -0.0007212460041046143, -0.0006443262100219727, -0.0005674064159393311, -0.0004904866218566895, -0.00041356682777404785, -0.00033664703369140625, -0.00025972723960876465, -0.00018280744552612305, -0.00010588765144348145, -2.8967857360839844e-05, 4.795193672180176e-05, 0.00012487173080444336, 0.00020179152488708496, 0.00027871131896972656, 0.00035563111305236816, 0.00043255090713500977, 0.0005094707012176514, 0.000586390495300293, 0.0006633102893829346, 0.0007402300834655762, 0.0008171498775482178, 0.0008940696716308594, 0.000970989465713501, 0.0010479092597961426, 0.0011248290538787842, 0.0012017488479614258, 0.0012786686420440674, 0.001355588436126709, 0.0014325082302093506, 0.0015094280242919922, 0.0015863478183746338, 0.0016632676124572754, 0.001740187406539917, 0.0018171072006225586, 0.0018940269947052002, 0.001970946788787842, 0.0020478665828704834, 0.002124786376953125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 1.0, 1.0, 8.0, 9.0, 12.0, 15.0, 12.0, 38.0, 37.0, 49.0, 57.0, 71.0, 130.0, 206.0, 563.0, 14552.0, 1029590.0, 2236.0, 363.0, 172.0, 99.0, 84.0, 50.0, 39.0, 29.0, 28.0, 19.0, 10.0, 16.0, 10.0, 13.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.054962158203125, -0.053021907806396484, -0.05108165740966797, -0.04914140701293945, -0.04720115661621094, -0.04526090621948242, -0.043320655822753906, -0.04138040542602539, -0.039440155029296875, -0.03749990463256836, -0.035559654235839844, -0.03361940383911133, -0.03167915344238281, -0.029738903045654297, -0.02779865264892578, -0.025858402252197266, -0.02391815185546875, -0.021977901458740234, -0.02003765106201172, -0.018097400665283203, -0.016157150268554688, -0.014216899871826172, -0.012276649475097656, -0.01033639907836914, -0.008396148681640625, -0.006455898284912109, -0.004515647888183594, -0.002575397491455078, -0.0006351470947265625, 0.0013051033020019531, 0.0032453536987304688, 0.005185604095458984, 0.0071258544921875, 0.009066104888916016, 0.011006355285644531, 0.012946605682373047, 0.014886856079101562, 0.016827106475830078, 0.018767356872558594, 0.02070760726928711, 0.022647857666015625, 0.02458810806274414, 0.026528358459472656, 0.028468608856201172, 0.030408859252929688, 0.0323491096496582, 0.03428936004638672, 0.036229610443115234, 0.03816986083984375, 0.040110111236572266, 0.04205036163330078, 0.0439906120300293, 0.04593086242675781, 0.04787111282348633, 0.049811363220214844, 0.05175161361694336, 0.053691864013671875, 0.05563211441040039, 0.057572364807128906, 0.05951261520385742, 0.06145286560058594, 0.06339311599731445, 0.06533336639404297, 0.06727361679077148, 0.0692138671875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 256.0, 696.0, 59.0, 2.0], "bins": [-0.020843908190727234, -0.020503737032413483, -0.02016356773674488, -0.01982339657843113, -0.019483225420117378, -0.019143056124448776, -0.018802884966135025, -0.018462713807821274, -0.018122544512152672, -0.01778237335383892, -0.01744220405817032, -0.017102032899856567, -0.016761861741542816, -0.016421692445874214, -0.016081521287560463, -0.01574135012924671, -0.01540117897093296, -0.015061008743941784, -0.014720837585628033, -0.014380667358636856, -0.01404049713164568, -0.013700325973331928, -0.013360155746340752, -0.013019984588027, -0.012679815292358398, -0.012339645065367222, -0.01199947390705347, -0.011659303680062294, -0.011319133453071117, -0.010978962294757366, -0.01063879206776619, -0.010298620909452438, -0.009958450682461262, -0.009618280455470085, -0.009278109297156334, -0.008937939070165157, -0.00859776884317398, -0.00825759768486023, -0.007917427457869053, -0.007577256765216589, -0.007237086072564125, -0.006896915379911661, -0.0065567451529204845, -0.006216574460268021, -0.005876403767615557, -0.005536233074963093, -0.005196062847971916, -0.004855892155319452, -0.004515721928328276, -0.004175551235675812, -0.0038353807758539915, -0.0034952103160321712, -0.0031550396233797073, -0.002814869163557887, -0.002474698703736067, -0.002134528011083603, -0.0017943574348464608, -0.0014541868586093187, -0.0011140163987874985, -0.0007738458225503564, -0.0004336752463132143, -9.350467007607222e-05, 0.00024666578974574804, 0.000586836482398212, 0.0009270069422200322]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 12.0, 9.0, 19.0, 19.0, 28.0, 22.0, 24.0, 21.0, 18.0, 35.0, 38.0, 48.0, 40.0, 47.0, 42.0, 39.0, 44.0, 55.0, 49.0, 40.0, 41.0, 50.0, 40.0, 36.0, 36.0, 25.0, 15.0, 18.0, 9.0, 9.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012969970703125, -0.0012514535337686539, -0.0012059099972248077, -0.0011603664606809616, -0.0011148229241371155, -0.0010692793875932693, -0.0010237358510494232, -0.000978192314505577, -0.000932648777961731, -0.0008871052414178848, -0.0008415617048740387, -0.0007960181683301926, -0.0007504746317863464, -0.0007049310952425003, -0.0006593875586986542, -0.000613844022154808, -0.0005683004856109619, -0.0005227569490671158, -0.00047721341252326965, -0.0004316698759794235, -0.0003861263394355774, -0.00034058280289173126, -0.00029503926634788513, -0.000249495729804039, -0.00020395219326019287, -0.00015840865671634674, -0.00011286512017250061, -6.732158362865448e-05, -2.177804708480835e-05, 2.376548945903778e-05, 6.930902600288391e-05, 0.00011485256254673004, 0.00016039609909057617, 0.0002059396356344223, 0.00025148317217826843, 0.00029702670872211456, 0.0003425702452659607, 0.0003881137818098068, 0.00043365731835365295, 0.0004792008548974991, 0.0005247443914413452, 0.0005702879279851913, 0.0006158314645290375, 0.0006613750010728836, 0.0007069185376167297, 0.0007524620741605759, 0.000798005610704422, 0.0008435491472482681, 0.0008890926837921143, 0.0009346362203359604, 0.0009801797568798065, 0.0010257232934236526, 0.0010712668299674988, 0.001116810366511345, 0.001162353903055191, 0.0012078974395990372, 0.0012534409761428833, 0.0012989845126867294, 0.0013445280492305756, 0.0013900715857744217, 0.0014356151223182678, 0.001481158658862114, 0.00152670219540596, 0.0015722457319498062, 0.0016177892684936523]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 4.0, 5.0, 7.0, 6.0, 11.0, 10.0, 11.0, 18.0, 16.0, 10.0, 25.0, 26.0, 27.0, 24.0, 24.0, 35.0, 34.0, 45.0, 34.0, 47.0, 38.0, 46.0, 40.0, 50.0, 36.0, 44.0, 34.0, 40.0, 32.0, 32.0, 22.0, 26.0, 12.0, 18.0, 29.0, 12.0, 17.0, 13.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0703125, -7.85040283203125, -7.6304931640625, -7.41058349609375, -7.190673828125, -6.97076416015625, -6.7508544921875, -6.53094482421875, -6.31103515625, -6.09112548828125, -5.8712158203125, -5.65130615234375, -5.431396484375, -5.21148681640625, -4.9915771484375, -4.77166748046875, -4.5517578125, -4.33184814453125, -4.1119384765625, -3.89202880859375, -3.672119140625, -3.45220947265625, -3.2322998046875, -3.01239013671875, -2.79248046875, -2.57257080078125, -2.3526611328125, -2.13275146484375, -1.912841796875, -1.69293212890625, -1.4730224609375, -1.25311279296875, -1.033203125, -0.81329345703125, -0.5933837890625, -0.37347412109375, -0.153564453125, 0.06634521484375, 0.2862548828125, 0.50616455078125, 0.72607421875, 0.94598388671875, 1.1658935546875, 1.38580322265625, 1.605712890625, 1.82562255859375, 2.0455322265625, 2.26544189453125, 2.4853515625, 2.70526123046875, 2.9251708984375, 3.14508056640625, 3.364990234375, 3.58489990234375, 3.8048095703125, 4.02471923828125, 4.24462890625, 4.46453857421875, 4.6844482421875, 4.90435791015625, 5.124267578125, 5.34417724609375, 5.5640869140625, 5.78399658203125, 6.00390625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 4.0, 8.0, 4.0, 13.0, 13.0, 25.0, 31.0, 37.0, 41.0, 70.0, 80.0, 129.0, 186.0, 289.0, 482.0, 805.0, 1541.0, 3408.0, 7936.0, 19861.0, 55908.0, 190053.0, 516114.0, 168220.0, 50632.0, 18592.0, 7341.0, 3098.0, 1481.0, 781.0, 431.0, 277.0, 177.0, 151.0, 95.0, 64.0, 39.0, 38.0, 22.0, 20.0, 12.0, 13.0, 13.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.44921875, -7.2265625, -7.00390625, -6.78125, -6.55859375, -6.3359375, -6.11328125, -5.890625, -5.66796875, -5.4453125, -5.22265625, -5.0, -4.77734375, -4.5546875, -4.33203125, -4.109375, -3.88671875, -3.6640625, -3.44140625, -3.21875, -2.99609375, -2.7734375, -2.55078125, -2.328125, -2.10546875, -1.8828125, -1.66015625, -1.4375, -1.21484375, -0.9921875, -0.76953125, -0.546875, -0.32421875, -0.1015625, 0.12109375, 0.34375, 0.56640625, 0.7890625, 1.01171875, 1.234375, 1.45703125, 1.6796875, 1.90234375, 2.125, 2.34765625, 2.5703125, 2.79296875, 3.015625, 3.23828125, 3.4609375, 3.68359375, 3.90625, 4.12890625, 4.3515625, 4.57421875, 4.796875, 5.01953125, 5.2421875, 5.46484375, 5.6875, 5.91015625, 6.1328125, 6.35546875, 6.578125, 6.80078125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 4.0, 6.0, 13.0, 9.0, 16.0, 19.0, 15.0, 18.0, 25.0, 22.0, 35.0, 36.0, 39.0, 36.0, 44.0, 43.0, 58.0, 83.0, 367.0, 1601.0, 134.0, 53.0, 52.0, 43.0, 42.0, 22.0, 22.0, 18.0, 35.0, 23.0, 16.0, 19.0, 20.0, 13.0, 7.0, 10.0, 10.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.75, -20.0615234375, -19.373046875, -18.6845703125, -17.99609375, -17.3076171875, -16.619140625, -15.9306640625, -15.2421875, -14.5537109375, -13.865234375, -13.1767578125, -12.48828125, -11.7998046875, -11.111328125, -10.4228515625, -9.734375, -9.0458984375, -8.357421875, -7.6689453125, -6.98046875, -6.2919921875, -5.603515625, -4.9150390625, -4.2265625, -3.5380859375, -2.849609375, -2.1611328125, -1.47265625, -0.7841796875, -0.095703125, 0.5927734375, 1.28125, 1.9697265625, 2.658203125, 3.3466796875, 4.03515625, 4.7236328125, 5.412109375, 6.1005859375, 6.7890625, 7.4775390625, 8.166015625, 8.8544921875, 9.54296875, 10.2314453125, 10.919921875, 11.6083984375, 12.296875, 12.9853515625, 13.673828125, 14.3623046875, 15.05078125, 15.7392578125, 16.427734375, 17.1162109375, 17.8046875, 18.4931640625, 19.181640625, 19.8701171875, 20.55859375, 21.2470703125, 21.935546875, 22.6240234375, 23.3125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 5.0, 11.0, 10.0, 27.0, 19.0, 37.0, 55.0, 66.0, 75.0, 121.0, 167.0, 272.0, 554.0, 3295.0, 3026852.0, 111512.0, 1321.0, 455.0, 260.0, 170.0, 99.0, 75.0, 74.0, 34.0, 38.0, 32.0, 17.0, 10.0, 12.0, 1.0, 4.0, 4.0, 7.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.875, -48.7392578125, -46.603515625, -44.4677734375, -42.33203125, -40.1962890625, -38.060546875, -35.9248046875, -33.7890625, -31.6533203125, -29.517578125, -27.3818359375, -25.24609375, -23.1103515625, -20.974609375, -18.8388671875, -16.703125, -14.5673828125, -12.431640625, -10.2958984375, -8.16015625, -6.0244140625, -3.888671875, -1.7529296875, 0.3828125, 2.5185546875, 4.654296875, 6.7900390625, 8.92578125, 11.0615234375, 13.197265625, 15.3330078125, 17.46875, 19.6044921875, 21.740234375, 23.8759765625, 26.01171875, 28.1474609375, 30.283203125, 32.4189453125, 34.5546875, 36.6904296875, 38.826171875, 40.9619140625, 43.09765625, 45.2333984375, 47.369140625, 49.5048828125, 51.640625, 53.7763671875, 55.912109375, 58.0478515625, 60.18359375, 62.3193359375, 64.455078125, 66.5908203125, 68.7265625, 70.8623046875, 72.998046875, 75.1337890625, 77.26953125, 79.4052734375, 81.541015625, 83.6767578125, 85.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 241.0, 746.0, 29.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.654178619384766, -28.29014778137207, -22.926116943359375, -17.562084197998047, -12.198053359985352, -6.834022521972656, -1.4699897766113281, 3.8940391540527344, 9.258071899414062, 14.622102737426758, 19.986133575439453, 25.35016632080078, 30.714197158813477, 36.07822799682617, 41.4422607421875, 46.80628967285156, 52.17032241821289, 57.53435516357422, 62.89838409423828, 68.26242065429688, 73.62644958496094, 78.990478515625, 84.35450744628906, 89.71853637695312, 95.08257293701172, 100.44660186767578, 105.81063842773438, 111.17466735839844, 116.5386962890625, 121.90272521972656, 127.26676177978516, 132.63079833984375, 137.9948272705078, 143.35885620117188, 148.72288513183594, 154.0869140625, 159.45095825195312, 164.8149871826172, 170.17901611328125, 175.5430450439453, 180.90707397460938, 186.27110290527344, 191.6351318359375, 196.99917602539062, 202.3632049560547, 207.72723388671875, 213.0912628173828, 218.45529174804688, 223.8193359375, 229.18336486816406, 234.54739379882812, 239.91143798828125, 245.2754669189453, 250.63949584960938, 256.0035400390625, 261.3675537109375, 266.7315673828125, 272.0956115722656, 277.4596252441406, 282.82366943359375, 288.18768310546875, 293.5517272949219, 298.915771484375, 304.27978515625, 309.6438293457031]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 6.0, 9.0, 17.0, 19.0, 27.0, 27.0, 32.0, 27.0, 32.0, 42.0, 41.0, 47.0, 45.0, 61.0, 41.0, 50.0, 44.0, 45.0, 40.0, 52.0, 42.0, 38.0, 29.0, 31.0, 23.0, 18.0, 20.0, 12.0, 10.0, 14.0, 7.0, 8.0, 4.0, 8.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.50402069091797, -62.609405517578125, -60.71479034423828, -58.82017517089844, -56.925559997558594, -55.03094482421875, -53.136329650878906, -51.24171829223633, -49.347103118896484, -47.45248794555664, -45.5578727722168, -43.66325759887695, -41.76864242553711, -39.87403106689453, -37.97941589355469, -36.084800720214844, -34.190185546875, -32.295570373535156, -30.400955200195312, -28.50634002685547, -26.611726760864258, -24.717111587524414, -22.82249641418457, -20.92788314819336, -19.03326416015625, -17.138648986816406, -15.244034767150879, -13.349419593811035, -11.454805374145508, -9.560190200805664, -7.66557502746582, -5.770960807800293, -3.8763465881347656, -1.9817317724227905, -0.08711695671081543, 1.8074979782104492, 3.7021126747131348, 5.59672737121582, 7.491342544555664, 9.385956764221191, 11.280571937561035, 13.175187110900879, 15.069801330566406, 16.96441650390625, 18.859031677246094, 20.753646850585938, 22.64826202392578, 24.542875289916992, 26.437490463256836, 28.33210563659668, 30.226720809936523, 32.121334075927734, 34.01594924926758, 35.91056442260742, 37.805179595947266, 39.69979476928711, 41.59440994262695, 43.4890251159668, 45.38364028930664, 47.278255462646484, 49.17287063598633, 51.067481994628906, 52.96209716796875, 54.856712341308594, 56.75132751464844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 7.0, 11.0, 11.0, 5.0, 17.0, 14.0, 16.0, 20.0, 20.0, 31.0, 18.0, 32.0, 34.0, 33.0, 28.0, 39.0, 32.0, 53.0, 43.0, 42.0, 55.0, 26.0, 41.0, 42.0, 38.0, 27.0, 32.0, 34.0, 29.0, 24.0, 17.0, 20.0, 14.0, 13.0, 11.0, 18.0, 10.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-8.1953125, -7.96917724609375, -7.7430419921875, -7.51690673828125, -7.290771484375, -7.06463623046875, -6.8385009765625, -6.61236572265625, -6.38623046875, -6.16009521484375, -5.9339599609375, -5.70782470703125, -5.481689453125, -5.25555419921875, -5.0294189453125, -4.80328369140625, -4.5771484375, -4.35101318359375, -4.1248779296875, -3.89874267578125, -3.672607421875, -3.44647216796875, -3.2203369140625, -2.99420166015625, -2.76806640625, -2.54193115234375, -2.3157958984375, -2.08966064453125, -1.863525390625, -1.63739013671875, -1.4112548828125, -1.18511962890625, -0.958984375, -0.73284912109375, -0.5067138671875, -0.28057861328125, -0.054443359375, 0.17169189453125, 0.3978271484375, 0.62396240234375, 0.85009765625, 1.07623291015625, 1.3023681640625, 1.52850341796875, 1.754638671875, 1.98077392578125, 2.2069091796875, 2.43304443359375, 2.6591796875, 2.88531494140625, 3.1114501953125, 3.33758544921875, 3.563720703125, 3.78985595703125, 4.0159912109375, 4.24212646484375, 4.46826171875, 4.69439697265625, 4.9205322265625, 5.14666748046875, 5.372802734375, 5.59893798828125, 5.8250732421875, 6.05120849609375, 6.27734375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 6.0, 18.0, 16.0, 14.0, 18.0, 26.0, 26.0, 42.0, 52.0, 63.0, 71.0, 118.0, 157.0, 285.0, 676.0, 1691.0, 7979.0, 121125.0, 2798810.0, 1220386.0, 36152.0, 4138.0, 1110.0, 449.0, 235.0, 149.0, 99.0, 63.0, 60.0, 52.0, 29.0, 22.0, 19.0, 15.0, 7.0, 17.0, 7.0, 16.0, 10.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-23.171875, -22.486572265625, -21.80126953125, -21.115966796875, -20.4306640625, -19.745361328125, -19.06005859375, -18.374755859375, -17.689453125, -17.004150390625, -16.31884765625, -15.633544921875, -14.9482421875, -14.262939453125, -13.57763671875, -12.892333984375, -12.20703125, -11.521728515625, -10.83642578125, -10.151123046875, -9.4658203125, -8.780517578125, -8.09521484375, -7.409912109375, -6.724609375, -6.039306640625, -5.35400390625, -4.668701171875, -3.9833984375, -3.298095703125, -2.61279296875, -1.927490234375, -1.2421875, -0.556884765625, 0.12841796875, 0.813720703125, 1.4990234375, 2.184326171875, 2.86962890625, 3.554931640625, 4.240234375, 4.925537109375, 5.61083984375, 6.296142578125, 6.9814453125, 7.666748046875, 8.35205078125, 9.037353515625, 9.72265625, 10.407958984375, 11.09326171875, 11.778564453125, 12.4638671875, 13.149169921875, 13.83447265625, 14.519775390625, 15.205078125, 15.890380859375, 16.57568359375, 17.260986328125, 17.9462890625, 18.631591796875, 19.31689453125, 20.002197265625, 20.6875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 14.0, 15.0, 35.0, 45.0, 55.0, 96.0, 186.0, 305.0, 414.0, 677.0, 773.0, 569.0, 351.0, 188.0, 129.0, 89.0, 41.0, 28.0, 21.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-27.328125, -26.7105712890625, -26.093017578125, -25.4754638671875, -24.85791015625, -24.2403564453125, -23.622802734375, -23.0052490234375, -22.3876953125, -21.7701416015625, -21.152587890625, -20.5350341796875, -19.91748046875, -19.2999267578125, -18.682373046875, -18.0648193359375, -17.447265625, -16.8297119140625, -16.212158203125, -15.5946044921875, -14.97705078125, -14.3594970703125, -13.741943359375, -13.1243896484375, -12.5068359375, -11.8892822265625, -11.271728515625, -10.6541748046875, -10.03662109375, -9.4190673828125, -8.801513671875, -8.1839599609375, -7.56640625, -6.9488525390625, -6.331298828125, -5.7137451171875, -5.09619140625, -4.4786376953125, -3.861083984375, -3.2435302734375, -2.6259765625, -2.0084228515625, -1.390869140625, -0.7733154296875, -0.15576171875, 0.4617919921875, 1.079345703125, 1.6968994140625, 2.314453125, 2.9320068359375, 3.549560546875, 4.1671142578125, 4.78466796875, 5.4022216796875, 6.019775390625, 6.6373291015625, 7.2548828125, 7.8724365234375, 8.489990234375, 9.1075439453125, 9.72509765625, 10.3426513671875, 10.960205078125, 11.5777587890625, 12.1953125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 8.0, 10.0, 8.0, 16.0, 21.0, 30.0, 60.0, 73.0, 98.0, 183.0, 226.0, 338.0, 621.0, 2859.0, 3823455.0, 363385.0, 1387.0, 515.0, 351.0, 207.0, 151.0, 93.0, 80.0, 33.0, 33.0, 19.0, 11.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -61.728515625, -58.76953125, -55.810546875, -52.8515625, -49.892578125, -46.93359375, -43.974609375, -41.015625, -38.056640625, -35.09765625, -32.138671875, -29.1796875, -26.220703125, -23.26171875, -20.302734375, -17.34375, -14.384765625, -11.42578125, -8.466796875, -5.5078125, -2.548828125, 0.41015625, 3.369140625, 6.328125, 9.287109375, 12.24609375, 15.205078125, 18.1640625, 21.123046875, 24.08203125, 27.041015625, 30.0, 32.958984375, 35.91796875, 38.876953125, 41.8359375, 44.794921875, 47.75390625, 50.712890625, 53.671875, 56.630859375, 59.58984375, 62.548828125, 65.5078125, 68.466796875, 71.42578125, 74.384765625, 77.34375, 80.302734375, 83.26171875, 86.220703125, 89.1796875, 92.138671875, 95.09765625, 98.056640625, 101.015625, 103.974609375, 106.93359375, 109.892578125, 112.8515625, 115.810546875, 118.76953125, 121.728515625, 124.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 291.0, 674.0, 40.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.37624740600586, -41.611297607421875, -28.846351623535156, -16.081401824951172, -3.316455841064453, 9.448490142822266, 22.213443756103516, 34.978389739990234, 47.74333572387695, 60.50828552246094, 73.27323150634766, 86.03817749023438, 98.80313110351562, 111.56806945800781, 124.33302307128906, 137.0979766845703, 149.8629150390625, 162.62786865234375, 175.39280700683594, 188.1577606201172, 200.92269897460938, 213.68765258789062, 226.45260620117188, 239.21755981445312, 251.9824981689453, 264.7474365234375, 277.51239013671875, 290.27734375, 303.04229736328125, 315.8072509765625, 328.57220458984375, 341.3371276855469, 354.10211181640625, 366.8670654296875, 379.63201904296875, 392.39697265625, 405.1618957519531, 417.9268493652344, 430.6918029785156, 443.4567565917969, 456.2216796875, 468.98663330078125, 481.7515869140625, 494.51654052734375, 507.2814636230469, 520.04638671875, 532.8114013671875, 545.5762939453125, 558.34130859375, 571.1062622070312, 583.8712158203125, 596.6361694335938, 609.401123046875, 622.166015625, 634.9310302734375, 647.6959228515625, 660.4608764648438, 673.225830078125, 685.9907836914062, 698.7557373046875, 711.5206909179688, 724.28564453125, 737.050537109375, 749.8154907226562, 762.5804443359375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 6.0, 6.0, 3.0, 8.0, 14.0, 15.0, 14.0, 14.0, 22.0, 26.0, 24.0, 26.0, 42.0, 22.0, 37.0, 31.0, 33.0, 46.0, 45.0, 29.0, 29.0, 39.0, 34.0, 38.0, 32.0, 32.0, 36.0, 43.0, 24.0, 35.0, 27.0, 23.0, 23.0, 20.0, 24.0, 12.0, 15.0, 10.0, 13.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 2.0], "bins": [-45.539703369140625, -44.339481353759766, -43.13925552368164, -41.93903350830078, -40.738807678222656, -39.5385856628418, -38.33836364746094, -37.13813781738281, -35.93791580200195, -34.737693786621094, -33.53746795654297, -32.33724594116211, -31.137022018432617, -29.936798095703125, -28.736576080322266, -27.536352157592773, -26.33612823486328, -25.13590431213379, -23.935680389404297, -22.735458374023438, -21.535234451293945, -20.335010528564453, -19.134788513183594, -17.9345645904541, -16.73434066772461, -15.534116744995117, -14.333893775939941, -13.133670806884766, -11.933446884155273, -10.733222961425781, -9.532999992370605, -8.33277702331543, -7.1325531005859375, -5.9323296546936035, -4.7321062088012695, -3.5318827629089355, -2.3316593170166016, -1.1314358711242676, 0.0687875747680664, 1.2690105438232422, 2.4692344665527344, 3.6694579124450684, 4.869681358337402, 6.069904804229736, 7.27012825012207, 8.470352172851562, 9.670575141906738, 10.870798110961914, 12.071022033691406, 13.271245956420898, 14.471468925476074, 15.67169189453125, 16.871915817260742, 18.072139739990234, 19.272361755371094, 20.472585678100586, 21.672809600830078, 22.87303352355957, 24.073257446289062, 25.273479461669922, 26.473703384399414, 27.673927307128906, 28.874149322509766, 30.074373245239258, 31.27459716796875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 13.0, 7.0, 16.0, 14.0, 22.0, 27.0, 29.0, 40.0, 32.0, 46.0, 48.0, 38.0, 41.0, 54.0, 54.0, 59.0, 48.0, 45.0, 40.0, 53.0, 49.0, 36.0, 28.0, 31.0, 22.0, 16.0, 17.0, 14.0, 10.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.5267333984375, -10.240966796875, -9.9552001953125, -9.66943359375, -9.3836669921875, -9.097900390625, -8.8121337890625, -8.5263671875, -8.2406005859375, -7.954833984375, -7.6690673828125, -7.38330078125, -7.0975341796875, -6.811767578125, -6.5260009765625, -6.240234375, -5.9544677734375, -5.668701171875, -5.3829345703125, -5.09716796875, -4.8114013671875, -4.525634765625, -4.2398681640625, -3.9541015625, -3.6683349609375, -3.382568359375, -3.0968017578125, -2.81103515625, -2.5252685546875, -2.239501953125, -1.9537353515625, -1.66796875, -1.3822021484375, -1.096435546875, -0.8106689453125, -0.52490234375, -0.2391357421875, 0.046630859375, 0.3323974609375, 0.6181640625, 0.9039306640625, 1.189697265625, 1.4754638671875, 1.76123046875, 2.0469970703125, 2.332763671875, 2.6185302734375, 2.904296875, 3.1900634765625, 3.475830078125, 3.7615966796875, 4.04736328125, 4.3331298828125, 4.618896484375, 4.9046630859375, 5.1904296875, 5.4761962890625, 5.761962890625, 6.0477294921875, 6.33349609375, 6.6192626953125, 6.905029296875, 7.1907958984375, 7.4765625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 9.0, 13.0, 10.0, 21.0, 37.0, 39.0, 73.0, 101.0, 167.0, 250.0, 371.0, 553.0, 818.0, 1257.0, 1867.0, 2638.0, 3949.0, 5947.0, 8987.0, 13689.0, 21012.0, 33716.0, 56008.0, 99467.0, 190835.0, 254240.0, 147146.0, 78761.0, 45961.0, 27941.0, 17742.0, 11647.0, 7706.0, 5164.0, 3391.0, 2335.0, 1525.0, 1009.0, 738.0, 443.0, 337.0, 208.0, 155.0, 73.0, 78.0, 34.0, 24.0, 21.0, 14.0, 7.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.080078125, -1.0466461181640625, -1.013214111328125, -0.9797821044921875, -0.94635009765625, -0.9129180908203125, -0.879486083984375, -0.8460540771484375, -0.8126220703125, -0.7791900634765625, -0.745758056640625, -0.7123260498046875, -0.67889404296875, -0.6454620361328125, -0.612030029296875, -0.5785980224609375, -0.545166015625, -0.5117340087890625, -0.478302001953125, -0.4448699951171875, -0.41143798828125, -0.3780059814453125, -0.344573974609375, -0.3111419677734375, -0.2777099609375, -0.2442779541015625, -0.210845947265625, -0.1774139404296875, -0.14398193359375, -0.1105499267578125, -0.077117919921875, -0.0436859130859375, -0.01025390625, 0.0231781005859375, 0.056610107421875, 0.0900421142578125, 0.12347412109375, 0.1569061279296875, 0.190338134765625, 0.2237701416015625, 0.2572021484375, 0.2906341552734375, 0.324066162109375, 0.3574981689453125, 0.39093017578125, 0.4243621826171875, 0.457794189453125, 0.4912261962890625, 0.524658203125, 0.5580902099609375, 0.591522216796875, 0.6249542236328125, 0.65838623046875, 0.6918182373046875, 0.725250244140625, 0.7586822509765625, 0.7921142578125, 0.8255462646484375, 0.858978271484375, 0.8924102783203125, 0.92584228515625, 0.9592742919921875, 0.992706298828125, 1.0261383056640625, 1.0595703125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 8.0, 15.0, 14.0, 9.0, 12.0, 13.0, 26.0, 19.0, 23.0, 25.0, 26.0, 23.0, 33.0, 31.0, 30.0, 39.0, 39.0, 37.0, 1068.0, 42.0, 40.0, 48.0, 34.0, 26.0, 38.0, 32.0, 26.0, 31.0, 25.0, 25.0, 21.0, 18.0, 23.0, 14.0, 13.0, 10.0, 8.0, 9.0, 2.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.328125, -4.19268798828125, -4.0572509765625, -3.92181396484375, -3.786376953125, -3.65093994140625, -3.5155029296875, -3.38006591796875, -3.24462890625, -3.10919189453125, -2.9737548828125, -2.83831787109375, -2.702880859375, -2.56744384765625, -2.4320068359375, -2.29656982421875, -2.1611328125, -2.02569580078125, -1.8902587890625, -1.75482177734375, -1.619384765625, -1.48394775390625, -1.3485107421875, -1.21307373046875, -1.07763671875, -0.94219970703125, -0.8067626953125, -0.67132568359375, -0.535888671875, -0.40045166015625, -0.2650146484375, -0.12957763671875, 0.005859375, 0.14129638671875, 0.2767333984375, 0.41217041015625, 0.547607421875, 0.68304443359375, 0.8184814453125, 0.95391845703125, 1.08935546875, 1.22479248046875, 1.3602294921875, 1.49566650390625, 1.631103515625, 1.76654052734375, 1.9019775390625, 2.03741455078125, 2.1728515625, 2.30828857421875, 2.4437255859375, 2.57916259765625, 2.714599609375, 2.85003662109375, 2.9854736328125, 3.12091064453125, 3.25634765625, 3.39178466796875, 3.5272216796875, 3.66265869140625, 3.798095703125, 3.93353271484375, 4.0689697265625, 4.20440673828125, 4.33984375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 12.0, 10.0, 17.0, 18.0, 37.0, 49.0, 78.0, 109.0, 151.0, 237.0, 365.0, 512.0, 688.0, 1064.0, 1602.0, 2451.0, 3669.0, 5782.0, 9076.0, 14354.0, 23362.0, 38742.0, 66905.0, 123502.0, 1116143.0, 400208.0, 120991.0, 65709.0, 37963.0, 23285.0, 14474.0, 8903.0, 5747.0, 3576.0, 2461.0, 1595.0, 1068.0, 723.0, 501.0, 322.0, 246.0, 134.0, 113.0, 68.0, 36.0, 31.0, 18.0, 12.0, 4.0, 6.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.015625, -0.9857406616210938, -0.9558563232421875, -0.9259719848632812, -0.896087646484375, -0.8662033081054688, -0.8363189697265625, -0.8064346313476562, -0.77655029296875, -0.7466659545898438, -0.7167816162109375, -0.6868972778320312, -0.657012939453125, -0.6271286010742188, -0.5972442626953125, -0.5673599243164062, -0.5374755859375, -0.5075912475585938, -0.4777069091796875, -0.44782257080078125, -0.417938232421875, -0.38805389404296875, -0.3581695556640625, -0.32828521728515625, -0.29840087890625, -0.26851654052734375, -0.2386322021484375, -0.20874786376953125, -0.178863525390625, -0.14897918701171875, -0.1190948486328125, -0.08921051025390625, -0.059326171875, -0.02944183349609375, 0.0004425048828125, 0.03032684326171875, 0.060211181640625, 0.09009552001953125, 0.1199798583984375, 0.14986419677734375, 0.17974853515625, 0.20963287353515625, 0.2395172119140625, 0.26940155029296875, 0.299285888671875, 0.32917022705078125, 0.3590545654296875, 0.38893890380859375, 0.4188232421875, 0.44870758056640625, 0.4785919189453125, 0.5084762573242188, 0.538360595703125, 0.5682449340820312, 0.5981292724609375, 0.6280136108398438, 0.65789794921875, 0.6877822875976562, 0.7176666259765625, 0.7475509643554688, 0.777435302734375, 0.8073196411132812, 0.8372039794921875, 0.8670883178710938, 0.89697265625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 7.0, 8.0, 7.0, 17.0, 16.0, 21.0, 28.0, 37.0, 54.0, 58.0, 75.0, 83.0, 74.0, 73.0, 78.0, 78.0, 71.0, 50.0, 31.0, 30.0, 23.0, 23.0, 13.0, 9.0, 7.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00327301025390625, -0.003156006336212158, -0.0030390024185180664, -0.0029219985008239746, -0.002804994583129883, -0.002687990665435791, -0.0025709867477416992, -0.0024539828300476074, -0.0023369789123535156, -0.002219974994659424, -0.002102971076965332, -0.0019859671592712402, -0.0018689632415771484, -0.0017519593238830566, -0.0016349554061889648, -0.001517951488494873, -0.0014009475708007812, -0.0012839436531066895, -0.0011669397354125977, -0.0010499358177185059, -0.0009329319000244141, -0.0008159279823303223, -0.0006989240646362305, -0.0005819201469421387, -0.0004649162292480469, -0.0003479123115539551, -0.00023090839385986328, -0.00011390447616577148, 3.0994415283203125e-06, 0.00012010335922241211, 0.0002371072769165039, 0.0003541111946105957, 0.0004711151123046875, 0.0005881190299987793, 0.0007051229476928711, 0.0008221268653869629, 0.0009391307830810547, 0.0010561347007751465, 0.0011731386184692383, 0.00129014253616333, 0.0014071464538574219, 0.0015241503715515137, 0.0016411542892456055, 0.0017581582069396973, 0.001875162124633789, 0.001992166042327881, 0.0021091699600219727, 0.0022261738777160645, 0.0023431777954101562, 0.002460181713104248, 0.00257718563079834, 0.0026941895484924316, 0.0028111934661865234, 0.0029281973838806152, 0.003045201301574707, 0.003162205219268799, 0.0032792091369628906, 0.0033962130546569824, 0.0035132169723510742, 0.003630220890045166, 0.003747224807739258, 0.0038642287254333496, 0.003981232643127441, 0.004098236560821533, 0.004215240478515625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 6.0, 7.0, 8.0, 10.0, 12.0, 26.0, 22.0, 35.0, 35.0, 51.0, 80.0, 122.0, 195.0, 347.0, 1559.0, 1009222.0, 35349.0, 732.0, 245.0, 140.0, 98.0, 64.0, 43.0, 35.0, 24.0, 14.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08575439453125, -0.0833578109741211, -0.08096122741699219, -0.07856464385986328, -0.07616806030273438, -0.07377147674560547, -0.07137489318847656, -0.06897830963134766, -0.06658172607421875, -0.06418514251708984, -0.06178855895996094, -0.05939197540283203, -0.056995391845703125, -0.05459880828857422, -0.05220222473144531, -0.049805641174316406, -0.0474090576171875, -0.045012474060058594, -0.04261589050292969, -0.04021930694580078, -0.037822723388671875, -0.03542613983154297, -0.03302955627441406, -0.030632972717285156, -0.02823638916015625, -0.025839805603027344, -0.023443222045898438, -0.02104663848876953, -0.018650054931640625, -0.01625347137451172, -0.013856887817382812, -0.011460304260253906, -0.009063720703125, -0.006667137145996094, -0.0042705535888671875, -0.0018739700317382812, 0.000522613525390625, 0.0029191970825195312, 0.0053157806396484375, 0.007712364196777344, 0.01010894775390625, 0.012505531311035156, 0.014902114868164062, 0.01729869842529297, 0.019695281982421875, 0.02209186553955078, 0.024488449096679688, 0.026885032653808594, 0.0292816162109375, 0.031678199768066406, 0.03407478332519531, 0.03647136688232422, 0.038867950439453125, 0.04126453399658203, 0.04366111755371094, 0.046057701110839844, 0.04845428466796875, 0.050850868225097656, 0.05324745178222656, 0.05564403533935547, 0.058040618896484375, 0.06043720245361328, 0.06283378601074219, 0.0652303695678711, 0.067626953125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 7.0, 109.0, 636.0, 257.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014509019674733281, -0.0011387320701032877, -0.0008265621145255864, -0.000514392158947885, -0.00020222226157784462, 0.0001099476357921958, 0.00042211764957755804, 0.0007342874305322766, 0.0010464574443176389, 0.0013586273416876793, 0.0016707973554730415, 0.0019829673692584038, 0.0022951371502131224, 0.002607306931167841, 0.002919476944953203, 0.0032316469587385654, 0.0035438169725239277, 0.00385598698630929, 0.004168157000094652, 0.004480326548218727, 0.004792496562004089, 0.005104666575789452, 0.005416836589574814, 0.005729006603360176, 0.006041176151484251, 0.006353346165269613, 0.0066655161790549755, 0.0069776857271790504, 0.007289855740964413, 0.007602025754749775, 0.007914195768535137, 0.0082263657823205, 0.008538535796105862, 0.008850705809891224, 0.009162875823676586, 0.009475045837461948, 0.00978721585124731, 0.010099384933710098, 0.01041155494749546, 0.010723724961280823, 0.011035894975066185, 0.011348064988851547, 0.01166023500263691, 0.011972405016422272, 0.012284575030207634, 0.012596745043992996, 0.012908915057778358, 0.013221084140241146, 0.013533255085349083, 0.013845425099134445, 0.014157595112919807, 0.01446976512670517, 0.014781935140490532, 0.015094105154275894, 0.015406275168061256, 0.01571844518184662, 0.01603061333298683, 0.016342783346772194, 0.016654953360557556, 0.01696712337434292, 0.01727929338812828, 0.017591463401913643, 0.017903633415699005, 0.018215803429484367, 0.01852797344326973]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 3.0, 8.0, 4.0, 4.0, 6.0, 8.0, 13.0, 15.0, 22.0, 10.0, 22.0, 18.0, 38.0, 23.0, 38.0, 38.0, 40.0, 43.0, 40.0, 40.0, 34.0, 40.0, 45.0, 48.0, 37.0, 35.0, 37.0, 33.0, 34.0, 32.0, 33.0, 16.0, 27.0, 23.0, 21.0, 17.0, 14.0, 14.0, 11.0, 7.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001601576805114746, -0.0015521403402090073, -0.0015027038753032684, -0.0014532674103975296, -0.0014038309454917908, -0.001354394480586052, -0.0013049580156803131, -0.0012555215507745743, -0.0012060850858688354, -0.0011566486209630966, -0.0011072121560573578, -0.001057775691151619, -0.0010083392262458801, -0.0009589027613401413, -0.0009094662964344025, -0.0008600298315286636, -0.0008105933666229248, -0.000761156901717186, -0.0007117204368114471, -0.0006622839719057083, -0.0006128475069999695, -0.0005634110420942307, -0.0005139745771884918, -0.000464538112282753, -0.00041510164737701416, -0.00036566518247127533, -0.0003162287175655365, -0.00026679225265979767, -0.00021735578775405884, -0.00016791932284832, -0.00011848285794258118, -6.904639303684235e-05, -1.9609928131103516e-05, 2.9826536774635315e-05, 7.926300168037415e-05, 0.00012869946658611298, 0.0001781359314918518, 0.00022757239639759064, 0.00027700886130332947, 0.0003264453262090683, 0.00037588179111480713, 0.00042531825602054596, 0.0004747547209262848, 0.0005241911858320236, 0.0005736276507377625, 0.0006230641156435013, 0.0006725005805492401, 0.0007219370454549789, 0.0007713735103607178, 0.0008208099752664566, 0.0008702464401721954, 0.0009196829050779343, 0.0009691193699836731, 0.001018555834889412, 0.0010679922997951508, 0.0011174287647008896, 0.0011668652296066284, 0.0012163016945123672, 0.001265738159418106, 0.001315174624323845, 0.0013646110892295837, 0.0014140475541353226, 0.0014634840190410614, 0.0015129204839468002, 0.001562356948852539]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 4.0, 13.0, 7.0, 16.0, 14.0, 22.0, 27.0, 29.0, 40.0, 32.0, 46.0, 48.0, 38.0, 41.0, 54.0, 54.0, 59.0, 48.0, 44.0, 41.0, 53.0, 49.0, 36.0, 28.0, 31.0, 22.0, 16.0, 17.0, 14.0, 10.0, 9.0, 6.0, 8.0, 5.0, 4.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8125, -10.5267333984375, -10.240966796875, -9.9552001953125, -9.66943359375, -9.3836669921875, -9.097900390625, -8.8121337890625, -8.5263671875, -8.2406005859375, -7.954833984375, -7.6690673828125, -7.38330078125, -7.0975341796875, -6.811767578125, -6.5260009765625, -6.240234375, -5.9544677734375, -5.668701171875, -5.3829345703125, -5.09716796875, -4.8114013671875, -4.525634765625, -4.2398681640625, -3.9541015625, -3.6683349609375, -3.382568359375, -3.0968017578125, -2.81103515625, -2.5252685546875, -2.239501953125, -1.9537353515625, -1.66796875, -1.3822021484375, -1.096435546875, -0.8106689453125, -0.52490234375, -0.2391357421875, 0.046630859375, 0.3323974609375, 0.6181640625, 0.9039306640625, 1.189697265625, 1.4754638671875, 1.76123046875, 2.0469970703125, 2.332763671875, 2.6185302734375, 2.904296875, 3.1900634765625, 3.475830078125, 3.7615966796875, 4.04736328125, 4.3331298828125, 4.618896484375, 4.9046630859375, 5.1904296875, 5.4761962890625, 5.761962890625, 6.0477294921875, 6.33349609375, 6.6192626953125, 6.905029296875, 7.1907958984375, 7.4765625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 16.0, 18.0, 24.0, 31.0, 49.0, 73.0, 97.0, 172.0, 299.0, 505.0, 1006.0, 2305.0, 6779.0, 38595.0, 653938.0, 310631.0, 24822.0, 5251.0, 1894.0, 852.0, 462.0, 256.0, 127.0, 99.0, 62.0, 39.0, 34.0, 26.0, 15.0, 20.0, 9.0, 8.0, 6.0, 4.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.4417724609375, -18.914794921875, -18.3878173828125, -17.86083984375, -17.3338623046875, -16.806884765625, -16.2799072265625, -15.7529296875, -15.2259521484375, -14.698974609375, -14.1719970703125, -13.64501953125, -13.1180419921875, -12.591064453125, -12.0640869140625, -11.537109375, -11.0101318359375, -10.483154296875, -9.9561767578125, -9.42919921875, -8.9022216796875, -8.375244140625, -7.8482666015625, -7.3212890625, -6.7943115234375, -6.267333984375, -5.7403564453125, -5.21337890625, -4.6864013671875, -4.159423828125, -3.6324462890625, -3.10546875, -2.5784912109375, -2.051513671875, -1.5245361328125, -0.99755859375, -0.4705810546875, 0.056396484375, 0.5833740234375, 1.1103515625, 1.6373291015625, 2.164306640625, 2.6912841796875, 3.21826171875, 3.7452392578125, 4.272216796875, 4.7991943359375, 5.326171875, 5.8531494140625, 6.380126953125, 6.9071044921875, 7.43408203125, 7.9610595703125, 8.488037109375, 9.0150146484375, 9.5419921875, 10.0689697265625, 10.595947265625, 11.1229248046875, 11.64990234375, 12.1768798828125, 12.703857421875, 13.2308349609375, 13.7578125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 6.0, 5.0, 11.0, 14.0, 17.0, 21.0, 26.0, 26.0, 38.0, 52.0, 50.0, 45.0, 58.0, 69.0, 163.0, 1827.0, 180.0, 58.0, 62.0, 49.0, 42.0, 47.0, 28.0, 30.0, 29.0, 13.0, 22.0, 10.0, 7.0, 5.0, 12.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.18310546875, -21.2412109375, -20.29931640625, -19.357421875, -18.41552734375, -17.4736328125, -16.53173828125, -15.58984375, -14.64794921875, -13.7060546875, -12.76416015625, -11.822265625, -10.88037109375, -9.9384765625, -8.99658203125, -8.0546875, -7.11279296875, -6.1708984375, -5.22900390625, -4.287109375, -3.34521484375, -2.4033203125, -1.46142578125, -0.51953125, 0.42236328125, 1.3642578125, 2.30615234375, 3.248046875, 4.18994140625, 5.1318359375, 6.07373046875, 7.015625, 7.95751953125, 8.8994140625, 9.84130859375, 10.783203125, 11.72509765625, 12.6669921875, 13.60888671875, 14.55078125, 15.49267578125, 16.4345703125, 17.37646484375, 18.318359375, 19.26025390625, 20.2021484375, 21.14404296875, 22.0859375, 23.02783203125, 23.9697265625, 24.91162109375, 25.853515625, 26.79541015625, 27.7373046875, 28.67919921875, 29.62109375, 30.56298828125, 31.5048828125, 32.44677734375, 33.388671875, 34.33056640625, 35.2724609375, 36.21435546875, 37.15625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 1.0, 10.0, 9.0, 11.0, 3.0, 7.0, 18.0, 20.0, 20.0, 29.0, 31.0, 54.0, 78.0, 102.0, 169.0, 393.0, 1769.0, 88620.0, 3049401.0, 3738.0, 565.0, 200.0, 106.0, 96.0, 59.0, 39.0, 35.0, 21.0, 28.0, 19.0, 12.0, 9.0, 7.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-110.6875, -107.8603515625, -105.033203125, -102.2060546875, -99.37890625, -96.5517578125, -93.724609375, -90.8974609375, -88.0703125, -85.2431640625, -82.416015625, -79.5888671875, -76.76171875, -73.9345703125, -71.107421875, -68.2802734375, -65.453125, -62.6259765625, -59.798828125, -56.9716796875, -54.14453125, -51.3173828125, -48.490234375, -45.6630859375, -42.8359375, -40.0087890625, -37.181640625, -34.3544921875, -31.52734375, -28.7001953125, -25.873046875, -23.0458984375, -20.21875, -17.3916015625, -14.564453125, -11.7373046875, -8.91015625, -6.0830078125, -3.255859375, -0.4287109375, 2.3984375, 5.2255859375, 8.052734375, 10.8798828125, 13.70703125, 16.5341796875, 19.361328125, 22.1884765625, 25.015625, 27.8427734375, 30.669921875, 33.4970703125, 36.32421875, 39.1513671875, 41.978515625, 44.8056640625, 47.6328125, 50.4599609375, 53.287109375, 56.1142578125, 58.94140625, 61.7685546875, 64.595703125, 67.4228515625, 70.25]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 178.0, 813.0, 25.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.71171569824219, -33.06572341918945, -25.41973114013672, -17.773738861083984, -10.12774658203125, -2.4817543029785156, 5.164237976074219, 12.810230255126953, 20.456222534179688, 28.102214813232422, 35.748207092285156, 43.39419937133789, 51.040191650390625, 58.68618392944336, 66.3321762084961, 73.97816467285156, 81.62416076660156, 89.27015686035156, 96.91614532470703, 104.5621337890625, 112.2081298828125, 119.8541259765625, 127.50011444091797, 135.14610290527344, 142.79209899902344, 150.43809509277344, 158.08407592773438, 165.73007202148438, 173.37606811523438, 181.02206420898438, 188.66806030273438, 196.3140411376953, 203.96002197265625, 211.60601806640625, 219.25201416015625, 226.8979949951172, 234.5439910888672, 242.1899871826172, 249.83596801757812, 257.4819641113281, 265.1279602050781, 272.7739562988281, 280.4199523925781, 288.0659484863281, 295.7119140625, 303.35791015625, 311.00390625, 318.64990234375, 326.2958984375, 333.94189453125, 341.587890625, 349.23388671875, 356.8798828125, 364.5258483886719, 372.1718444824219, 379.8178405761719, 387.4638366699219, 395.1098327636719, 402.7558288574219, 410.4018249511719, 418.04779052734375, 425.69378662109375, 433.33978271484375, 440.98577880859375, 448.63177490234375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 7.0, 4.0, 5.0, 6.0, 11.0, 9.0, 9.0, 17.0, 14.0, 22.0, 17.0, 26.0, 20.0, 34.0, 32.0, 36.0, 33.0, 34.0, 42.0, 32.0, 33.0, 43.0, 36.0, 47.0, 38.0, 49.0, 42.0, 32.0, 32.0, 35.0, 26.0, 20.0, 26.0, 27.0, 28.0, 12.0, 12.0, 11.0, 9.0, 9.0, 7.0, 6.0, 4.0, 7.0, 0.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-77.7824478149414, -75.5604019165039, -73.3383560180664, -71.1163101196289, -68.8942642211914, -66.67222595214844, -64.45018005371094, -62.22813034057617, -60.00608825683594, -57.78404235839844, -55.56199645996094, -53.33995056152344, -51.1179084777832, -48.8958625793457, -46.6738166809082, -44.4517707824707, -42.2297248840332, -40.0076789855957, -37.7856330871582, -35.56359100341797, -33.34154510498047, -31.11949920654297, -28.89745330810547, -26.67540740966797, -24.4533634185791, -22.2313175201416, -20.009273529052734, -17.787227630615234, -15.56518268585205, -13.343137741088867, -11.121091842651367, -8.899046897888184, -6.677001953125, -4.454957008361816, -2.2329115867614746, -0.010866165161132812, 2.211178779602051, 4.433223724365234, 6.655269622802734, 8.877314567565918, 11.099359512329102, 13.321404457092285, 15.543449401855469, 17.76549530029297, 19.98754119873047, 22.209585189819336, 24.431631088256836, 26.653675079345703, 28.875720977783203, 31.097766876220703, 33.3198127746582, 35.54185485839844, 37.76390075683594, 39.98594665527344, 42.20799255371094, 44.43003845214844, 46.65208435058594, 48.87413024902344, 51.09617614746094, 53.31822204589844, 55.54026412963867, 57.76231002807617, 59.98435592651367, 62.20640182495117, 64.4284439086914]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 10.0, 5.0, 10.0, 10.0, 14.0, 26.0, 30.0, 25.0, 31.0, 35.0, 29.0, 34.0, 51.0, 35.0, 39.0, 52.0, 50.0, 49.0, 47.0, 44.0, 49.0, 39.0, 46.0, 34.0, 31.0, 24.0, 15.0, 25.0, 17.0, 12.0, 9.0, 11.0, 8.0, 7.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0], "bins": [-10.4765625, -10.19769287109375, -9.9188232421875, -9.63995361328125, -9.361083984375, -9.08221435546875, -8.8033447265625, -8.52447509765625, -8.24560546875, -7.96673583984375, -7.6878662109375, -7.40899658203125, -7.130126953125, -6.85125732421875, -6.5723876953125, -6.29351806640625, -6.0146484375, -5.73577880859375, -5.4569091796875, -5.17803955078125, -4.899169921875, -4.62030029296875, -4.3414306640625, -4.06256103515625, -3.78369140625, -3.50482177734375, -3.2259521484375, -2.94708251953125, -2.668212890625, -2.38934326171875, -2.1104736328125, -1.83160400390625, -1.552734375, -1.27386474609375, -0.9949951171875, -0.71612548828125, -0.437255859375, -0.15838623046875, 0.1204833984375, 0.39935302734375, 0.67822265625, 0.95709228515625, 1.2359619140625, 1.51483154296875, 1.793701171875, 2.07257080078125, 2.3514404296875, 2.63031005859375, 2.9091796875, 3.18804931640625, 3.4669189453125, 3.74578857421875, 4.024658203125, 4.30352783203125, 4.5823974609375, 4.86126708984375, 5.14013671875, 5.41900634765625, 5.6978759765625, 5.97674560546875, 6.255615234375, 6.53448486328125, 6.8133544921875, 7.09222412109375, 7.37109375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 7.0, 13.0, 13.0, 8.0, 19.0, 17.0, 37.0, 38.0, 58.0, 84.0, 137.0, 223.0, 382.0, 760.0, 1401.0, 3346.0, 9849.0, 40141.0, 259545.0, 1313562.0, 1876633.0, 569429.0, 90945.0, 17820.0, 5489.0, 2171.0, 930.0, 486.0, 258.0, 167.0, 89.0, 54.0, 50.0, 32.0, 31.0, 18.0, 19.0, 9.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-15.0078125, -14.6251220703125, -14.242431640625, -13.8597412109375, -13.47705078125, -13.0943603515625, -12.711669921875, -12.3289794921875, -11.9462890625, -11.5635986328125, -11.180908203125, -10.7982177734375, -10.41552734375, -10.0328369140625, -9.650146484375, -9.2674560546875, -8.884765625, -8.5020751953125, -8.119384765625, -7.7366943359375, -7.35400390625, -6.9713134765625, -6.588623046875, -6.2059326171875, -5.8232421875, -5.4405517578125, -5.057861328125, -4.6751708984375, -4.29248046875, -3.9097900390625, -3.527099609375, -3.1444091796875, -2.76171875, -2.3790283203125, -1.996337890625, -1.6136474609375, -1.23095703125, -0.8482666015625, -0.465576171875, -0.0828857421875, 0.2998046875, 0.6824951171875, 1.065185546875, 1.4478759765625, 1.83056640625, 2.2132568359375, 2.595947265625, 2.9786376953125, 3.361328125, 3.7440185546875, 4.126708984375, 4.5093994140625, 4.89208984375, 5.2747802734375, 5.657470703125, 6.0401611328125, 6.4228515625, 6.8055419921875, 7.188232421875, 7.5709228515625, 7.95361328125, 8.3363037109375, 8.718994140625, 9.1016845703125, 9.484375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 8.0, 10.0, 7.0, 11.0, 19.0, 28.0, 34.0, 45.0, 64.0, 94.0, 106.0, 157.0, 200.0, 247.0, 356.0, 386.0, 399.0, 394.0, 348.0, 259.0, 210.0, 156.0, 128.0, 85.0, 81.0, 52.0, 52.0, 26.0, 23.0, 17.0, 13.0, 14.0, 12.0, 8.0, 3.0, 2.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.7734375, -13.3623046875, -12.951171875, -12.5400390625, -12.12890625, -11.7177734375, -11.306640625, -10.8955078125, -10.484375, -10.0732421875, -9.662109375, -9.2509765625, -8.83984375, -8.4287109375, -8.017578125, -7.6064453125, -7.1953125, -6.7841796875, -6.373046875, -5.9619140625, -5.55078125, -5.1396484375, -4.728515625, -4.3173828125, -3.90625, -3.4951171875, -3.083984375, -2.6728515625, -2.26171875, -1.8505859375, -1.439453125, -1.0283203125, -0.6171875, -0.2060546875, 0.205078125, 0.6162109375, 1.02734375, 1.4384765625, 1.849609375, 2.2607421875, 2.671875, 3.0830078125, 3.494140625, 3.9052734375, 4.31640625, 4.7275390625, 5.138671875, 5.5498046875, 5.9609375, 6.3720703125, 6.783203125, 7.1943359375, 7.60546875, 8.0166015625, 8.427734375, 8.8388671875, 9.25, 9.6611328125, 10.072265625, 10.4833984375, 10.89453125, 11.3056640625, 11.716796875, 12.1279296875, 12.5390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 9.0, 11.0, 8.0, 13.0, 18.0, 31.0, 33.0, 40.0, 62.0, 76.0, 97.0, 144.0, 161.0, 237.0, 271.0, 422.0, 780.0, 2752.0, 53353.0, 3910958.0, 217038.0, 5122.0, 975.0, 446.0, 300.0, 230.0, 174.0, 135.0, 111.0, 65.0, 38.0, 46.0, 23.0, 25.0, 16.0, 11.0, 12.0, 10.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.0625, -45.41943359375, -43.7763671875, -42.13330078125, -40.490234375, -38.84716796875, -37.2041015625, -35.56103515625, -33.91796875, -32.27490234375, -30.6318359375, -28.98876953125, -27.345703125, -25.70263671875, -24.0595703125, -22.41650390625, -20.7734375, -19.13037109375, -17.4873046875, -15.84423828125, -14.201171875, -12.55810546875, -10.9150390625, -9.27197265625, -7.62890625, -5.98583984375, -4.3427734375, -2.69970703125, -1.056640625, 0.58642578125, 2.2294921875, 3.87255859375, 5.515625, 7.15869140625, 8.8017578125, 10.44482421875, 12.087890625, 13.73095703125, 15.3740234375, 17.01708984375, 18.66015625, 20.30322265625, 21.9462890625, 23.58935546875, 25.232421875, 26.87548828125, 28.5185546875, 30.16162109375, 31.8046875, 33.44775390625, 35.0908203125, 36.73388671875, 38.376953125, 40.02001953125, 41.6630859375, 43.30615234375, 44.94921875, 46.59228515625, 48.2353515625, 49.87841796875, 51.521484375, 53.16455078125, 54.8076171875, 56.45068359375, 58.09375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 173.0, 743.0, 92.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.823184967041016, -42.15327453613281, -29.483366012573242, -16.813457489013672, -4.143547058105469, 8.526363372802734, 21.196269989013672, 33.86618423461914, 46.53609085083008, 59.20600128173828, 71.87590789794922, 84.54582214355469, 97.21572875976562, 109.88563537597656, 122.5555419921875, 135.2254638671875, 147.89537048339844, 160.56527709960938, 173.2351837158203, 185.90509033203125, 198.57501220703125, 211.2449188232422, 223.91482543945312, 236.58474731445312, 249.254638671875, 261.924560546875, 274.5944519042969, 287.2643737792969, 299.93426513671875, 312.60418701171875, 325.27410888671875, 337.9440002441406, 350.6139221191406, 363.2838439941406, 375.9537353515625, 388.6236572265625, 401.2935485839844, 413.9634704589844, 426.63336181640625, 439.30328369140625, 451.97320556640625, 464.64312744140625, 477.3130187988281, 489.9829406738281, 502.65283203125, 515.32275390625, 527.99267578125, 540.66259765625, 553.3324584960938, 566.0023803710938, 578.6723022460938, 591.3421630859375, 604.0120849609375, 616.6820068359375, 629.3519287109375, 642.0218505859375, 654.6917724609375, 667.3616943359375, 680.0316162109375, 692.7014770507812, 705.3713989257812, 718.0413208007812, 730.7112426757812, 743.3811645507812, 756.051025390625]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 6.0, 7.0, 15.0, 15.0, 11.0, 20.0, 21.0, 31.0, 30.0, 29.0, 32.0, 44.0, 42.0, 39.0, 51.0, 52.0, 47.0, 46.0, 40.0, 43.0, 41.0, 34.0, 45.0, 45.0, 25.0, 30.0, 30.0, 28.0, 24.0, 18.0, 16.0, 10.0, 10.0, 5.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.80809020996094, -57.991485595703125, -56.17488098144531, -54.358272552490234, -52.54166793823242, -50.72506332397461, -48.90845489501953, -47.09185028076172, -45.275245666503906, -43.458641052246094, -41.64203643798828, -39.8254280090332, -38.00882339477539, -36.19221878051758, -34.3756103515625, -32.55900573730469, -30.742401123046875, -28.925796508789062, -27.109189987182617, -25.292583465576172, -23.47597885131836, -21.659374237060547, -19.8427677154541, -18.026161193847656, -16.209556579589844, -14.392951011657715, -12.576345443725586, -10.759739875793457, -8.943134307861328, -7.126528739929199, -5.30992317199707, -3.4933176040649414, -1.6767120361328125, 0.1398935317993164, 1.9564990997314453, 3.773104667663574, 5.589710235595703, 7.406315803527832, 9.222921371459961, 11.03952693939209, 12.856132507324219, 14.672738075256348, 16.489343643188477, 18.305950164794922, 20.122554779052734, 21.939159393310547, 23.755765914916992, 25.572372436523438, 27.38897705078125, 29.205581665039062, 31.022188186645508, 32.83879470825195, 34.655399322509766, 36.47200393676758, 38.288612365722656, 40.10521697998047, 41.92182159423828, 43.738426208496094, 45.555030822753906, 47.371639251708984, 49.1882438659668, 51.00484848022461, 52.82145690917969, 54.6380615234375, 56.45466613769531]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 4.0, 7.0, 8.0, 13.0, 15.0, 13.0, 17.0, 11.0, 13.0, 17.0, 28.0, 24.0, 23.0, 44.0, 38.0, 36.0, 43.0, 41.0, 53.0, 38.0, 41.0, 44.0, 48.0, 34.0, 38.0, 39.0, 32.0, 36.0, 20.0, 28.0, 19.0, 26.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.75, -7.50860595703125, -7.2672119140625, -7.02581787109375, -6.784423828125, -6.54302978515625, -6.3016357421875, -6.06024169921875, -5.81884765625, -5.57745361328125, -5.3360595703125, -5.09466552734375, -4.853271484375, -4.61187744140625, -4.3704833984375, -4.12908935546875, -3.8876953125, -3.64630126953125, -3.4049072265625, -3.16351318359375, -2.922119140625, -2.68072509765625, -2.4393310546875, -2.19793701171875, -1.95654296875, -1.71514892578125, -1.4737548828125, -1.23236083984375, -0.990966796875, -0.74957275390625, -0.5081787109375, -0.26678466796875, -0.025390625, 0.21600341796875, 0.4573974609375, 0.69879150390625, 0.940185546875, 1.18157958984375, 1.4229736328125, 1.66436767578125, 1.90576171875, 2.14715576171875, 2.3885498046875, 2.62994384765625, 2.871337890625, 3.11273193359375, 3.3541259765625, 3.59552001953125, 3.8369140625, 4.07830810546875, 4.3197021484375, 4.56109619140625, 4.802490234375, 5.04388427734375, 5.2852783203125, 5.52667236328125, 5.76806640625, 6.00946044921875, 6.2508544921875, 6.49224853515625, 6.733642578125, 6.97503662109375, 7.2164306640625, 7.45782470703125, 7.69921875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 13.0, 19.0, 21.0, 34.0, 50.0, 66.0, 118.0, 155.0, 233.0, 303.0, 464.0, 660.0, 994.0, 1384.0, 2069.0, 2956.0, 4322.0, 6688.0, 9994.0, 15887.0, 25265.0, 42016.0, 74125.0, 143426.0, 266784.0, 204476.0, 100892.0, 55069.0, 32116.0, 20008.0, 12687.0, 8279.0, 5274.0, 3687.0, 2475.0, 1726.0, 1169.0, 805.0, 588.0, 374.0, 269.0, 181.0, 144.0, 91.0, 70.0, 33.0, 30.0, 25.0, 16.0, 7.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.115234375, -1.080108642578125, -1.04498291015625, -1.009857177734375, -0.9747314453125, -0.939605712890625, -0.90447998046875, -0.869354248046875, -0.834228515625, -0.799102783203125, -0.76397705078125, -0.728851318359375, -0.6937255859375, -0.658599853515625, -0.62347412109375, -0.588348388671875, -0.55322265625, -0.518096923828125, -0.48297119140625, -0.447845458984375, -0.4127197265625, -0.377593994140625, -0.34246826171875, -0.307342529296875, -0.272216796875, -0.237091064453125, -0.20196533203125, -0.166839599609375, -0.1317138671875, -0.096588134765625, -0.06146240234375, -0.026336669921875, 0.0087890625, 0.043914794921875, 0.07904052734375, 0.114166259765625, 0.1492919921875, 0.184417724609375, 0.21954345703125, 0.254669189453125, 0.289794921875, 0.324920654296875, 0.36004638671875, 0.395172119140625, 0.4302978515625, 0.465423583984375, 0.50054931640625, 0.535675048828125, 0.57080078125, 0.605926513671875, 0.64105224609375, 0.676177978515625, 0.7113037109375, 0.746429443359375, 0.78155517578125, 0.816680908203125, 0.851806640625, 0.886932373046875, 0.92205810546875, 0.957183837890625, 0.9923095703125, 1.027435302734375, 1.06256103515625, 1.097686767578125, 1.1328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 3.0, 10.0, 11.0, 16.0, 16.0, 15.0, 19.0, 21.0, 24.0, 18.0, 28.0, 31.0, 26.0, 50.0, 41.0, 35.0, 40.0, 39.0, 36.0, 1064.0, 31.0, 41.0, 48.0, 33.0, 39.0, 37.0, 41.0, 38.0, 27.0, 21.0, 15.0, 15.0, 17.0, 13.0, 11.0, 4.0, 11.0, 8.0, 4.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.97265625, -4.82275390625, -4.6728515625, -4.52294921875, -4.373046875, -4.22314453125, -4.0732421875, -3.92333984375, -3.7734375, -3.62353515625, -3.4736328125, -3.32373046875, -3.173828125, -3.02392578125, -2.8740234375, -2.72412109375, -2.57421875, -2.42431640625, -2.2744140625, -2.12451171875, -1.974609375, -1.82470703125, -1.6748046875, -1.52490234375, -1.375, -1.22509765625, -1.0751953125, -0.92529296875, -0.775390625, -0.62548828125, -0.4755859375, -0.32568359375, -0.17578125, -0.02587890625, 0.1240234375, 0.27392578125, 0.423828125, 0.57373046875, 0.7236328125, 0.87353515625, 1.0234375, 1.17333984375, 1.3232421875, 1.47314453125, 1.623046875, 1.77294921875, 1.9228515625, 2.07275390625, 2.22265625, 2.37255859375, 2.5224609375, 2.67236328125, 2.822265625, 2.97216796875, 3.1220703125, 3.27197265625, 3.421875, 3.57177734375, 3.7216796875, 3.87158203125, 4.021484375, 4.17138671875, 4.3212890625, 4.47119140625, 4.62109375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 15.0, 18.0, 20.0, 36.0, 56.0, 68.0, 117.0, 138.0, 266.0, 379.0, 612.0, 1018.0, 1557.0, 2405.0, 3801.0, 6508.0, 10768.0, 18568.0, 32343.0, 59257.0, 118052.0, 277278.0, 1292873.0, 126337.0, 62376.0, 34104.0, 19453.0, 11096.0, 6625.0, 3967.0, 2539.0, 1615.0, 972.0, 662.0, 403.0, 292.0, 156.0, 98.0, 61.0, 67.0, 40.0, 27.0, 17.0, 16.0, 14.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1728515625, -1.1362457275390625, -1.099639892578125, -1.0630340576171875, -1.02642822265625, -0.9898223876953125, -0.953216552734375, -0.9166107177734375, -0.8800048828125, -0.8433990478515625, -0.806793212890625, -0.7701873779296875, -0.73358154296875, -0.6969757080078125, -0.660369873046875, -0.6237640380859375, -0.587158203125, -0.5505523681640625, -0.513946533203125, -0.4773406982421875, -0.44073486328125, -0.4041290283203125, -0.367523193359375, -0.3309173583984375, -0.2943115234375, -0.2577056884765625, -0.221099853515625, -0.1844940185546875, -0.14788818359375, -0.1112823486328125, -0.074676513671875, -0.0380706787109375, -0.00146484375, 0.0351409912109375, 0.071746826171875, 0.1083526611328125, 0.14495849609375, 0.1815643310546875, 0.218170166015625, 0.2547760009765625, 0.2913818359375, 0.3279876708984375, 0.364593505859375, 0.4011993408203125, 0.43780517578125, 0.4744110107421875, 0.511016845703125, 0.5476226806640625, 0.584228515625, 0.6208343505859375, 0.657440185546875, 0.6940460205078125, 0.73065185546875, 0.7672576904296875, 0.803863525390625, 0.8404693603515625, 0.8770751953125, 0.9136810302734375, 0.950286865234375, 0.9868927001953125, 1.02349853515625, 1.0601043701171875, 1.096710205078125, 1.1333160400390625, 1.169921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 0.0, 1.0, 3.0, 5.0, 7.0, 10.0, 11.0, 10.0, 20.0, 20.0, 32.0, 43.0, 39.0, 45.0, 59.0, 55.0, 53.0, 69.0, 59.0, 65.0, 87.0, 56.0, 47.0, 40.0, 27.0, 30.0, 21.0, 15.0, 16.0, 13.0, 4.0, 6.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.003643035888671875, -0.0035384297370910645, -0.003433823585510254, -0.0033292174339294434, -0.003224611282348633, -0.0031200051307678223, -0.0030153989791870117, -0.002910792827606201, -0.0028061866760253906, -0.00270158052444458, -0.0025969743728637695, -0.002492368221282959, -0.0023877620697021484, -0.002283155918121338, -0.0021785497665405273, -0.002073943614959717, -0.0019693374633789062, -0.0018647313117980957, -0.0017601251602172852, -0.0016555190086364746, -0.001550912857055664, -0.0014463067054748535, -0.001341700553894043, -0.0012370944023132324, -0.0011324882507324219, -0.0010278820991516113, -0.0009232759475708008, -0.0008186697959899902, -0.0007140636444091797, -0.0006094574928283691, -0.0005048513412475586, -0.00040024518966674805, -0.0002956390380859375, -0.00019103288650512695, -8.64267349243164e-05, 1.817941665649414e-05, 0.0001227855682373047, 0.00022739171981811523, 0.0003319978713989258, 0.00043660402297973633, 0.0005412101745605469, 0.0006458163261413574, 0.000750422477722168, 0.0008550286293029785, 0.0009596347808837891, 0.0010642409324645996, 0.0011688470840454102, 0.0012734532356262207, 0.0013780593872070312, 0.0014826655387878418, 0.0015872716903686523, 0.0016918778419494629, 0.0017964839935302734, 0.001901090145111084, 0.0020056962966918945, 0.002110302448272705, 0.0022149085998535156, 0.002319514751434326, 0.0024241209030151367, 0.0025287270545959473, 0.002633333206176758, 0.0027379393577575684, 0.002842545509338379, 0.0029471516609191895, 0.0030517578125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 8.0, 11.0, 8.0, 21.0, 23.0, 37.0, 40.0, 62.0, 103.0, 143.0, 275.0, 794.0, 253642.0, 791733.0, 828.0, 308.0, 159.0, 84.0, 64.0, 59.0, 25.0, 35.0, 14.0, 18.0, 9.0, 8.0, 6.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0791015625, -0.07637882232666016, -0.07365608215332031, -0.07093334197998047, -0.06821060180664062, -0.06548786163330078, -0.06276512145996094, -0.060042381286621094, -0.05731964111328125, -0.054596900939941406, -0.05187416076660156, -0.04915142059326172, -0.046428680419921875, -0.04370594024658203, -0.04098320007324219, -0.038260459899902344, -0.0355377197265625, -0.032814979553222656, -0.030092239379882812, -0.02736949920654297, -0.024646759033203125, -0.02192401885986328, -0.019201278686523438, -0.016478538513183594, -0.01375579833984375, -0.011033058166503906, -0.008310317993164062, -0.005587577819824219, -0.002864837646484375, -0.00014209747314453125, 0.0025806427001953125, 0.005303382873535156, 0.008026123046875, 0.010748863220214844, 0.013471603393554688, 0.01619434356689453, 0.018917083740234375, 0.02163982391357422, 0.024362564086914062, 0.027085304260253906, 0.02980804443359375, 0.032530784606933594, 0.03525352478027344, 0.03797626495361328, 0.040699005126953125, 0.04342174530029297, 0.04614448547363281, 0.048867225646972656, 0.0515899658203125, 0.054312705993652344, 0.05703544616699219, 0.05975818634033203, 0.062480926513671875, 0.06520366668701172, 0.06792640686035156, 0.0706491470336914, 0.07337188720703125, 0.0760946273803711, 0.07881736755371094, 0.08154010772705078, 0.08426284790039062, 0.08698558807373047, 0.08970832824707031, 0.09243106842041016, 0.09515380859375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 27.0, 173.0, 510.0, 251.0, 42.0, 9.0, 0.0, 1.0], "bins": [-0.011518800631165504, -0.011322228237986565, -0.0111256567761302, -0.010929085314273834, -0.010732512921094894, -0.010535940527915955, -0.01033936906605959, -0.010142797604203224, -0.009946225211024284, -0.009749652817845345, -0.00955308135598898, -0.009356509894132614, -0.009159937500953674, -0.008963365107774734, -0.00876679364591837, -0.008570222184062004, -0.008373649790883064, -0.008177077397704124, -0.00798050593584776, -0.007783934008330107, -0.007587362080812454, -0.007390790153294802, -0.007194218225777149, -0.006997646298259497, -0.006801074370741844, -0.006604502443224192, -0.006407930515706539, -0.006211358588188887, -0.006014786660671234, -0.005818214733153582, -0.005621642805635929, -0.005425070878118277, -0.005228498950600624, -0.005031927023082972, -0.004835355095565319, -0.0046387831680476665, -0.004442211240530014, -0.0042456393130123615, -0.004049067385494709, -0.0038524954579770565, -0.0036559232976287603, -0.003459351370111108, -0.0032627794425934553, -0.003066207515075803, -0.0028696355875581503, -0.0026730636600404978, -0.0024764917325228453, -0.0022799198050051928, -0.0020833478774875402, -0.0018867759499698877, -0.0016902040224522352, -0.0014936320949345827, -0.0012970601674169302, -0.0011004882398992777, -0.0009039163123816252, -0.0007073443848639727, -0.0005107724573463202, -0.00031420052982866764, -0.00011762860231101513, 7.894332520663738e-05, 0.0002755152527242899, 0.0004720871802419424, 0.0006686591077595949, 0.0008652310352772474, 0.0010618029627949]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 6.0, 12.0, 15.0, 16.0, 16.0, 17.0, 18.0, 15.0, 19.0, 26.0, 27.0, 39.0, 47.0, 24.0, 37.0, 38.0, 44.0, 35.0, 45.0, 54.0, 47.0, 38.0, 38.0, 41.0, 29.0, 40.0, 25.0, 28.0, 22.0, 19.0, 18.0, 12.0, 12.0, 12.0, 8.0, 11.0, 4.0, 10.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0017020702362060547, -0.001650598831474781, -0.0015991274267435074, -0.0015476560220122337, -0.00149618461728096, -0.0014447132125496864, -0.0013932418078184128, -0.0013417704030871391, -0.0012902989983558655, -0.0012388275936245918, -0.0011873561888933182, -0.0011358847841620445, -0.0010844133794307709, -0.0010329419746994972, -0.0009814705699682236, -0.0009299991652369499, -0.0008785277605056763, -0.0008270563557744026, -0.000775584951043129, -0.0007241135463118553, -0.0006726421415805817, -0.000621170736849308, -0.0005696993321180344, -0.0005182279273867607, -0.00046675652265548706, -0.0004152851179242134, -0.00036381371319293976, -0.0003123423084616661, -0.00026087090373039246, -0.0002093994989991188, -0.00015792809426784515, -0.0001064566895365715, -5.498528480529785e-05, -3.5138800740242004e-06, 4.795752465724945e-05, 9.94289293885231e-05, 0.00015090033411979675, 0.0002023717388510704, 0.00025384314358234406, 0.0003053145483136177, 0.00035678595304489136, 0.000408257357776165, 0.00045972876250743866, 0.0005112001672387123, 0.000562671571969986, 0.0006141429767012596, 0.0006656143814325333, 0.0007170857861638069, 0.0007685571908950806, 0.0008200285956263542, 0.0008715000003576279, 0.0009229714050889015, 0.0009744428098201752, 0.0010259142145514488, 0.0010773856192827225, 0.0011288570240139961, 0.0011803284287452698, 0.0012317998334765434, 0.001283271238207817, 0.0013347426429390907, 0.0013862140476703644, 0.001437685452401638, 0.0014891568571329117, 0.0015406282618641853, 0.001592099666595459]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 4.0, 7.0, 8.0, 13.0, 15.0, 14.0, 16.0, 11.0, 13.0, 17.0, 28.0, 24.0, 23.0, 44.0, 38.0, 36.0, 43.0, 41.0, 53.0, 39.0, 40.0, 44.0, 48.0, 34.0, 38.0, 39.0, 32.0, 36.0, 20.0, 28.0, 19.0, 26.0, 16.0, 20.0, 11.0, 9.0, 11.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.75, -7.50860595703125, -7.2672119140625, -7.02581787109375, -6.784423828125, -6.54302978515625, -6.3016357421875, -6.06024169921875, -5.81884765625, -5.57745361328125, -5.3360595703125, -5.09466552734375, -4.853271484375, -4.61187744140625, -4.3704833984375, -4.12908935546875, -3.8876953125, -3.64630126953125, -3.4049072265625, -3.16351318359375, -2.922119140625, -2.68072509765625, -2.4393310546875, -2.19793701171875, -1.95654296875, -1.71514892578125, -1.4737548828125, -1.23236083984375, -0.990966796875, -0.74957275390625, -0.5081787109375, -0.26678466796875, -0.025390625, 0.21600341796875, 0.4573974609375, 0.69879150390625, 0.940185546875, 1.18157958984375, 1.4229736328125, 1.66436767578125, 1.90576171875, 2.14715576171875, 2.3885498046875, 2.62994384765625, 2.871337890625, 3.11273193359375, 3.3541259765625, 3.59552001953125, 3.8369140625, 4.07830810546875, 4.3197021484375, 4.56109619140625, 4.802490234375, 5.04388427734375, 5.2852783203125, 5.52667236328125, 5.76806640625, 6.00946044921875, 6.2508544921875, 6.49224853515625, 6.733642578125, 6.97503662109375, 7.2164306640625, 7.45782470703125, 7.69921875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 4.0, 6.0, 6.0, 9.0, 17.0, 22.0, 26.0, 33.0, 60.0, 64.0, 123.0, 207.0, 326.0, 563.0, 1064.0, 1966.0, 4034.0, 8334.0, 18161.0, 43248.0, 119212.0, 364917.0, 315935.0, 101540.0, 37663.0, 15746.0, 7390.0, 3626.0, 1848.0, 1048.0, 533.0, 315.0, 168.0, 105.0, 64.0, 49.0, 31.0, 26.0, 15.0, 9.0, 10.0, 13.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.57421875, -6.3682861328125, -6.162353515625, -5.9564208984375, -5.75048828125, -5.5445556640625, -5.338623046875, -5.1326904296875, -4.9267578125, -4.7208251953125, -4.514892578125, -4.3089599609375, -4.10302734375, -3.8970947265625, -3.691162109375, -3.4852294921875, -3.279296875, -3.0733642578125, -2.867431640625, -2.6614990234375, -2.45556640625, -2.2496337890625, -2.043701171875, -1.8377685546875, -1.6318359375, -1.4259033203125, -1.219970703125, -1.0140380859375, -0.80810546875, -0.6021728515625, -0.396240234375, -0.1903076171875, 0.015625, 0.2215576171875, 0.427490234375, 0.6334228515625, 0.83935546875, 1.0452880859375, 1.251220703125, 1.4571533203125, 1.6630859375, 1.8690185546875, 2.074951171875, 2.2808837890625, 2.48681640625, 2.6927490234375, 2.898681640625, 3.1046142578125, 3.310546875, 3.5164794921875, 3.722412109375, 3.9283447265625, 4.13427734375, 4.3402099609375, 4.546142578125, 4.7520751953125, 4.9580078125, 5.1639404296875, 5.369873046875, 5.5758056640625, 5.78173828125, 5.9876708984375, 6.193603515625, 6.3995361328125, 6.60546875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 7.0, 25.0, 12.0, 12.0, 20.0, 27.0, 29.0, 25.0, 26.0, 24.0, 40.0, 36.0, 53.0, 90.0, 143.0, 1417.0, 408.0, 139.0, 62.0, 49.0, 45.0, 27.0, 24.0, 27.0, 33.0, 26.0, 26.0, 26.0, 17.0, 17.0, 21.0, 10.0, 9.0, 4.0, 10.0, 8.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.215576171875, -17.54052734375, -16.865478515625, -16.1904296875, -15.515380859375, -14.84033203125, -14.165283203125, -13.490234375, -12.815185546875, -12.14013671875, -11.465087890625, -10.7900390625, -10.114990234375, -9.43994140625, -8.764892578125, -8.08984375, -7.414794921875, -6.73974609375, -6.064697265625, -5.3896484375, -4.714599609375, -4.03955078125, -3.364501953125, -2.689453125, -2.014404296875, -1.33935546875, -0.664306640625, 0.0107421875, 0.685791015625, 1.36083984375, 2.035888671875, 2.7109375, 3.385986328125, 4.06103515625, 4.736083984375, 5.4111328125, 6.086181640625, 6.76123046875, 7.436279296875, 8.111328125, 8.786376953125, 9.46142578125, 10.136474609375, 10.8115234375, 11.486572265625, 12.16162109375, 12.836669921875, 13.51171875, 14.186767578125, 14.86181640625, 15.536865234375, 16.2119140625, 16.886962890625, 17.56201171875, 18.237060546875, 18.912109375, 19.587158203125, 20.26220703125, 20.937255859375, 21.6123046875, 22.287353515625, 22.96240234375, 23.637451171875, 24.3125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 4.0, 8.0, 9.0, 11.0, 6.0, 10.0, 20.0, 34.0, 26.0, 34.0, 64.0, 64.0, 64.0, 98.0, 130.0, 177.0, 231.0, 374.0, 832.0, 5084.0, 469958.0, 2654442.0, 11340.0, 1145.0, 444.0, 237.0, 192.0, 153.0, 103.0, 69.0, 73.0, 47.0, 48.0, 32.0, 34.0, 22.0, 17.0, 12.0, 15.0, 9.0, 7.0, 6.0, 0.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.125, -39.9541015625, -38.783203125, -37.6123046875, -36.44140625, -35.2705078125, -34.099609375, -32.9287109375, -31.7578125, -30.5869140625, -29.416015625, -28.2451171875, -27.07421875, -25.9033203125, -24.732421875, -23.5615234375, -22.390625, -21.2197265625, -20.048828125, -18.8779296875, -17.70703125, -16.5361328125, -15.365234375, -14.1943359375, -13.0234375, -11.8525390625, -10.681640625, -9.5107421875, -8.33984375, -7.1689453125, -5.998046875, -4.8271484375, -3.65625, -2.4853515625, -1.314453125, -0.1435546875, 1.02734375, 2.1982421875, 3.369140625, 4.5400390625, 5.7109375, 6.8818359375, 8.052734375, 9.2236328125, 10.39453125, 11.5654296875, 12.736328125, 13.9072265625, 15.078125, 16.2490234375, 17.419921875, 18.5908203125, 19.76171875, 20.9326171875, 22.103515625, 23.2744140625, 24.4453125, 25.6162109375, 26.787109375, 27.9580078125, 29.12890625, 30.2998046875, 31.470703125, 32.6416015625, 33.8125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 24.0, 114.0, 304.0, 347.0, 165.0, 47.0, 12.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.7906265258789, -66.8886947631836, -64.98677062988281, -63.0848388671875, -61.18291091918945, -59.280982971191406, -57.379051208496094, -55.47712326049805, -53.5751953125, -51.67326736450195, -49.77133560180664, -47.869407653808594, -45.96747970581055, -44.0655517578125, -42.16361999511719, -40.26169204711914, -38.35976028442383, -36.45783233642578, -34.55590057373047, -32.65397262573242, -30.752044677734375, -28.850114822387695, -26.948184967041016, -25.04625701904297, -23.14432716369629, -21.24239730834961, -19.340469360351562, -17.438539505004883, -15.53661060333252, -13.634681701660156, -11.732751846313477, -9.830822944641113, -7.928897857666016, -6.026968955993652, -4.125039577484131, -2.2231101989746094, -0.3211812973022461, 1.5807476043701172, 3.482677459716797, 5.38460636138916, 7.286535263061523, 9.188464164733887, 11.09039306640625, 12.99232292175293, 14.894251823425293, 16.796180725097656, 18.698110580444336, 20.600040435791016, 22.501968383789062, 24.403898239135742, 26.30582618713379, 28.20775604248047, 30.109683990478516, 32.01161193847656, 33.913543701171875, 35.81547164916992, 37.71739959716797, 39.619327545166016, 41.52125930786133, 43.423187255859375, 45.32511520385742, 47.22704315185547, 49.12897491455078, 51.03090286254883, 52.93283462524414]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 7.0, 10.0, 10.0, 11.0, 10.0, 15.0, 18.0, 19.0, 16.0, 18.0, 23.0, 24.0, 35.0, 20.0, 46.0, 49.0, 34.0, 40.0, 50.0, 39.0, 38.0, 43.0, 44.0, 36.0, 48.0, 28.0, 27.0, 30.0, 25.0, 30.0, 21.0, 20.0, 24.0, 15.0, 17.0, 10.0, 8.0, 8.0, 6.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-52.45960998535156, -50.79045104980469, -49.12128829956055, -47.45212936401367, -45.78296661376953, -44.113807678222656, -42.444644927978516, -40.77548599243164, -39.1063232421875, -37.437164306640625, -35.768001556396484, -34.09884262084961, -32.42967987060547, -30.760520935058594, -29.091358184814453, -27.422199249267578, -25.75303840637207, -24.083877563476562, -22.414716720581055, -20.745555877685547, -19.07639503479004, -17.40723419189453, -15.73807430267334, -14.068913459777832, -12.399752616882324, -10.730591773986816, -9.061430931091309, -7.392270565032959, -5.723109722137451, -4.053949356079102, -2.3847885131835938, -0.7156276702880859, 0.9535331726074219, 2.6226940155029297, 4.2918548583984375, 5.961015224456787, 7.630176067352295, 9.299336433410645, 10.968497276306152, 12.63765811920166, 14.306818962097168, 15.975979804992676, 17.645139694213867, 19.314300537109375, 20.983461380004883, 22.65262222290039, 24.3217830657959, 25.990943908691406, 27.660104751586914, 29.329265594482422, 30.99842643737793, 32.66758728027344, 34.33674621582031, 36.00590896606445, 37.67506790161133, 39.34423065185547, 41.013389587402344, 42.68254852294922, 44.35171127319336, 46.020870208740234, 47.690032958984375, 49.35919189453125, 51.02835464477539, 52.697513580322266, 54.366676330566406]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 2.0, 2.0, 5.0, 7.0, 11.0, 5.0, 16.0, 15.0, 14.0, 12.0, 13.0, 18.0, 26.0, 25.0, 32.0, 37.0, 37.0, 41.0, 41.0, 37.0, 49.0, 37.0, 43.0, 49.0, 46.0, 39.0, 50.0, 31.0, 26.0, 41.0, 26.0, 24.0, 19.0, 23.0, 18.0, 18.0, 12.0, 15.0, 7.0, 7.0, 10.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.140625, -7.888916015625, -7.63720703125, -7.385498046875, -7.1337890625, -6.882080078125, -6.63037109375, -6.378662109375, -6.126953125, -5.875244140625, -5.62353515625, -5.371826171875, -5.1201171875, -4.868408203125, -4.61669921875, -4.364990234375, -4.11328125, -3.861572265625, -3.60986328125, -3.358154296875, -3.1064453125, -2.854736328125, -2.60302734375, -2.351318359375, -2.099609375, -1.847900390625, -1.59619140625, -1.344482421875, -1.0927734375, -0.841064453125, -0.58935546875, -0.337646484375, -0.0859375, 0.165771484375, 0.41748046875, 0.669189453125, 0.9208984375, 1.172607421875, 1.42431640625, 1.676025390625, 1.927734375, 2.179443359375, 2.43115234375, 2.682861328125, 2.9345703125, 3.186279296875, 3.43798828125, 3.689697265625, 3.94140625, 4.193115234375, 4.44482421875, 4.696533203125, 4.9482421875, 5.199951171875, 5.45166015625, 5.703369140625, 5.955078125, 6.206787109375, 6.45849609375, 6.710205078125, 6.9619140625, 7.213623046875, 7.46533203125, 7.717041015625, 7.96875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 10.0, 11.0, 11.0, 15.0, 22.0, 19.0, 25.0, 35.0, 45.0, 55.0, 78.0, 114.0, 205.0, 397.0, 1302.0, 7260.0, 119773.0, 3114780.0, 920951.0, 24663.0, 3005.0, 664.0, 244.0, 146.0, 114.0, 72.0, 53.0, 29.0, 30.0, 26.0, 22.0, 13.0, 21.0, 11.0, 17.0, 3.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.515625, -28.690185546875, -27.86474609375, -27.039306640625, -26.2138671875, -25.388427734375, -24.56298828125, -23.737548828125, -22.912109375, -22.086669921875, -21.26123046875, -20.435791015625, -19.6103515625, -18.784912109375, -17.95947265625, -17.134033203125, -16.30859375, -15.483154296875, -14.65771484375, -13.832275390625, -13.0068359375, -12.181396484375, -11.35595703125, -10.530517578125, -9.705078125, -8.879638671875, -8.05419921875, -7.228759765625, -6.4033203125, -5.577880859375, -4.75244140625, -3.927001953125, -3.1015625, -2.276123046875, -1.45068359375, -0.625244140625, 0.2001953125, 1.025634765625, 1.85107421875, 2.676513671875, 3.501953125, 4.327392578125, 5.15283203125, 5.978271484375, 6.8037109375, 7.629150390625, 8.45458984375, 9.280029296875, 10.10546875, 10.930908203125, 11.75634765625, 12.581787109375, 13.4072265625, 14.232666015625, 15.05810546875, 15.883544921875, 16.708984375, 17.534423828125, 18.35986328125, 19.185302734375, 20.0107421875, 20.836181640625, 21.66162109375, 22.487060546875, 23.3125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 12.0, 10.0, 5.0, 12.0, 19.0, 26.0, 34.0, 43.0, 64.0, 59.0, 114.0, 123.0, 162.0, 204.0, 301.0, 359.0, 422.0, 469.0, 388.0, 313.0, 232.0, 160.0, 133.0, 93.0, 82.0, 63.0, 42.0, 40.0, 24.0, 18.0, 17.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.606201171875, -13.22021484375, -12.834228515625, -12.4482421875, -12.062255859375, -11.67626953125, -11.290283203125, -10.904296875, -10.518310546875, -10.13232421875, -9.746337890625, -9.3603515625, -8.974365234375, -8.58837890625, -8.202392578125, -7.81640625, -7.430419921875, -7.04443359375, -6.658447265625, -6.2724609375, -5.886474609375, -5.50048828125, -5.114501953125, -4.728515625, -4.342529296875, -3.95654296875, -3.570556640625, -3.1845703125, -2.798583984375, -2.41259765625, -2.026611328125, -1.640625, -1.254638671875, -0.86865234375, -0.482666015625, -0.0966796875, 0.289306640625, 0.67529296875, 1.061279296875, 1.447265625, 1.833251953125, 2.21923828125, 2.605224609375, 2.9912109375, 3.377197265625, 3.76318359375, 4.149169921875, 4.53515625, 4.921142578125, 5.30712890625, 5.693115234375, 6.0791015625, 6.465087890625, 6.85107421875, 7.237060546875, 7.623046875, 8.009033203125, 8.39501953125, 8.781005859375, 9.1669921875, 9.552978515625, 9.93896484375, 10.324951171875, 10.7109375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 2.0, 10.0, 8.0, 6.0, 8.0, 11.0, 17.0, 26.0, 26.0, 36.0, 41.0, 49.0, 71.0, 92.0, 138.0, 138.0, 173.0, 242.0, 385.0, 1000.0, 7441.0, 393235.0, 3746969.0, 39697.0, 2419.0, 645.0, 341.0, 218.0, 209.0, 130.0, 113.0, 78.0, 60.0, 55.0, 47.0, 35.0, 32.0, 24.0, 13.0, 8.0, 11.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-55.6875, -54.06201171875, -52.4365234375, -50.81103515625, -49.185546875, -47.56005859375, -45.9345703125, -44.30908203125, -42.68359375, -41.05810546875, -39.4326171875, -37.80712890625, -36.181640625, -34.55615234375, -32.9306640625, -31.30517578125, -29.6796875, -28.05419921875, -26.4287109375, -24.80322265625, -23.177734375, -21.55224609375, -19.9267578125, -18.30126953125, -16.67578125, -15.05029296875, -13.4248046875, -11.79931640625, -10.173828125, -8.54833984375, -6.9228515625, -5.29736328125, -3.671875, -2.04638671875, -0.4208984375, 1.20458984375, 2.830078125, 4.45556640625, 6.0810546875, 7.70654296875, 9.33203125, 10.95751953125, 12.5830078125, 14.20849609375, 15.833984375, 17.45947265625, 19.0849609375, 20.71044921875, 22.3359375, 23.96142578125, 25.5869140625, 27.21240234375, 28.837890625, 30.46337890625, 32.0888671875, 33.71435546875, 35.33984375, 36.96533203125, 38.5908203125, 40.21630859375, 41.841796875, 43.46728515625, 45.0927734375, 46.71826171875, 48.34375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 17.0, 241.0, 518.0, 201.0, 39.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.95737838745117, -31.95941734313965, -24.961456298828125, -17.9634952545166, -10.965534210205078, -3.967571258544922, 3.0303878784179688, 10.02834701538086, 17.026309967041016, 24.02427101135254, 31.022232055664062, 38.02019500732422, 45.01815414428711, 52.016117095947266, 59.014076232910156, 66.01203918457031, 73.00999450683594, 80.0079574584961, 87.00592041015625, 94.00387573242188, 101.00183868408203, 107.99980163574219, 114.99775695800781, 121.99571990966797, 128.99368286132812, 135.99163818359375, 142.98960876464844, 149.98756408691406, 156.98553466796875, 163.98348999023438, 170.9814453125, 177.97940063476562, 184.97738647460938, 191.975341796875, 198.9733123779297, 205.9712677001953, 212.96923828125, 219.96719360351562, 226.96514892578125, 233.96310424804688, 240.96107482910156, 247.9590301513672, 254.95700073242188, 261.9549560546875, 268.9529113769531, 275.95086669921875, 282.9488525390625, 289.9468078613281, 296.94476318359375, 303.9427185058594, 310.940673828125, 317.93865966796875, 324.9366149902344, 331.9345703125, 338.9325256347656, 345.93048095703125, 352.928466796875, 359.9264221191406, 366.92437744140625, 373.92236328125, 380.9203186035156, 387.91827392578125, 394.9162292480469, 401.9141845703125, 408.9121398925781]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 8.0, 6.0, 6.0, 12.0, 15.0, 17.0, 23.0, 22.0, 23.0, 22.0, 22.0, 30.0, 32.0, 43.0, 33.0, 35.0, 36.0, 37.0, 41.0, 40.0, 51.0, 48.0, 37.0, 49.0, 47.0, 31.0, 38.0, 17.0, 31.0, 16.0, 23.0, 17.0, 19.0, 13.0, 9.0, 11.0, 4.0, 5.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.64849853515625, -44.292381286621094, -42.9362678527832, -41.58015060424805, -40.224037170410156, -38.867919921875, -37.511802673339844, -36.15568542480469, -34.7995719909668, -33.44345474243164, -32.08734130859375, -30.731224060058594, -29.37510871887207, -28.018993377685547, -26.66287612915039, -25.306760787963867, -23.950645446777344, -22.59453010559082, -21.238414764404297, -19.88229751586914, -18.526182174682617, -17.170066833496094, -15.813950538635254, -14.457834243774414, -13.10171890258789, -11.745603561401367, -10.389487266540527, -9.033370971679688, -7.677255630493164, -6.321139812469482, -4.965023994445801, -3.608907699584961, -2.2527923583984375, -0.8966765403747559, 0.4594392776489258, 1.8155550956726074, 3.171670913696289, 4.527786731719971, 5.883902549743652, 7.240018844604492, 8.596134185791016, 9.952249526977539, 11.308365821838379, 12.664482116699219, 14.020597457885742, 15.376712799072266, 16.732830047607422, 18.088945388793945, 19.44506072998047, 20.801176071166992, 22.157291412353516, 23.513408660888672, 24.869524002075195, 26.22563934326172, 27.581756591796875, 28.9378719329834, 30.293987274169922, 31.650102615356445, 33.00621795654297, 34.362335205078125, 35.71845245361328, 37.07456588745117, 38.43068313598633, 39.78679656982422, 41.142913818359375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 10.0, 11.0, 17.0, 15.0, 17.0, 19.0, 27.0, 20.0, 28.0, 26.0, 35.0, 37.0, 29.0, 30.0, 39.0, 40.0, 40.0, 43.0, 35.0, 35.0, 39.0, 36.0, 32.0, 24.0, 26.0, 29.0, 32.0, 27.0, 23.0, 17.0, 23.0, 17.0, 16.0, 12.0, 13.0, 9.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.48828125, -7.265625, -7.04296875, -6.8203125, -6.59765625, -6.375, -6.15234375, -5.9296875, -5.70703125, -5.484375, -5.26171875, -5.0390625, -4.81640625, -4.59375, -4.37109375, -4.1484375, -3.92578125, -3.703125, -3.48046875, -3.2578125, -3.03515625, -2.8125, -2.58984375, -2.3671875, -2.14453125, -1.921875, -1.69921875, -1.4765625, -1.25390625, -1.03125, -0.80859375, -0.5859375, -0.36328125, -0.140625, 0.08203125, 0.3046875, 0.52734375, 0.75, 0.97265625, 1.1953125, 1.41796875, 1.640625, 1.86328125, 2.0859375, 2.30859375, 2.53125, 2.75390625, 2.9765625, 3.19921875, 3.421875, 3.64453125, 3.8671875, 4.08984375, 4.3125, 4.53515625, 4.7578125, 4.98046875, 5.203125, 5.42578125, 5.6484375, 5.87109375, 6.09375, 6.31640625, 6.5390625, 6.76171875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 9.0, 4.0, 22.0, 22.0, 39.0, 53.0, 64.0, 100.0, 139.0, 213.0, 279.0, 470.0, 655.0, 934.0, 1448.0, 2078.0, 3140.0, 4640.0, 7079.0, 10848.0, 16367.0, 25154.0, 40267.0, 67113.0, 121059.0, 218376.0, 220528.0, 123285.0, 68822.0, 41265.0, 25469.0, 16273.0, 10518.0, 7197.0, 4701.0, 3142.0, 2158.0, 1495.0, 975.0, 699.0, 459.0, 322.0, 216.0, 152.0, 101.0, 67.0, 48.0, 35.0, 25.0, 11.0, 10.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.0595703125, -1.0264739990234375, -0.993377685546875, -0.9602813720703125, -0.92718505859375, -0.8940887451171875, -0.860992431640625, -0.8278961181640625, -0.7947998046875, -0.7617034912109375, -0.728607177734375, -0.6955108642578125, -0.66241455078125, -0.6293182373046875, -0.596221923828125, -0.5631256103515625, -0.530029296875, -0.4969329833984375, -0.463836669921875, -0.4307403564453125, -0.39764404296875, -0.3645477294921875, -0.331451416015625, -0.2983551025390625, -0.2652587890625, -0.2321624755859375, -0.199066162109375, -0.1659698486328125, -0.13287353515625, -0.0997772216796875, -0.066680908203125, -0.0335845947265625, -0.00048828125, 0.0326080322265625, 0.065704345703125, 0.0988006591796875, 0.13189697265625, 0.1649932861328125, 0.198089599609375, 0.2311859130859375, 0.2642822265625, 0.2973785400390625, 0.330474853515625, 0.3635711669921875, 0.39666748046875, 0.4297637939453125, 0.462860107421875, 0.4959564208984375, 0.529052734375, 0.5621490478515625, 0.595245361328125, 0.6283416748046875, 0.66143798828125, 0.6945343017578125, 0.727630615234375, 0.7607269287109375, 0.7938232421875, 0.8269195556640625, 0.860015869140625, 0.8931121826171875, 0.92620849609375, 0.9593048095703125, 0.992401123046875, 1.0254974365234375, 1.05859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 12.0, 11.0, 7.0, 15.0, 17.0, 16.0, 23.0, 24.0, 29.0, 33.0, 26.0, 25.0, 27.0, 31.0, 43.0, 26.0, 47.0, 45.0, 1059.0, 42.0, 41.0, 35.0, 40.0, 36.0, 38.0, 31.0, 37.0, 34.0, 25.0, 24.0, 12.0, 21.0, 20.0, 13.0, 9.0, 11.0, 5.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.20703125, -5.0574951171875, -4.907958984375, -4.7584228515625, -4.60888671875, -4.4593505859375, -4.309814453125, -4.1602783203125, -4.0107421875, -3.8612060546875, -3.711669921875, -3.5621337890625, -3.41259765625, -3.2630615234375, -3.113525390625, -2.9639892578125, -2.814453125, -2.6649169921875, -2.515380859375, -2.3658447265625, -2.21630859375, -2.0667724609375, -1.917236328125, -1.7677001953125, -1.6181640625, -1.4686279296875, -1.319091796875, -1.1695556640625, -1.02001953125, -0.8704833984375, -0.720947265625, -0.5714111328125, -0.421875, -0.2723388671875, -0.122802734375, 0.0267333984375, 0.17626953125, 0.3258056640625, 0.475341796875, 0.6248779296875, 0.7744140625, 0.9239501953125, 1.073486328125, 1.2230224609375, 1.37255859375, 1.5220947265625, 1.671630859375, 1.8211669921875, 1.970703125, 2.1202392578125, 2.269775390625, 2.4193115234375, 2.56884765625, 2.7183837890625, 2.867919921875, 3.0174560546875, 3.1669921875, 3.3165283203125, 3.466064453125, 3.6156005859375, 3.76513671875, 3.9146728515625, 4.064208984375, 4.2137451171875, 4.36328125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 14.0, 18.0, 18.0, 28.0, 63.0, 78.0, 110.0, 153.0, 238.0, 375.0, 539.0, 840.0, 1162.0, 1762.0, 2630.0, 4138.0, 6182.0, 9691.0, 15456.0, 24786.0, 41155.0, 72118.0, 138765.0, 1307602.0, 213869.0, 106261.0, 57805.0, 33924.0, 20650.0, 12897.0, 8320.0, 5128.0, 3441.0, 2279.0, 1510.0, 1024.0, 692.0, 459.0, 310.0, 212.0, 130.0, 101.0, 65.0, 50.0, 29.0, 18.0, 15.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9501953125, -0.9183197021484375, -0.886444091796875, -0.8545684814453125, -0.82269287109375, -0.7908172607421875, -0.758941650390625, -0.7270660400390625, -0.6951904296875, -0.6633148193359375, -0.631439208984375, -0.5995635986328125, -0.56768798828125, -0.5358123779296875, -0.503936767578125, -0.4720611572265625, -0.440185546875, -0.4083099365234375, -0.376434326171875, -0.3445587158203125, -0.31268310546875, -0.2808074951171875, -0.248931884765625, -0.2170562744140625, -0.1851806640625, -0.1533050537109375, -0.121429443359375, -0.0895538330078125, -0.05767822265625, -0.0258026123046875, 0.006072998046875, 0.0379486083984375, 0.06982421875, 0.1016998291015625, 0.133575439453125, 0.1654510498046875, 0.19732666015625, 0.2292022705078125, 0.261077880859375, 0.2929534912109375, 0.3248291015625, 0.3567047119140625, 0.388580322265625, 0.4204559326171875, 0.45233154296875, 0.4842071533203125, 0.516082763671875, 0.5479583740234375, 0.579833984375, 0.6117095947265625, 0.643585205078125, 0.6754608154296875, 0.70733642578125, 0.7392120361328125, 0.771087646484375, 0.8029632568359375, 0.8348388671875, 0.8667144775390625, 0.898590087890625, 0.9304656982421875, 0.96234130859375, 0.9942169189453125, 1.026092529296875, 1.0579681396484375, 1.08984375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 18.0, 17.0, 13.0, 21.0, 23.0, 25.0, 31.0, 36.0, 51.0, 59.0, 51.0, 58.0, 53.0, 59.0, 47.0, 67.0, 58.0, 48.0, 40.0, 29.0, 38.0, 34.0, 20.0, 22.0, 13.0, 10.0, 7.0, 4.0, 9.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0022430419921875, -0.0021635890007019043, -0.0020841360092163086, -0.002004683017730713, -0.0019252300262451172, -0.0018457770347595215, -0.0017663240432739258, -0.00168687105178833, -0.0016074180603027344, -0.0015279650688171387, -0.001448512077331543, -0.0013690590858459473, -0.0012896060943603516, -0.0012101531028747559, -0.0011307001113891602, -0.0010512471199035645, -0.0009717941284179688, -0.000892341136932373, -0.0008128881454467773, -0.0007334351539611816, -0.0006539821624755859, -0.0005745291709899902, -0.0004950761795043945, -0.00041562318801879883, -0.0003361701965332031, -0.0002567172050476074, -0.00017726421356201172, -9.781122207641602e-05, -1.8358230590820312e-05, 6.109476089477539e-05, 0.0001405477523803711, 0.0002200007438659668, 0.0002994537353515625, 0.0003789067268371582, 0.0004583597183227539, 0.0005378127098083496, 0.0006172657012939453, 0.000696718692779541, 0.0007761716842651367, 0.0008556246757507324, 0.0009350776672363281, 0.0010145306587219238, 0.0010939836502075195, 0.0011734366416931152, 0.001252889633178711, 0.0013323426246643066, 0.0014117956161499023, 0.001491248607635498, 0.0015707015991210938, 0.0016501545906066895, 0.0017296075820922852, 0.0018090605735778809, 0.0018885135650634766, 0.0019679665565490723, 0.002047419548034668, 0.0021268725395202637, 0.0022063255310058594, 0.002285778522491455, 0.0023652315139770508, 0.0024446845054626465, 0.002524137496948242, 0.002603590488433838, 0.0026830434799194336, 0.0027624964714050293, 0.002841949462890625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 4.0, 11.0, 10.0, 10.0, 27.0, 14.0, 35.0, 50.0, 63.0, 105.0, 107.0, 177.0, 391.0, 1124.0, 664490.0, 379934.0, 1029.0, 354.0, 188.0, 113.0, 62.0, 54.0, 38.0, 38.0, 32.0, 24.0, 12.0, 13.0, 11.0, 9.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06878662109375, -0.06676149368286133, -0.06473636627197266, -0.06271123886108398, -0.06068611145019531, -0.05866098403930664, -0.05663585662841797, -0.0546107292175293, -0.052585601806640625, -0.05056047439575195, -0.04853534698486328, -0.04651021957397461, -0.04448509216308594, -0.042459964752197266, -0.040434837341308594, -0.03840970993041992, -0.03638458251953125, -0.03435945510864258, -0.032334327697753906, -0.030309200286865234, -0.028284072875976562, -0.02625894546508789, -0.02423381805419922, -0.022208690643310547, -0.020183563232421875, -0.018158435821533203, -0.01613330841064453, -0.01410818099975586, -0.012083053588867188, -0.010057926177978516, -0.008032798767089844, -0.006007671356201172, -0.0039825439453125, -0.001957416534423828, 6.771087646484375e-05, 0.0020928382873535156, 0.0041179656982421875, 0.006143093109130859, 0.008168220520019531, 0.010193347930908203, 0.012218475341796875, 0.014243602752685547, 0.01626873016357422, 0.01829385757446289, 0.020318984985351562, 0.022344112396240234, 0.024369239807128906, 0.026394367218017578, 0.02841949462890625, 0.030444622039794922, 0.032469749450683594, 0.034494876861572266, 0.03652000427246094, 0.03854513168334961, 0.04057025909423828, 0.04259538650512695, 0.044620513916015625, 0.0466456413269043, 0.04867076873779297, 0.05069589614868164, 0.05272102355957031, 0.054746150970458984, 0.056771278381347656, 0.05879640579223633, 0.060821533203125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 15.0, 304.0, 654.0, 46.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01918666996061802, -0.018812132999300957, -0.018437596037983894, -0.018063057214021683, -0.01768852025270462, -0.017313983291387558, -0.016939446330070496, -0.016564909368753433, -0.01619037240743637, -0.01581583544611931, -0.015441297553479671, -0.015066760592162609, -0.014692222699522972, -0.01431768573820591, -0.013943148776888847, -0.013568611815571785, -0.013194072991609573, -0.012819536030292511, -0.012444998137652874, -0.012070461176335812, -0.011695923283696175, -0.011321386322379112, -0.01094684936106205, -0.010572312399744987, -0.01019777450710535, -0.009823237545788288, -0.009448699653148651, -0.009074162691831589, -0.008699625730514526, -0.00832508783787489, -0.007950550876557827, -0.007576013449579477, -0.007201475091278553, -0.006826937664300203, -0.006452400237321854, -0.006077863276004791, -0.005703325849026442, -0.005328788422048092, -0.0049542514607310295, -0.00457971403375268, -0.00420517660677433, -0.0038306391797959805, -0.0034561019856482744, -0.0030815647915005684, -0.0027070273645222187, -0.002332489937543869, -0.001957952743396163, -0.001583415549248457, -0.0012088781222701073, -0.0008343408117070794, -0.00045980350114405155, -8.526619058102369e-05, 0.00028927111998200417, 0.000663808430545032, 0.0010383457411080599, 0.001412882935255766, 0.0017874203622341156, 0.0021619577892124653, 0.0025364949833601713, 0.0029110321775078773, 0.003285569604486227, 0.0036601070314645767, 0.004034643992781639, 0.004409181419759989, 0.0047837188467383385]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 8.0, 13.0, 16.0, 15.0, 16.0, 27.0, 30.0, 28.0, 43.0, 34.0, 34.0, 37.0, 33.0, 41.0, 52.0, 51.0, 46.0, 37.0, 41.0, 42.0, 31.0, 33.0, 33.0, 30.0, 33.0, 27.0, 22.0, 17.0, 16.0, 17.0, 15.0, 12.0, 14.0, 12.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0014487504959106445, -0.0014047836884856224, -0.0013608168810606003, -0.0013168500736355782, -0.001272883266210556, -0.001228916458785534, -0.0011849496513605118, -0.0011409828439354897, -0.0010970160365104675, -0.0010530492290854454, -0.0010090824216604233, -0.0009651156142354012, -0.000921148806810379, -0.0008771819993853569, -0.0008332151919603348, -0.0007892483845353127, -0.0007452815771102905, -0.0007013147696852684, -0.0006573479622602463, -0.0006133811548352242, -0.000569414347410202, -0.0005254475399851799, -0.0004814807325601578, -0.00043751392513513565, -0.0003935471177101135, -0.0003495803102850914, -0.0003056135028600693, -0.00026164669543504715, -0.00021767988801002502, -0.0001737130805850029, -0.00012974627315998077, -8.577946573495865e-05, -4.1812658309936523e-05, 2.154149115085602e-06, 4.612095654010773e-05, 9.008776396512985e-05, 0.00013405457139015198, 0.0001780213788151741, 0.00022198818624019623, 0.00026595499366521835, 0.0003099218010902405, 0.0003538886085152626, 0.00039785541594028473, 0.00044182222336530685, 0.000485789030790329, 0.0005297558382153511, 0.0005737226456403732, 0.0006176894530653954, 0.0006616562604904175, 0.0007056230679154396, 0.0007495898753404617, 0.0007935566827654839, 0.000837523490190506, 0.0008814902976155281, 0.0009254571050405502, 0.0009694239124655724, 0.0010133907198905945, 0.0010573575273156166, 0.0011013243347406387, 0.0011452911421656609, 0.001189257949590683, 0.0012332247570157051, 0.0012771915644407272, 0.0013211583718657494, 0.0013651251792907715]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 7.0, 10.0, 11.0, 10.0, 11.0, 17.0, 15.0, 17.0, 19.0, 27.0, 20.0, 28.0, 26.0, 35.0, 37.0, 29.0, 30.0, 39.0, 40.0, 40.0, 43.0, 35.0, 35.0, 39.0, 36.0, 32.0, 24.0, 26.0, 29.0, 32.0, 27.0, 23.0, 17.0, 23.0, 17.0, 16.0, 12.0, 13.0, 9.0, 9.0, 5.0, 4.0, 6.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.48828125, -7.265625, -7.04296875, -6.8203125, -6.59765625, -6.375, -6.15234375, -5.9296875, -5.70703125, -5.484375, -5.26171875, -5.0390625, -4.81640625, -4.59375, -4.37109375, -4.1484375, -3.92578125, -3.703125, -3.48046875, -3.2578125, -3.03515625, -2.8125, -2.58984375, -2.3671875, -2.14453125, -1.921875, -1.69921875, -1.4765625, -1.25390625, -1.03125, -0.80859375, -0.5859375, -0.36328125, -0.140625, 0.08203125, 0.3046875, 0.52734375, 0.75, 0.97265625, 1.1953125, 1.41796875, 1.640625, 1.86328125, 2.0859375, 2.30859375, 2.53125, 2.75390625, 2.9765625, 3.19921875, 3.421875, 3.64453125, 3.8671875, 4.08984375, 4.3125, 4.53515625, 4.7578125, 4.98046875, 5.203125, 5.42578125, 5.6484375, 5.87109375, 6.09375, 6.31640625, 6.5390625, 6.76171875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 7.0, 10.0, 15.0, 16.0, 13.0, 26.0, 22.0, 30.0, 34.0, 53.0, 63.0, 91.0, 112.0, 166.0, 241.0, 420.0, 732.0, 2259.0, 9646.0, 61834.0, 677497.0, 260001.0, 27134.0, 5059.0, 1371.0, 592.0, 287.0, 203.0, 148.0, 108.0, 72.0, 54.0, 46.0, 42.0, 37.0, 24.0, 12.0, 11.0, 14.0, 10.0, 6.0, 6.0, 8.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-14.859375, -14.419677734375, -13.97998046875, -13.540283203125, -13.1005859375, -12.660888671875, -12.22119140625, -11.781494140625, -11.341796875, -10.902099609375, -10.46240234375, -10.022705078125, -9.5830078125, -9.143310546875, -8.70361328125, -8.263916015625, -7.82421875, -7.384521484375, -6.94482421875, -6.505126953125, -6.0654296875, -5.625732421875, -5.18603515625, -4.746337890625, -4.306640625, -3.866943359375, -3.42724609375, -2.987548828125, -2.5478515625, -2.108154296875, -1.66845703125, -1.228759765625, -0.7890625, -0.349365234375, 0.09033203125, 0.530029296875, 0.9697265625, 1.409423828125, 1.84912109375, 2.288818359375, 2.728515625, 3.168212890625, 3.60791015625, 4.047607421875, 4.4873046875, 4.927001953125, 5.36669921875, 5.806396484375, 6.24609375, 6.685791015625, 7.12548828125, 7.565185546875, 8.0048828125, 8.444580078125, 8.88427734375, 9.323974609375, 9.763671875, 10.203369140625, 10.64306640625, 11.082763671875, 11.5224609375, 11.962158203125, 12.40185546875, 12.841552734375, 13.28125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 13.0, 15.0, 16.0, 26.0, 17.0, 24.0, 26.0, 36.0, 33.0, 48.0, 42.0, 45.0, 52.0, 67.0, 195.0, 1653.0, 224.0, 76.0, 43.0, 51.0, 33.0, 40.0, 39.0, 30.0, 34.0, 15.0, 14.0, 13.0, 15.0, 17.0, 18.0, 9.0, 11.0, 5.0, 11.0, 7.0, 1.0, 8.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.65625, -22.92919921875, -22.2021484375, -21.47509765625, -20.748046875, -20.02099609375, -19.2939453125, -18.56689453125, -17.83984375, -17.11279296875, -16.3857421875, -15.65869140625, -14.931640625, -14.20458984375, -13.4775390625, -12.75048828125, -12.0234375, -11.29638671875, -10.5693359375, -9.84228515625, -9.115234375, -8.38818359375, -7.6611328125, -6.93408203125, -6.20703125, -5.47998046875, -4.7529296875, -4.02587890625, -3.298828125, -2.57177734375, -1.8447265625, -1.11767578125, -0.390625, 0.33642578125, 1.0634765625, 1.79052734375, 2.517578125, 3.24462890625, 3.9716796875, 4.69873046875, 5.42578125, 6.15283203125, 6.8798828125, 7.60693359375, 8.333984375, 9.06103515625, 9.7880859375, 10.51513671875, 11.2421875, 11.96923828125, 12.6962890625, 13.42333984375, 14.150390625, 14.87744140625, 15.6044921875, 16.33154296875, 17.05859375, 17.78564453125, 18.5126953125, 19.23974609375, 19.966796875, 20.69384765625, 21.4208984375, 22.14794921875, 22.875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 3.0, 7.0, 9.0, 6.0, 12.0, 11.0, 21.0, 16.0, 18.0, 19.0, 22.0, 35.0, 44.0, 45.0, 77.0, 92.0, 147.0, 258.0, 482.0, 1621.0, 53352.0, 3078260.0, 8973.0, 1042.0, 416.0, 189.0, 132.0, 83.0, 61.0, 52.0, 36.0, 26.0, 19.0, 31.0, 22.0, 18.0, 10.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.84375, -51.208984375, -49.57421875, -47.939453125, -46.3046875, -44.669921875, -43.03515625, -41.400390625, -39.765625, -38.130859375, -36.49609375, -34.861328125, -33.2265625, -31.591796875, -29.95703125, -28.322265625, -26.6875, -25.052734375, -23.41796875, -21.783203125, -20.1484375, -18.513671875, -16.87890625, -15.244140625, -13.609375, -11.974609375, -10.33984375, -8.705078125, -7.0703125, -5.435546875, -3.80078125, -2.166015625, -0.53125, 1.103515625, 2.73828125, 4.373046875, 6.0078125, 7.642578125, 9.27734375, 10.912109375, 12.546875, 14.181640625, 15.81640625, 17.451171875, 19.0859375, 20.720703125, 22.35546875, 23.990234375, 25.625, 27.259765625, 28.89453125, 30.529296875, 32.1640625, 33.798828125, 35.43359375, 37.068359375, 38.703125, 40.337890625, 41.97265625, 43.607421875, 45.2421875, 46.876953125, 48.51171875, 50.146484375, 51.78125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 7.0, 178.0, 632.0, 184.0, 17.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.809925079345703, -27.198936462402344, -23.58794593811035, -19.97695541381836, -16.365966796875, -12.75497817993164, -9.143987655639648, -5.532997131347656, -1.9220085144042969, 1.688981056213379, 5.299970626831055, 8.91096019744873, 12.521949768066406, 16.132938385009766, 19.743928909301758, 23.35491943359375, 26.96590805053711, 30.57689666748047, 34.187889099121094, 37.79887771606445, 41.40986633300781, 45.02085494995117, 48.63184356689453, 52.242835998535156, 55.853824615478516, 59.464813232421875, 63.0758056640625, 66.6867904663086, 70.29778289794922, 73.90876770019531, 77.51976013183594, 81.13075256347656, 84.74174499511719, 88.35273742675781, 91.9637222290039, 95.57471466064453, 99.18569946289062, 102.79669189453125, 106.40768432617188, 110.0186767578125, 113.6296615600586, 117.24065399169922, 120.85163879394531, 124.46263122558594, 128.07362365722656, 131.68460083007812, 135.29559326171875, 138.90658569335938, 142.517578125, 146.12857055664062, 149.73956298828125, 153.3505401611328, 156.96153259277344, 160.57252502441406, 164.1835174560547, 167.7945098876953, 171.40548706054688, 175.0164794921875, 178.62747192382812, 182.2384490966797, 185.8494415283203, 189.46043395996094, 193.07142639160156, 196.6824188232422, 200.2934112548828]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 4.0, 12.0, 16.0, 16.0, 12.0, 19.0, 20.0, 25.0, 26.0, 27.0, 34.0, 35.0, 49.0, 36.0, 39.0, 51.0, 40.0, 36.0, 48.0, 53.0, 42.0, 37.0, 41.0, 31.0, 25.0, 33.0, 28.0, 19.0, 14.0, 14.0, 14.0, 11.0, 17.0, 10.0, 10.0, 9.0, 3.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.43195343017578, -51.59483337402344, -49.75771713256836, -47.920597076416016, -46.08348083496094, -44.246360778808594, -42.409244537353516, -40.57212448120117, -38.735008239746094, -36.89788818359375, -35.06077194213867, -33.22365188598633, -31.38653564453125, -29.549415588378906, -27.712299346923828, -25.875179290771484, -24.038061141967773, -22.200942993164062, -20.36382484436035, -18.52670669555664, -16.68958854675293, -14.852469444274902, -13.015351295471191, -11.17823314666748, -9.34111499786377, -7.503996849060059, -5.666878700256348, -3.8297600746154785, -1.9926419258117676, -0.15552330017089844, 1.6815948486328125, 3.5187129974365234, 5.355831146240234, 7.192949295043945, 9.030067443847656, 10.867185592651367, 12.704303741455078, 14.541422843933105, 16.3785400390625, 18.215660095214844, 20.052776336669922, 21.889894485473633, 23.727012634277344, 25.564130783081055, 27.401248931884766, 29.23836898803711, 31.075485229492188, 32.91260528564453, 34.749725341796875, 36.58684539794922, 38.4239616394043, 40.26108169555664, 42.09819793701172, 43.93531799316406, 45.77243423461914, 47.609554290771484, 49.44667053222656, 51.283790588378906, 53.120906829833984, 54.95802688598633, 56.795143127441406, 58.63226318359375, 60.46937942504883, 62.30649948120117, 64.14361572265625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 14.0, 15.0, 10.0, 14.0, 20.0, 17.0, 31.0, 24.0, 15.0, 24.0, 27.0, 25.0, 39.0, 35.0, 31.0, 38.0, 41.0, 34.0, 42.0, 34.0, 42.0, 37.0, 27.0, 39.0, 25.0, 36.0, 27.0, 33.0, 23.0, 27.0, 21.0, 23.0, 11.0, 8.0, 21.0, 9.0, 6.0, 14.0, 7.0, 4.0, 2.0, 2.0, 5.0, 3.0, 5.0, 0.0, 3.0], "bins": [-8.1484375, -7.9193115234375, -7.690185546875, -7.4610595703125, -7.23193359375, -7.0028076171875, -6.773681640625, -6.5445556640625, -6.3154296875, -6.0863037109375, -5.857177734375, -5.6280517578125, -5.39892578125, -5.1697998046875, -4.940673828125, -4.7115478515625, -4.482421875, -4.2532958984375, -4.024169921875, -3.7950439453125, -3.56591796875, -3.3367919921875, -3.107666015625, -2.8785400390625, -2.6494140625, -2.4202880859375, -2.191162109375, -1.9620361328125, -1.73291015625, -1.5037841796875, -1.274658203125, -1.0455322265625, -0.81640625, -0.5872802734375, -0.358154296875, -0.1290283203125, 0.10009765625, 0.3292236328125, 0.558349609375, 0.7874755859375, 1.0166015625, 1.2457275390625, 1.474853515625, 1.7039794921875, 1.93310546875, 2.1622314453125, 2.391357421875, 2.6204833984375, 2.849609375, 3.0787353515625, 3.307861328125, 3.5369873046875, 3.76611328125, 3.9952392578125, 4.224365234375, 4.4534912109375, 4.6826171875, 4.9117431640625, 5.140869140625, 5.3699951171875, 5.59912109375, 5.8282470703125, 6.057373046875, 6.2864990234375, 6.515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 8.0, 9.0, 9.0, 11.0, 15.0, 18.0, 16.0, 30.0, 35.0, 44.0, 54.0, 106.0, 159.0, 241.0, 466.0, 915.0, 2124.0, 6318.0, 31852.0, 413168.0, 2847187.0, 823137.0, 53755.0, 9335.0, 2747.0, 1118.0, 558.0, 282.0, 169.0, 97.0, 77.0, 45.0, 36.0, 19.0, 18.0, 12.0, 16.0, 10.0, 10.0, 8.0, 13.0, 1.0, 4.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0], "bins": [-21.125, -20.531982421875, -19.93896484375, -19.345947265625, -18.7529296875, -18.159912109375, -17.56689453125, -16.973876953125, -16.380859375, -15.787841796875, -15.19482421875, -14.601806640625, -14.0087890625, -13.415771484375, -12.82275390625, -12.229736328125, -11.63671875, -11.043701171875, -10.45068359375, -9.857666015625, -9.2646484375, -8.671630859375, -8.07861328125, -7.485595703125, -6.892578125, -6.299560546875, -5.70654296875, -5.113525390625, -4.5205078125, -3.927490234375, -3.33447265625, -2.741455078125, -2.1484375, -1.555419921875, -0.96240234375, -0.369384765625, 0.2236328125, 0.816650390625, 1.40966796875, 2.002685546875, 2.595703125, 3.188720703125, 3.78173828125, 4.374755859375, 4.9677734375, 5.560791015625, 6.15380859375, 6.746826171875, 7.33984375, 7.932861328125, 8.52587890625, 9.118896484375, 9.7119140625, 10.304931640625, 10.89794921875, 11.490966796875, 12.083984375, 12.677001953125, 13.27001953125, 13.863037109375, 14.4560546875, 15.049072265625, 15.64208984375, 16.235107421875, 16.828125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 19.0, 23.0, 19.0, 37.0, 43.0, 59.0, 85.0, 104.0, 141.0, 230.0, 273.0, 323.0, 374.0, 437.0, 419.0, 358.0, 247.0, 193.0, 142.0, 133.0, 110.0, 67.0, 46.0, 45.0, 29.0, 19.0, 17.0, 10.0, 6.0, 8.0, 8.0, 7.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.4310302734375, -11.057373046875, -10.6837158203125, -10.31005859375, -9.9364013671875, -9.562744140625, -9.1890869140625, -8.8154296875, -8.4417724609375, -8.068115234375, -7.6944580078125, -7.32080078125, -6.9471435546875, -6.573486328125, -6.1998291015625, -5.826171875, -5.4525146484375, -5.078857421875, -4.7052001953125, -4.33154296875, -3.9578857421875, -3.584228515625, -3.2105712890625, -2.8369140625, -2.4632568359375, -2.089599609375, -1.7159423828125, -1.34228515625, -0.9686279296875, -0.594970703125, -0.2213134765625, 0.15234375, 0.5260009765625, 0.899658203125, 1.2733154296875, 1.64697265625, 2.0206298828125, 2.394287109375, 2.7679443359375, 3.1416015625, 3.5152587890625, 3.888916015625, 4.2625732421875, 4.63623046875, 5.0098876953125, 5.383544921875, 5.7572021484375, 6.130859375, 6.5045166015625, 6.878173828125, 7.2518310546875, 7.62548828125, 7.9991455078125, 8.372802734375, 8.7464599609375, 9.1201171875, 9.4937744140625, 9.867431640625, 10.2410888671875, 10.61474609375, 10.9884033203125, 11.362060546875, 11.7357177734375, 12.109375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 6.0, 14.0, 11.0, 17.0, 16.0, 16.0, 23.0, 37.0, 35.0, 48.0, 74.0, 82.0, 99.0, 149.0, 183.0, 264.0, 453.0, 1050.0, 4801.0, 81145.0, 3731613.0, 359883.0, 10873.0, 1620.0, 595.0, 318.0, 205.0, 147.0, 108.0, 77.0, 73.0, 48.0, 43.0, 30.0, 30.0, 21.0, 10.0, 9.0, 8.0, 15.0, 12.0, 5.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-43.03125, -41.71435546875, -40.3974609375, -39.08056640625, -37.763671875, -36.44677734375, -35.1298828125, -33.81298828125, -32.49609375, -31.17919921875, -29.8623046875, -28.54541015625, -27.228515625, -25.91162109375, -24.5947265625, -23.27783203125, -21.9609375, -20.64404296875, -19.3271484375, -18.01025390625, -16.693359375, -15.37646484375, -14.0595703125, -12.74267578125, -11.42578125, -10.10888671875, -8.7919921875, -7.47509765625, -6.158203125, -4.84130859375, -3.5244140625, -2.20751953125, -0.890625, 0.42626953125, 1.7431640625, 3.06005859375, 4.376953125, 5.69384765625, 7.0107421875, 8.32763671875, 9.64453125, 10.96142578125, 12.2783203125, 13.59521484375, 14.912109375, 16.22900390625, 17.5458984375, 18.86279296875, 20.1796875, 21.49658203125, 22.8134765625, 24.13037109375, 25.447265625, 26.76416015625, 28.0810546875, 29.39794921875, 30.71484375, 32.03173828125, 33.3486328125, 34.66552734375, 35.982421875, 37.29931640625, 38.6162109375, 39.93310546875, 41.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 133.0, 491.0, 328.0, 53.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.1344299316406, -259.8751220703125, -252.6157989501953, -245.35647583007812, -238.09716796875, -230.8378448486328, -223.57852172851562, -216.3192138671875, -209.05990600585938, -201.8005828857422, -194.54127502441406, -187.28195190429688, -180.02264404296875, -172.76332092285156, -165.50399780273438, -158.24468994140625, -150.98536682128906, -143.72604370117188, -136.46673583984375, -129.20741271972656, -121.94810485839844, -114.68878173828125, -107.4294662475586, -100.17015075683594, -92.91083526611328, -85.65151977539062, -78.39220428466797, -71.13288879394531, -63.87356948852539, -56.614253997802734, -49.35493469238281, -42.095619201660156, -34.83628845214844, -27.57697296142578, -20.317655563354492, -13.058338165283203, -5.799022674560547, 1.4602928161621094, 8.719612121582031, 15.978927612304688, 23.238243103027344, 30.49755859375, 37.756874084472656, 45.01619338989258, 52.275508880615234, 59.53482437133789, 66.79414367675781, 74.05345916748047, 81.31277465820312, 88.57209014892578, 95.83140563964844, 103.09072875976562, 110.35003662109375, 117.60935974121094, 124.8686752319336, 132.12799072265625, 139.38729858398438, 146.64662170410156, 153.9059295654297, 161.16525268554688, 168.424560546875, 175.6838836669922, 182.94320678710938, 190.2025146484375, 197.4618377685547]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 5.0, 14.0, 17.0, 8.0, 18.0, 22.0, 15.0, 28.0, 31.0, 28.0, 21.0, 36.0, 44.0, 43.0, 43.0, 40.0, 41.0, 39.0, 52.0, 31.0, 41.0, 38.0, 40.0, 41.0, 40.0, 32.0, 35.0, 23.0, 21.0, 21.0, 16.0, 10.0, 9.0, 11.0, 10.0, 6.0, 9.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.59698486328125, -52.17804718017578, -50.75910949707031, -49.340171813964844, -47.921234130859375, -46.502296447753906, -45.08335876464844, -43.66442108154297, -42.2454833984375, -40.82654571533203, -39.40760803222656, -37.988670349121094, -36.569732666015625, -35.150794982910156, -33.73185729980469, -32.31291961669922, -30.893978118896484, -29.475040435791016, -28.056102752685547, -26.637165069580078, -25.21822738647461, -23.79928970336914, -22.38035011291504, -20.96141242980957, -19.5424747467041, -18.123537063598633, -16.704599380493164, -15.285660743713379, -13.86672306060791, -12.447785377502441, -11.028846740722656, -9.609909057617188, -8.190971374511719, -6.77203369140625, -5.353095531463623, -3.934157371520996, -2.5152196884155273, -1.0962820053100586, 0.32265663146972656, 1.7415943145751953, 3.160531997680664, 4.579469680786133, 5.99840784072876, 7.417346000671387, 8.836283683776855, 10.255221366882324, 11.67416000366211, 13.093097686767578, 14.512035369873047, 15.930973052978516, 17.349910736083984, 18.768848419189453, 20.187786102294922, 21.60672378540039, 23.025663375854492, 24.44460105895996, 25.86353874206543, 27.2824764251709, 28.701414108276367, 30.12035369873047, 31.539291381835938, 32.958229064941406, 34.377166748046875, 35.796104431152344, 37.21504211425781]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 11.0, 6.0, 7.0, 7.0, 13.0, 13.0, 20.0, 15.0, 20.0, 27.0, 34.0, 36.0, 24.0, 31.0, 43.0, 32.0, 29.0, 46.0, 59.0, 41.0, 48.0, 53.0, 45.0, 30.0, 34.0, 26.0, 30.0, 32.0, 32.0, 32.0, 26.0, 19.0, 23.0, 17.0, 8.0, 13.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2679443359375, -7.996826171875, -7.7257080078125, -7.45458984375, -7.1834716796875, -6.912353515625, -6.6412353515625, -6.3701171875, -6.0989990234375, -5.827880859375, -5.5567626953125, -5.28564453125, -5.0145263671875, -4.743408203125, -4.4722900390625, -4.201171875, -3.9300537109375, -3.658935546875, -3.3878173828125, -3.11669921875, -2.8455810546875, -2.574462890625, -2.3033447265625, -2.0322265625, -1.7611083984375, -1.489990234375, -1.2188720703125, -0.94775390625, -0.6766357421875, -0.405517578125, -0.1343994140625, 0.13671875, 0.4078369140625, 0.678955078125, 0.9500732421875, 1.22119140625, 1.4923095703125, 1.763427734375, 2.0345458984375, 2.3056640625, 2.5767822265625, 2.847900390625, 3.1190185546875, 3.39013671875, 3.6612548828125, 3.932373046875, 4.2034912109375, 4.474609375, 4.7457275390625, 5.016845703125, 5.2879638671875, 5.55908203125, 5.8302001953125, 6.101318359375, 6.3724365234375, 6.6435546875, 6.9146728515625, 7.185791015625, 7.4569091796875, 7.72802734375, 7.9991455078125, 8.270263671875, 8.5413818359375, 8.8125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 8.0, 10.0, 11.0, 17.0, 23.0, 46.0, 68.0, 93.0, 128.0, 158.0, 266.0, 362.0, 565.0, 814.0, 1091.0, 1594.0, 2275.0, 3397.0, 5022.0, 7316.0, 11071.0, 17275.0, 27345.0, 45287.0, 79192.0, 145956.0, 243247.0, 194178.0, 105052.0, 58945.0, 34750.0, 21565.0, 13718.0, 8839.0, 5930.0, 4031.0, 2720.0, 1948.0, 1304.0, 877.0, 633.0, 438.0, 317.0, 216.0, 138.0, 101.0, 65.0, 56.0, 31.0, 17.0, 22.0, 13.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.033203125, -0.9984588623046875, -0.963714599609375, -0.9289703369140625, -0.89422607421875, -0.8594818115234375, -0.824737548828125, -0.7899932861328125, -0.7552490234375, -0.7205047607421875, -0.685760498046875, -0.6510162353515625, -0.61627197265625, -0.5815277099609375, -0.546783447265625, -0.5120391845703125, -0.477294921875, -0.4425506591796875, -0.407806396484375, -0.3730621337890625, -0.33831787109375, -0.3035736083984375, -0.268829345703125, -0.2340850830078125, -0.1993408203125, -0.1645965576171875, -0.129852294921875, -0.0951080322265625, -0.06036376953125, -0.0256195068359375, 0.009124755859375, 0.0438690185546875, 0.07861328125, 0.1133575439453125, 0.148101806640625, 0.1828460693359375, 0.21759033203125, 0.2523345947265625, 0.287078857421875, 0.3218231201171875, 0.3565673828125, 0.3913116455078125, 0.426055908203125, 0.4608001708984375, 0.49554443359375, 0.5302886962890625, 0.565032958984375, 0.5997772216796875, 0.634521484375, 0.6692657470703125, 0.704010009765625, 0.7387542724609375, 0.77349853515625, 0.8082427978515625, 0.842987060546875, 0.8777313232421875, 0.9124755859375, 0.9472198486328125, 0.981964111328125, 1.0167083740234375, 1.05145263671875, 1.0861968994140625, 1.120941162109375, 1.1556854248046875, 1.1904296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 7.0, 9.0, 7.0, 7.0, 10.0, 16.0, 15.0, 16.0, 12.0, 16.0, 22.0, 25.0, 34.0, 34.0, 48.0, 38.0, 34.0, 30.0, 37.0, 30.0, 1065.0, 46.0, 36.0, 42.0, 24.0, 38.0, 44.0, 33.0, 28.0, 26.0, 25.0, 19.0, 16.0, 8.0, 21.0, 10.0, 12.0, 18.0, 8.0, 9.0, 11.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.63671875, -4.48480224609375, -4.3328857421875, -4.18096923828125, -4.029052734375, -3.87713623046875, -3.7252197265625, -3.57330322265625, -3.42138671875, -3.26947021484375, -3.1175537109375, -2.96563720703125, -2.813720703125, -2.66180419921875, -2.5098876953125, -2.35797119140625, -2.2060546875, -2.05413818359375, -1.9022216796875, -1.75030517578125, -1.598388671875, -1.44647216796875, -1.2945556640625, -1.14263916015625, -0.99072265625, -0.83880615234375, -0.6868896484375, -0.53497314453125, -0.383056640625, -0.23114013671875, -0.0792236328125, 0.07269287109375, 0.224609375, 0.37652587890625, 0.5284423828125, 0.68035888671875, 0.832275390625, 0.98419189453125, 1.1361083984375, 1.28802490234375, 1.43994140625, 1.59185791015625, 1.7437744140625, 1.89569091796875, 2.047607421875, 2.19952392578125, 2.3514404296875, 2.50335693359375, 2.6552734375, 2.80718994140625, 2.9591064453125, 3.11102294921875, 3.262939453125, 3.41485595703125, 3.5667724609375, 3.71868896484375, 3.87060546875, 4.02252197265625, 4.1744384765625, 4.32635498046875, 4.478271484375, 4.63018798828125, 4.7821044921875, 4.93402099609375, 5.0859375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 13.0, 26.0, 54.0, 48.0, 81.0, 107.0, 175.0, 234.0, 350.0, 470.0, 645.0, 888.0, 1347.0, 1895.0, 2671.0, 3910.0, 5987.0, 8723.0, 13303.0, 20176.0, 31836.0, 52224.0, 90860.0, 166791.0, 1290177.0, 167932.0, 91098.0, 52323.0, 31567.0, 20274.0, 13278.0, 8627.0, 5946.0, 3941.0, 2712.0, 1917.0, 1340.0, 893.0, 681.0, 459.0, 334.0, 246.0, 165.0, 144.0, 80.0, 53.0, 35.0, 29.0, 15.0, 13.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.95556640625, -0.92523193359375, -0.8948974609375, -0.86456298828125, -0.834228515625, -0.80389404296875, -0.7735595703125, -0.74322509765625, -0.712890625, -0.68255615234375, -0.6522216796875, -0.62188720703125, -0.591552734375, -0.56121826171875, -0.5308837890625, -0.50054931640625, -0.47021484375, -0.43988037109375, -0.4095458984375, -0.37921142578125, -0.348876953125, -0.31854248046875, -0.2882080078125, -0.25787353515625, -0.2275390625, -0.19720458984375, -0.1668701171875, -0.13653564453125, -0.106201171875, -0.07586669921875, -0.0455322265625, -0.01519775390625, 0.01513671875, 0.04547119140625, 0.0758056640625, 0.10614013671875, 0.136474609375, 0.16680908203125, 0.1971435546875, 0.22747802734375, 0.2578125, 0.28814697265625, 0.3184814453125, 0.34881591796875, 0.379150390625, 0.40948486328125, 0.4398193359375, 0.47015380859375, 0.50048828125, 0.53082275390625, 0.5611572265625, 0.59149169921875, 0.621826171875, 0.65216064453125, 0.6824951171875, 0.71282958984375, 0.7431640625, 0.77349853515625, 0.8038330078125, 0.83416748046875, 0.864501953125, 0.89483642578125, 0.9251708984375, 0.95550537109375, 0.98583984375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 14.0, 8.0, 18.0, 20.0, 30.0, 36.0, 75.0, 74.0, 90.0, 100.0, 110.0, 97.0, 72.0, 54.0, 54.0, 31.0, 29.0, 13.0, 11.0, 11.0, 13.0, 4.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00342559814453125, -0.0032994747161865234, -0.003173351287841797, -0.0030472278594970703, -0.0029211044311523438, -0.002794981002807617, -0.0026688575744628906, -0.002542734146118164, -0.0024166107177734375, -0.002290487289428711, -0.0021643638610839844, -0.002038240432739258, -0.0019121170043945312, -0.0017859935760498047, -0.0016598701477050781, -0.0015337467193603516, -0.001407623291015625, -0.0012814998626708984, -0.0011553764343261719, -0.0010292530059814453, -0.0009031295776367188, -0.0007770061492919922, -0.0006508827209472656, -0.0005247592926025391, -0.0003986358642578125, -0.00027251243591308594, -0.00014638900756835938, -2.0265579223632812e-05, 0.00010585784912109375, 0.0002319812774658203, 0.0003581047058105469, 0.00048422813415527344, 0.0006103515625, 0.0007364749908447266, 0.0008625984191894531, 0.0009887218475341797, 0.0011148452758789062, 0.0012409687042236328, 0.0013670921325683594, 0.001493215560913086, 0.0016193389892578125, 0.001745462417602539, 0.0018715858459472656, 0.001997709274291992, 0.0021238327026367188, 0.0022499561309814453, 0.002376079559326172, 0.0025022029876708984, 0.002628326416015625, 0.0027544498443603516, 0.002880573272705078, 0.0030066967010498047, 0.0031328201293945312, 0.003258943557739258, 0.0033850669860839844, 0.003511190414428711, 0.0036373138427734375, 0.003763437271118164, 0.0038895606994628906, 0.004015684127807617, 0.004141807556152344, 0.00426793098449707, 0.004394054412841797, 0.0045201778411865234, 0.00464630126953125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 12.0, 6.0, 16.0, 16.0, 30.0, 33.0, 47.0, 70.0, 113.0, 218.0, 383.0, 1673.0, 1040619.0, 4163.0, 511.0, 260.0, 133.0, 80.0, 45.0, 30.0, 33.0, 18.0, 18.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.10382080078125, -0.10098457336425781, -0.09814834594726562, -0.09531211853027344, -0.09247589111328125, -0.08963966369628906, -0.08680343627929688, -0.08396720886230469, -0.0811309814453125, -0.07829475402832031, -0.07545852661132812, -0.07262229919433594, -0.06978607177734375, -0.06694984436035156, -0.06411361694335938, -0.06127738952636719, -0.058441162109375, -0.05560493469238281, -0.052768707275390625, -0.04993247985839844, -0.04709625244140625, -0.04426002502441406, -0.041423797607421875, -0.03858757019042969, -0.0357513427734375, -0.03291511535644531, -0.030078887939453125, -0.027242660522460938, -0.02440643310546875, -0.021570205688476562, -0.018733978271484375, -0.015897750854492188, -0.0130615234375, -0.010225296020507812, -0.007389068603515625, -0.0045528411865234375, -0.00171661376953125, 0.0011196136474609375, 0.003955841064453125, 0.0067920684814453125, 0.0096282958984375, 0.012464523315429688, 0.015300750732421875, 0.018136978149414062, 0.02097320556640625, 0.023809432983398438, 0.026645660400390625, 0.029481887817382812, 0.032318115234375, 0.03515434265136719, 0.037990570068359375, 0.04082679748535156, 0.04366302490234375, 0.04649925231933594, 0.049335479736328125, 0.05217170715332031, 0.0550079345703125, 0.05784416198730469, 0.060680389404296875, 0.06351661682128906, 0.06635284423828125, 0.06918907165527344, 0.07202529907226562, 0.07486152648925781, 0.07769775390625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 51.0, 223.0, 441.0, 243.0, 41.0, 11.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008096171543002129, -0.007922104559838772, -0.007748038042336702, -0.007573971524834633, -0.007399904541671276, -0.007225838024169207, -0.007051771506667137, -0.00687770452350378, -0.006703637540340424, -0.006529571022838354, -0.006355504039674997, -0.006181437522172928, -0.006007370539009571, -0.005833304021507502, -0.005659237504005432, -0.005485170520842075, -0.005311104003340006, -0.005137037485837936, -0.00496297050267458, -0.00478890398517251, -0.004614837002009153, -0.004440770484507084, -0.004266703501343727, -0.004092636983841658, -0.003918570466339588, -0.003744503716006875, -0.003570436965674162, -0.0033963704481720924, -0.0032223034650087357, -0.003048236947506666, -0.002874170197173953, -0.00270010344684124, -0.0025260369293391705, -0.0023519701790064573, -0.002177903428673744, -0.0020038369111716747, -0.0018297700444236398, -0.0016557032940909266, -0.0014816366601735353, -0.0013075699098408222, -0.001133503159508109, -0.000959436409175396, -0.0007853697170503438, -0.0006113030249252915, -0.0004372362745925784, -0.0002631695242598653, -8.910289034247398e-05, 8.496385999023914e-05, 0.00025903061032295227, 0.00043309733155183494, 0.0006071640527807176, 0.0007812307449057698, 0.000955297495238483, 0.001129364245571196, 0.0013034308794885874, 0.0014774976298213005, 0.0016515643801540136, 0.0018256311304867268, 0.00199969788081944, 0.002173764631152153, 0.0023478311486542225, 0.0025218981318175793, 0.0026959646493196487, 0.002870031399652362, 0.003044098149985075]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 11.0, 12.0, 9.0, 13.0, 16.0, 19.0, 14.0, 16.0, 21.0, 24.0, 24.0, 25.0, 19.0, 27.0, 39.0, 36.0, 32.0, 42.0, 49.0, 33.0, 36.0, 37.0, 33.0, 31.0, 36.0, 39.0, 35.0, 32.0, 31.0, 28.0, 24.0, 25.0, 12.0, 17.0, 16.0, 13.0, 16.0, 8.0, 9.0, 10.0, 6.0, 9.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.001431584358215332, -0.0013898732140660286, -0.0013481620699167252, -0.0013064509257674217, -0.0012647397816181183, -0.0012230286374688148, -0.0011813174933195114, -0.001139606349170208, -0.0010978952050209045, -0.001056184060871601, -0.0010144729167222977, -0.0009727617725729942, -0.0009310506284236908, -0.0008893394842743874, -0.0008476283401250839, -0.0008059171959757805, -0.000764206051826477, -0.0007224949076771736, -0.0006807837635278702, -0.0006390726193785667, -0.0005973614752292633, -0.0005556503310799599, -0.0005139391869306564, -0.000472228042781353, -0.00043051689863204956, -0.0003888057544827461, -0.0003470946103334427, -0.00030538346618413925, -0.0002636723220348358, -0.00022196117788553238, -0.00018025003373622894, -0.0001385388895869255, -9.682774543762207e-05, -5.5116601288318634e-05, -1.3405457139015198e-05, 2.830568701028824e-05, 7.001683115959167e-05, 0.00011172797530889511, 0.00015343911945819855, 0.00019515026360750198, 0.00023686140775680542, 0.00027857255190610886, 0.0003202836960554123, 0.00036199484020471573, 0.00040370598435401917, 0.0004454171285033226, 0.00048712827265262604, 0.0005288394168019295, 0.0005705505609512329, 0.0006122617051005363, 0.0006539728492498398, 0.0006956839933991432, 0.0007373951375484467, 0.0007791062816977501, 0.0008208174258470535, 0.000862528569996357, 0.0009042397141456604, 0.0009459508582949638, 0.0009876620024442673, 0.0010293731465935707, 0.0010710842907428741, 0.0011127954348921776, 0.001154506579041481, 0.0011962177231907845, 0.0012379288673400879]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 11.0, 6.0, 7.0, 7.0, 13.0, 13.0, 20.0, 16.0, 19.0, 27.0, 34.0, 36.0, 24.0, 31.0, 44.0, 31.0, 30.0, 48.0, 56.0, 42.0, 47.0, 54.0, 45.0, 29.0, 36.0, 24.0, 31.0, 33.0, 31.0, 32.0, 25.0, 20.0, 22.0, 17.0, 8.0, 13.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.267822265625, -7.99658203125, -7.725341796875, -7.4541015625, -7.182861328125, -6.91162109375, -6.640380859375, -6.369140625, -6.097900390625, -5.82666015625, -5.555419921875, -5.2841796875, -5.012939453125, -4.74169921875, -4.470458984375, -4.19921875, -3.927978515625, -3.65673828125, -3.385498046875, -3.1142578125, -2.843017578125, -2.57177734375, -2.300537109375, -2.029296875, -1.758056640625, -1.48681640625, -1.215576171875, -0.9443359375, -0.673095703125, -0.40185546875, -0.130615234375, 0.140625, 0.411865234375, 0.68310546875, 0.954345703125, 1.2255859375, 1.496826171875, 1.76806640625, 2.039306640625, 2.310546875, 2.581787109375, 2.85302734375, 3.124267578125, 3.3955078125, 3.666748046875, 3.93798828125, 4.209228515625, 4.48046875, 4.751708984375, 5.02294921875, 5.294189453125, 5.5654296875, 5.836669921875, 6.10791015625, 6.379150390625, 6.650390625, 6.921630859375, 7.19287109375, 7.464111328125, 7.7353515625, 8.006591796875, 8.27783203125, 8.549072265625, 8.8203125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 13.0, 10.0, 18.0, 21.0, 30.0, 32.0, 45.0, 59.0, 81.0, 104.0, 164.0, 234.0, 304.0, 431.0, 732.0, 1267.0, 2774.0, 10845.0, 82197.0, 865043.0, 68351.0, 9696.0, 2695.0, 1185.0, 689.0, 406.0, 311.0, 209.0, 153.0, 121.0, 91.0, 68.0, 40.0, 40.0, 20.0, 22.0, 12.0, 9.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.5625, -20.877197265625, -20.19189453125, -19.506591796875, -18.8212890625, -18.135986328125, -17.45068359375, -16.765380859375, -16.080078125, -15.394775390625, -14.70947265625, -14.024169921875, -13.3388671875, -12.653564453125, -11.96826171875, -11.282958984375, -10.59765625, -9.912353515625, -9.22705078125, -8.541748046875, -7.8564453125, -7.171142578125, -6.48583984375, -5.800537109375, -5.115234375, -4.429931640625, -3.74462890625, -3.059326171875, -2.3740234375, -1.688720703125, -1.00341796875, -0.318115234375, 0.3671875, 1.052490234375, 1.73779296875, 2.423095703125, 3.1083984375, 3.793701171875, 4.47900390625, 5.164306640625, 5.849609375, 6.534912109375, 7.22021484375, 7.905517578125, 8.5908203125, 9.276123046875, 9.96142578125, 10.646728515625, 11.33203125, 12.017333984375, 12.70263671875, 13.387939453125, 14.0732421875, 14.758544921875, 15.44384765625, 16.129150390625, 16.814453125, 17.499755859375, 18.18505859375, 18.870361328125, 19.5556640625, 20.240966796875, 20.92626953125, 21.611572265625, 22.296875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 3.0, 7.0, 15.0, 9.0, 14.0, 10.0, 22.0, 24.0, 28.0, 27.0, 25.0, 35.0, 32.0, 30.0, 50.0, 54.0, 98.0, 258.0, 1675.0, 115.0, 67.0, 52.0, 48.0, 39.0, 37.0, 37.0, 31.0, 25.0, 27.0, 25.0, 29.0, 15.0, 8.0, 17.0, 10.0, 8.0, 6.0, 9.0, 4.0, 2.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-26.671875, -25.935791015625, -25.19970703125, -24.463623046875, -23.7275390625, -22.991455078125, -22.25537109375, -21.519287109375, -20.783203125, -20.047119140625, -19.31103515625, -18.574951171875, -17.8388671875, -17.102783203125, -16.36669921875, -15.630615234375, -14.89453125, -14.158447265625, -13.42236328125, -12.686279296875, -11.9501953125, -11.214111328125, -10.47802734375, -9.741943359375, -9.005859375, -8.269775390625, -7.53369140625, -6.797607421875, -6.0615234375, -5.325439453125, -4.58935546875, -3.853271484375, -3.1171875, -2.381103515625, -1.64501953125, -0.908935546875, -0.1728515625, 0.563232421875, 1.29931640625, 2.035400390625, 2.771484375, 3.507568359375, 4.24365234375, 4.979736328125, 5.7158203125, 6.451904296875, 7.18798828125, 7.924072265625, 8.66015625, 9.396240234375, 10.13232421875, 10.868408203125, 11.6044921875, 12.340576171875, 13.07666015625, 13.812744140625, 14.548828125, 15.284912109375, 16.02099609375, 16.757080078125, 17.4931640625, 18.229248046875, 18.96533203125, 19.701416015625, 20.4375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 7.0, 6.0, 9.0, 13.0, 17.0, 20.0, 40.0, 30.0, 43.0, 55.0, 85.0, 94.0, 125.0, 234.0, 666.0, 5265.0, 3099452.0, 37421.0, 1196.0, 358.0, 137.0, 90.0, 73.0, 55.0, 45.0, 32.0, 31.0, 25.0, 17.0, 17.0, 7.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.6875, -73.1396484375, -70.591796875, -68.0439453125, -65.49609375, -62.9482421875, -60.400390625, -57.8525390625, -55.3046875, -52.7568359375, -50.208984375, -47.6611328125, -45.11328125, -42.5654296875, -40.017578125, -37.4697265625, -34.921875, -32.3740234375, -29.826171875, -27.2783203125, -24.73046875, -22.1826171875, -19.634765625, -17.0869140625, -14.5390625, -11.9912109375, -9.443359375, -6.8955078125, -4.34765625, -1.7998046875, 0.748046875, 3.2958984375, 5.84375, 8.3916015625, 10.939453125, 13.4873046875, 16.03515625, 18.5830078125, 21.130859375, 23.6787109375, 26.2265625, 28.7744140625, 31.322265625, 33.8701171875, 36.41796875, 38.9658203125, 41.513671875, 44.0615234375, 46.609375, 49.1572265625, 51.705078125, 54.2529296875, 56.80078125, 59.3486328125, 61.896484375, 64.4443359375, 66.9921875, 69.5400390625, 72.087890625, 74.6357421875, 77.18359375, 79.7314453125, 82.279296875, 84.8271484375, 87.375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 43.0, 128.0, 330.0, 317.0, 148.0, 42.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.324283599853516, -19.54854965209961, -17.772815704345703, -15.997082710266113, -14.221348762512207, -12.4456148147583, -10.669881820678711, -8.894147872924805, -7.118413925170898, -5.342679977416992, -3.566946506500244, -1.791213035583496, -0.015479087829589844, 1.7602548599243164, 3.5359878540039062, 5.3117218017578125, 7.087455749511719, 8.863189697265625, 10.638923645019531, 12.414656639099121, 14.190390586853027, 15.966124534606934, 17.741857528686523, 19.51759147644043, 21.293325424194336, 23.069059371948242, 24.84479331970215, 26.620525360107422, 28.396259307861328, 30.171993255615234, 31.94772720336914, 33.72346115112305, 35.49919891357422, 37.274932861328125, 39.05066680908203, 40.82640075683594, 42.602134704589844, 44.37786865234375, 46.153602600097656, 47.92933654785156, 49.70507049560547, 51.480804443359375, 53.25653839111328, 55.03227233886719, 56.808006286621094, 58.583740234375, 60.359474182128906, 62.13520812988281, 63.91093826293945, 65.6866683959961, 67.46240234375, 69.2381362915039, 71.01387023925781, 72.78960418701172, 74.56533813476562, 76.34107208251953, 78.11680603027344, 79.89253997802734, 81.66827392578125, 83.44400787353516, 85.21974182128906, 86.99547576904297, 88.77120971679688, 90.54694366455078, 92.32267761230469]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 8.0, 10.0, 8.0, 14.0, 10.0, 15.0, 23.0, 27.0, 21.0, 32.0, 31.0, 34.0, 36.0, 53.0, 43.0, 53.0, 44.0, 49.0, 38.0, 45.0, 46.0, 33.0, 29.0, 35.0, 37.0, 34.0, 20.0, 28.0, 29.0, 17.0, 19.0, 8.0, 12.0, 10.0, 7.0, 5.0, 8.0, 6.0, 4.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-68.32886505126953, -66.34992980957031, -64.37098693847656, -62.39204788208008, -60.413108825683594, -58.434173583984375, -56.45523452758789, -54.476295471191406, -52.49735641479492, -50.51841735839844, -48.53947830200195, -46.56053924560547, -44.58160400390625, -42.6026611328125, -40.62372589111328, -38.6447868347168, -36.66584777832031, -34.68690872192383, -32.707969665527344, -30.729032516479492, -28.750093460083008, -26.771154403686523, -24.792217254638672, -22.813278198242188, -20.834339141845703, -18.85540008544922, -16.876461029052734, -14.897523880004883, -12.918584823608398, -10.939645767211914, -8.960707664489746, -6.981769561767578, -5.002830505371094, -3.0238919258117676, -1.0449533462524414, 0.9339852333068848, 2.912923812866211, 4.891862869262695, 6.870800971984863, 8.849739074707031, 10.828678131103516, 12.8076171875, 14.786555290222168, 16.765493392944336, 18.74443244934082, 20.723371505737305, 22.702308654785156, 24.68124771118164, 26.660186767578125, 28.63912582397461, 30.618064880371094, 32.59700393676758, 34.57594299316406, 36.55487823486328, 38.533817291259766, 40.51275634765625, 42.491695404052734, 44.47063446044922, 46.4495735168457, 48.42851257324219, 50.407447814941406, 52.386390686035156, 54.365325927734375, 56.34426498413086, 58.323204040527344]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 10.0, 12.0, 8.0, 13.0, 13.0, 14.0, 12.0, 25.0, 29.0, 23.0, 27.0, 29.0, 34.0, 29.0, 38.0, 38.0, 39.0, 39.0, 55.0, 50.0, 41.0, 48.0, 42.0, 26.0, 43.0, 33.0, 26.0, 36.0, 31.0, 27.0, 19.0, 22.0, 22.0, 13.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.248291015625, -7.97314453125, -7.697998046875, -7.4228515625, -7.147705078125, -6.87255859375, -6.597412109375, -6.322265625, -6.047119140625, -5.77197265625, -5.496826171875, -5.2216796875, -4.946533203125, -4.67138671875, -4.396240234375, -4.12109375, -3.845947265625, -3.57080078125, -3.295654296875, -3.0205078125, -2.745361328125, -2.47021484375, -2.195068359375, -1.919921875, -1.644775390625, -1.36962890625, -1.094482421875, -0.8193359375, -0.544189453125, -0.26904296875, 0.006103515625, 0.28125, 0.556396484375, 0.83154296875, 1.106689453125, 1.3818359375, 1.656982421875, 1.93212890625, 2.207275390625, 2.482421875, 2.757568359375, 3.03271484375, 3.307861328125, 3.5830078125, 3.858154296875, 4.13330078125, 4.408447265625, 4.68359375, 4.958740234375, 5.23388671875, 5.509033203125, 5.7841796875, 6.059326171875, 6.33447265625, 6.609619140625, 6.884765625, 7.159912109375, 7.43505859375, 7.710205078125, 7.9853515625, 8.260498046875, 8.53564453125, 8.810791015625, 9.0859375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 6.0, 13.0, 18.0, 11.0, 20.0, 31.0, 39.0, 53.0, 60.0, 104.0, 113.0, 184.0, 248.0, 417.0, 882.0, 1782.0, 4617.0, 16554.0, 131659.0, 1760096.0, 2061407.0, 186129.0, 20219.0, 5286.0, 1994.0, 937.0, 480.0, 276.0, 155.0, 141.0, 84.0, 61.0, 53.0, 42.0, 32.0, 20.0, 10.0, 10.0, 12.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.28125, -17.7109375, -17.140625, -16.5703125, -16.0, -15.4296875, -14.859375, -14.2890625, -13.71875, -13.1484375, -12.578125, -12.0078125, -11.4375, -10.8671875, -10.296875, -9.7265625, -9.15625, -8.5859375, -8.015625, -7.4453125, -6.875, -6.3046875, -5.734375, -5.1640625, -4.59375, -4.0234375, -3.453125, -2.8828125, -2.3125, -1.7421875, -1.171875, -0.6015625, -0.03125, 0.5390625, 1.109375, 1.6796875, 2.25, 2.8203125, 3.390625, 3.9609375, 4.53125, 5.1015625, 5.671875, 6.2421875, 6.8125, 7.3828125, 7.953125, 8.5234375, 9.09375, 9.6640625, 10.234375, 10.8046875, 11.375, 11.9453125, 12.515625, 13.0859375, 13.65625, 14.2265625, 14.796875, 15.3671875, 15.9375, 16.5078125, 17.078125, 17.6484375, 18.21875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 8.0, 11.0, 12.0, 18.0, 35.0, 45.0, 66.0, 91.0, 147.0, 251.0, 370.0, 508.0, 627.0, 565.0, 447.0, 286.0, 167.0, 145.0, 82.0, 49.0, 41.0, 24.0, 20.0, 14.0, 10.0, 12.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.015625, -15.5263671875, -15.037109375, -14.5478515625, -14.05859375, -13.5693359375, -13.080078125, -12.5908203125, -12.1015625, -11.6123046875, -11.123046875, -10.6337890625, -10.14453125, -9.6552734375, -9.166015625, -8.6767578125, -8.1875, -7.6982421875, -7.208984375, -6.7197265625, -6.23046875, -5.7412109375, -5.251953125, -4.7626953125, -4.2734375, -3.7841796875, -3.294921875, -2.8056640625, -2.31640625, -1.8271484375, -1.337890625, -0.8486328125, -0.359375, 0.1298828125, 0.619140625, 1.1083984375, 1.59765625, 2.0869140625, 2.576171875, 3.0654296875, 3.5546875, 4.0439453125, 4.533203125, 5.0224609375, 5.51171875, 6.0009765625, 6.490234375, 6.9794921875, 7.46875, 7.9580078125, 8.447265625, 8.9365234375, 9.42578125, 9.9150390625, 10.404296875, 10.8935546875, 11.3828125, 11.8720703125, 12.361328125, 12.8505859375, 13.33984375, 13.8291015625, 14.318359375, 14.8076171875, 15.296875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 10.0, 14.0, 13.0, 26.0, 18.0, 30.0, 31.0, 45.0, 47.0, 76.0, 109.0, 106.0, 189.0, 276.0, 536.0, 1224.0, 4531.0, 41123.0, 2481571.0, 1626001.0, 31676.0, 4043.0, 1138.0, 479.0, 254.0, 183.0, 133.0, 89.0, 65.0, 56.0, 40.0, 35.0, 21.0, 20.0, 15.0, 12.0, 6.0, 4.0, 8.0, 1.0, 3.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.9375, -35.744140625, -34.55078125, -33.357421875, -32.1640625, -30.970703125, -29.77734375, -28.583984375, -27.390625, -26.197265625, -25.00390625, -23.810546875, -22.6171875, -21.423828125, -20.23046875, -19.037109375, -17.84375, -16.650390625, -15.45703125, -14.263671875, -13.0703125, -11.876953125, -10.68359375, -9.490234375, -8.296875, -7.103515625, -5.91015625, -4.716796875, -3.5234375, -2.330078125, -1.13671875, 0.056640625, 1.25, 2.443359375, 3.63671875, 4.830078125, 6.0234375, 7.216796875, 8.41015625, 9.603515625, 10.796875, 11.990234375, 13.18359375, 14.376953125, 15.5703125, 16.763671875, 17.95703125, 19.150390625, 20.34375, 21.537109375, 22.73046875, 23.923828125, 25.1171875, 26.310546875, 27.50390625, 28.697265625, 29.890625, 31.083984375, 32.27734375, 33.470703125, 34.6640625, 35.857421875, 37.05078125, 38.244140625, 39.4375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [37.0, 434.0, 498.0, 41.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.64754295349121, -9.361690521240234, -0.07583808898925781, 9.210014343261719, 18.495866775512695, 27.78171730041504, 37.06757354736328, 46.353424072265625, 55.63927459716797, 64.92512512207031, 74.21098327636719, 83.49683380126953, 92.78268432617188, 102.06853485107422, 111.35438537597656, 120.64024353027344, 129.9261016845703, 139.2119598388672, 148.497802734375, 157.78366088867188, 167.06951904296875, 176.35536193847656, 185.64122009277344, 194.92706298828125, 204.21292114257812, 213.498779296875, 222.7846221923828, 232.0704803466797, 241.3563232421875, 250.64218139648438, 259.92803955078125, 269.2138977050781, 278.499755859375, 287.7856140136719, 297.07147216796875, 306.3572998046875, 315.6431579589844, 324.92901611328125, 334.2148742675781, 343.500732421875, 352.78656005859375, 362.0724182128906, 371.3582763671875, 380.64410400390625, 389.9299621582031, 399.2158203125, 408.5016784667969, 417.78753662109375, 427.0733947753906, 436.3592529296875, 445.6451110839844, 454.9309387207031, 464.216796875, 473.5026550292969, 482.78851318359375, 492.0743713378906, 501.3602294921875, 510.6460876464844, 519.9319458007812, 529.2177734375, 538.503662109375, 547.7894897460938, 557.0753173828125, 566.3612060546875, 575.6470336914062]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 5.0, 8.0, 7.0, 6.0, 12.0, 14.0, 22.0, 22.0, 21.0, 27.0, 13.0, 31.0, 21.0, 32.0, 37.0, 46.0, 31.0, 39.0, 40.0, 39.0, 30.0, 42.0, 43.0, 39.0, 36.0, 31.0, 30.0, 35.0, 35.0, 21.0, 27.0, 24.0, 23.0, 17.0, 18.0, 8.0, 15.0, 11.0, 9.0, 7.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.665008544921875, -37.35017395019531, -36.03533935546875, -34.72050476074219, -33.405670166015625, -32.0908317565918, -30.775997161865234, -29.461162567138672, -28.14632797241211, -26.831493377685547, -25.516658782958984, -24.20182228088379, -22.886987686157227, -21.572153091430664, -20.25731658935547, -18.942481994628906, -17.627647399902344, -16.31281280517578, -14.997977256774902, -13.683141708374023, -12.368307113647461, -11.053472518920898, -9.73863697052002, -8.42380142211914, -7.108966827392578, -5.794131755828857, -4.479296684265137, -3.164461612701416, -1.8496265411376953, -0.5347914695739746, 0.7800436019897461, 2.094879150390625, 3.4097137451171875, 4.724548816680908, 6.039383888244629, 7.35421895980835, 8.66905403137207, 9.983888626098633, 11.298724174499512, 12.61355972290039, 13.928394317626953, 15.243228912353516, 16.558063507080078, 17.872900009155273, 19.187734603881836, 20.5025691986084, 21.817405700683594, 23.132240295410156, 24.44707489013672, 25.76190948486328, 27.076744079589844, 28.39158058166504, 29.7064151763916, 31.021249771118164, 32.33608627319336, 33.65092086791992, 34.965755462646484, 36.28059005737305, 37.59542465209961, 38.91025924682617, 40.22509765625, 41.53993225097656, 42.854766845703125, 44.16960144042969, 45.48443603515625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 8.0, 15.0, 12.0, 7.0, 17.0, 10.0, 11.0, 17.0, 13.0, 31.0, 30.0, 22.0, 24.0, 22.0, 39.0, 19.0, 35.0, 37.0, 47.0, 39.0, 35.0, 41.0, 42.0, 32.0, 38.0, 42.0, 25.0, 41.0, 30.0, 25.0, 24.0, 29.0, 17.0, 16.0, 12.0, 21.0, 10.0, 9.0, 11.0, 5.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.21649169921875, -6.9798583984375, -6.74322509765625, -6.506591796875, -6.26995849609375, -6.0333251953125, -5.79669189453125, -5.56005859375, -5.32342529296875, -5.0867919921875, -4.85015869140625, -4.613525390625, -4.37689208984375, -4.1402587890625, -3.90362548828125, -3.6669921875, -3.43035888671875, -3.1937255859375, -2.95709228515625, -2.720458984375, -2.48382568359375, -2.2471923828125, -2.01055908203125, -1.77392578125, -1.53729248046875, -1.3006591796875, -1.06402587890625, -0.827392578125, -0.59075927734375, -0.3541259765625, -0.11749267578125, 0.119140625, 0.35577392578125, 0.5924072265625, 0.82904052734375, 1.065673828125, 1.30230712890625, 1.5389404296875, 1.77557373046875, 2.01220703125, 2.24884033203125, 2.4854736328125, 2.72210693359375, 2.958740234375, 3.19537353515625, 3.4320068359375, 3.66864013671875, 3.9052734375, 4.14190673828125, 4.3785400390625, 4.61517333984375, 4.851806640625, 5.08843994140625, 5.3250732421875, 5.56170654296875, 5.79833984375, 6.03497314453125, 6.2716064453125, 6.50823974609375, 6.744873046875, 6.98150634765625, 7.2181396484375, 7.45477294921875, 7.69140625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 10.0, 10.0, 19.0, 19.0, 20.0, 36.0, 38.0, 68.0, 83.0, 176.0, 259.0, 450.0, 727.0, 1142.0, 1956.0, 3390.0, 5477.0, 9222.0, 15784.0, 27758.0, 49857.0, 94321.0, 196988.0, 293682.0, 164762.0, 80805.0, 42707.0, 24358.0, 13981.0, 8289.0, 4738.0, 2896.0, 1729.0, 1084.0, 650.0, 359.0, 267.0, 157.0, 110.0, 59.0, 47.0, 19.0, 15.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0], "bins": [-1.5224609375, -1.478179931640625, -1.43389892578125, -1.389617919921875, -1.3453369140625, -1.301055908203125, -1.25677490234375, -1.212493896484375, -1.168212890625, -1.123931884765625, -1.07965087890625, -1.035369873046875, -0.9910888671875, -0.946807861328125, -0.90252685546875, -0.858245849609375, -0.81396484375, -0.769683837890625, -0.72540283203125, -0.681121826171875, -0.6368408203125, -0.592559814453125, -0.54827880859375, -0.503997802734375, -0.459716796875, -0.415435791015625, -0.37115478515625, -0.326873779296875, -0.2825927734375, -0.238311767578125, -0.19403076171875, -0.149749755859375, -0.10546875, -0.061187744140625, -0.01690673828125, 0.027374267578125, 0.0716552734375, 0.115936279296875, 0.16021728515625, 0.204498291015625, 0.248779296875, 0.293060302734375, 0.33734130859375, 0.381622314453125, 0.4259033203125, 0.470184326171875, 0.51446533203125, 0.558746337890625, 0.60302734375, 0.647308349609375, 0.69158935546875, 0.735870361328125, 0.7801513671875, 0.824432373046875, 0.86871337890625, 0.912994384765625, 0.957275390625, 1.001556396484375, 1.04583740234375, 1.090118408203125, 1.1343994140625, 1.178680419921875, 1.22296142578125, 1.267242431640625, 1.3115234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 4.0, 11.0, 8.0, 11.0, 12.0, 13.0, 9.0, 13.0, 26.0, 29.0, 24.0, 32.0, 27.0, 34.0, 32.0, 30.0, 43.0, 45.0, 35.0, 1065.0, 38.0, 41.0, 44.0, 32.0, 44.0, 34.0, 42.0, 33.0, 25.0, 25.0, 21.0, 24.0, 8.0, 14.0, 9.0, 13.0, 10.0, 7.0, 13.0, 10.0, 9.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.92578125, -4.77520751953125, -4.6246337890625, -4.47406005859375, -4.323486328125, -4.17291259765625, -4.0223388671875, -3.87176513671875, -3.72119140625, -3.57061767578125, -3.4200439453125, -3.26947021484375, -3.118896484375, -2.96832275390625, -2.8177490234375, -2.66717529296875, -2.5166015625, -2.36602783203125, -2.2154541015625, -2.06488037109375, -1.914306640625, -1.76373291015625, -1.6131591796875, -1.46258544921875, -1.31201171875, -1.16143798828125, -1.0108642578125, -0.86029052734375, -0.709716796875, -0.55914306640625, -0.4085693359375, -0.25799560546875, -0.107421875, 0.04315185546875, 0.1937255859375, 0.34429931640625, 0.494873046875, 0.64544677734375, 0.7960205078125, 0.94659423828125, 1.09716796875, 1.24774169921875, 1.3983154296875, 1.54888916015625, 1.699462890625, 1.85003662109375, 2.0006103515625, 2.15118408203125, 2.3017578125, 2.45233154296875, 2.6029052734375, 2.75347900390625, 2.904052734375, 3.05462646484375, 3.2052001953125, 3.35577392578125, 3.50634765625, 3.65692138671875, 3.8074951171875, 3.95806884765625, 4.108642578125, 4.25921630859375, 4.4097900390625, 4.56036376953125, 4.7109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 9.0, 13.0, 6.0, 14.0, 34.0, 33.0, 50.0, 76.0, 139.0, 145.0, 205.0, 333.0, 448.0, 655.0, 932.0, 1399.0, 2048.0, 3031.0, 4672.0, 6726.0, 10723.0, 16768.0, 26835.0, 44671.0, 78257.0, 149590.0, 1302719.0, 196691.0, 101638.0, 56251.0, 33494.0, 20561.0, 12984.0, 8388.0, 5397.0, 3550.0, 2402.0, 1667.0, 1113.0, 736.0, 555.0, 362.0, 245.0, 168.0, 125.0, 90.0, 63.0, 36.0, 36.0, 22.0, 13.0, 13.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-1.10546875, -1.0726776123046875, -1.039886474609375, -1.0070953369140625, -0.97430419921875, -0.9415130615234375, -0.908721923828125, -0.8759307861328125, -0.8431396484375, -0.8103485107421875, -0.777557373046875, -0.7447662353515625, -0.71197509765625, -0.6791839599609375, -0.646392822265625, -0.6136016845703125, -0.580810546875, -0.5480194091796875, -0.515228271484375, -0.4824371337890625, -0.44964599609375, -0.4168548583984375, -0.384063720703125, -0.3512725830078125, -0.3184814453125, -0.2856903076171875, -0.252899169921875, -0.2201080322265625, -0.18731689453125, -0.1545257568359375, -0.121734619140625, -0.0889434814453125, -0.05615234375, -0.0233612060546875, 0.009429931640625, 0.0422210693359375, 0.07501220703125, 0.1078033447265625, 0.140594482421875, 0.1733856201171875, 0.2061767578125, 0.2389678955078125, 0.271759033203125, 0.3045501708984375, 0.33734130859375, 0.3701324462890625, 0.402923583984375, 0.4357147216796875, 0.468505859375, 0.5012969970703125, 0.534088134765625, 0.5668792724609375, 0.59967041015625, 0.6324615478515625, 0.665252685546875, 0.6980438232421875, 0.7308349609375, 0.7636260986328125, 0.796417236328125, 0.8292083740234375, 0.86199951171875, 0.8947906494140625, 0.927581787109375, 0.9603729248046875, 0.9931640625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 6.0, 4.0, 7.0, 7.0, 9.0, 4.0, 8.0, 15.0, 13.0, 13.0, 15.0, 30.0, 24.0, 35.0, 29.0, 38.0, 52.0, 37.0, 55.0, 56.0, 65.0, 44.0, 41.0, 49.0, 40.0, 51.0, 39.0, 37.0, 24.0, 24.0, 32.0, 20.0, 22.0, 13.0, 5.0, 8.0, 9.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019683837890625, -0.001899033784866333, -0.001829683780670166, -0.001760333776473999, -0.001690983772277832, -0.001621633768081665, -0.001552283763885498, -0.001482933759689331, -0.001413583755493164, -0.001344233751296997, -0.00127488374710083, -0.001205533742904663, -0.001136183738708496, -0.001066833734512329, -0.0009974837303161621, -0.0009281337261199951, -0.0008587837219238281, -0.0007894337177276611, -0.0007200837135314941, -0.0006507337093353271, -0.0005813837051391602, -0.0005120337009429932, -0.00044268369674682617, -0.0003733336925506592, -0.0003039836883544922, -0.0002346336841583252, -0.0001652836799621582, -9.593367576599121e-05, -2.658367156982422e-05, 4.2766332626342773e-05, 0.00011211633682250977, 0.00018146634101867676, 0.00025081634521484375, 0.00032016634941101074, 0.00038951635360717773, 0.0004588663578033447, 0.0005282163619995117, 0.0005975663661956787, 0.0006669163703918457, 0.0007362663745880127, 0.0008056163787841797, 0.0008749663829803467, 0.0009443163871765137, 0.0010136663913726807, 0.0010830163955688477, 0.0011523663997650146, 0.0012217164039611816, 0.0012910664081573486, 0.0013604164123535156, 0.0014297664165496826, 0.0014991164207458496, 0.0015684664249420166, 0.0016378164291381836, 0.0017071664333343506, 0.0017765164375305176, 0.0018458664417266846, 0.0019152164459228516, 0.0019845664501190186, 0.0020539164543151855, 0.0021232664585113525, 0.0021926164627075195, 0.0022619664669036865, 0.0023313164710998535, 0.0024006664752960205, 0.0024700164794921875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 8.0, 6.0, 6.0, 12.0, 20.0, 16.0, 22.0, 32.0, 44.0, 54.0, 59.0, 72.0, 111.0, 167.0, 279.0, 573.0, 2321.0, 966870.0, 75853.0, 944.0, 402.0, 180.0, 128.0, 77.0, 68.0, 41.0, 43.0, 34.0, 15.0, 28.0, 16.0, 8.0, 5.0, 8.0, 9.0, 7.0, 5.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.057708740234375, -0.056049346923828125, -0.05438995361328125, -0.052730560302734375, -0.0510711669921875, -0.049411773681640625, -0.04775238037109375, -0.046092987060546875, -0.04443359375, -0.042774200439453125, -0.04111480712890625, -0.039455413818359375, -0.0377960205078125, -0.036136627197265625, -0.03447723388671875, -0.032817840576171875, -0.031158447265625, -0.029499053955078125, -0.02783966064453125, -0.026180267333984375, -0.0245208740234375, -0.022861480712890625, -0.02120208740234375, -0.019542694091796875, -0.01788330078125, -0.016223907470703125, -0.01456451416015625, -0.012905120849609375, -0.0112457275390625, -0.009586334228515625, -0.00792694091796875, -0.006267547607421875, -0.004608154296875, -0.002948760986328125, -0.00128936767578125, 0.000370025634765625, 0.0020294189453125, 0.003688812255859375, 0.00534820556640625, 0.007007598876953125, 0.0086669921875, 0.010326385498046875, 0.01198577880859375, 0.013645172119140625, 0.0153045654296875, 0.016963958740234375, 0.01862335205078125, 0.020282745361328125, 0.021942138671875, 0.023601531982421875, 0.02526092529296875, 0.026920318603515625, 0.0285797119140625, 0.030239105224609375, 0.03189849853515625, 0.033557891845703125, 0.03521728515625, 0.036876678466796875, 0.03853607177734375, 0.040195465087890625, 0.0418548583984375, 0.043514251708984375, 0.04517364501953125, 0.046833038330078125, 0.048492431640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 15.0, 428.0, 556.0, 17.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02301296591758728, -0.02260955236852169, -0.0222061388194561, -0.02180272527039051, -0.02139931358397007, -0.02099590003490448, -0.02059248648583889, -0.0201890729367733, -0.01978565938770771, -0.01938224583864212, -0.01897883228957653, -0.01857541874051094, -0.0181720070540905, -0.01776859350502491, -0.01736517995595932, -0.01696176640689373, -0.01655835285782814, -0.01615493930876255, -0.01575152575969696, -0.015348113141953945, -0.014944699592888355, -0.01454128697514534, -0.01413787342607975, -0.01373445987701416, -0.013331047259271145, -0.012927633710205555, -0.01252422109246254, -0.01212080754339695, -0.01171739399433136, -0.01131398044526577, -0.010910567827522755, -0.010507154278457165, -0.01010374166071415, -0.00970032811164856, -0.009296915493905544, -0.008893501944839954, -0.008490088395774364, -0.00808667577803135, -0.007683262228965759, -0.007279848679900169, -0.0068764351308345795, -0.006473022047430277, -0.006069608498364687, -0.005666195414960384, -0.0052627818658947945, -0.004859368782490492, -0.004455955699086189, -0.004052542150020599, -0.0036491286009550095, -0.003245715284720063, -0.002842301968485117, -0.0024388888850808144, -0.0020354753360152245, -0.0016320622526109219, -0.0012286489363759756, -0.0008252356201410294, -0.0004218223039060831, -1.8409016774967313e-05, 0.0003850042703561485, 0.0007884175283834338, 0.00119183084461838, 0.0015952440444380045, 0.0019986573606729507, 0.002402070676907897, 0.0028054839931428432]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 11.0, 15.0, 19.0, 14.0, 21.0, 25.0, 33.0, 36.0, 38.0, 26.0, 51.0, 42.0, 45.0, 42.0, 38.0, 50.0, 58.0, 40.0, 48.0, 42.0, 27.0, 32.0, 30.0, 28.0, 25.0, 25.0, 19.0, 24.0, 15.0, 11.0, 10.0, 12.0, 10.0, 4.0, 6.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011220574378967285, -0.001079595647752285, -0.0010371338576078415, -0.000994672067463398, -0.0009522102773189545, -0.000909748487174511, -0.0008672866970300674, -0.0008248249068856239, -0.0007823631167411804, -0.0007399013265967369, -0.0006974395364522934, -0.0006549777463078499, -0.0006125159561634064, -0.0005700541660189629, -0.0005275923758745193, -0.00048513058573007584, -0.0004426687955856323, -0.0004002070054411888, -0.0003577452152967453, -0.0003152834251523018, -0.0002728216350078583, -0.00023035984486341476, -0.00018789805471897125, -0.00014543626457452774, -0.00010297447443008423, -6.0512684285640717e-05, -1.8050894141197205e-05, 2.4410896003246307e-05, 6.687268614768982e-05, 0.00010933447629213333, 0.00015179626643657684, 0.00019425805658102036, 0.00023671984672546387, 0.0002791816368699074, 0.0003216434270143509, 0.0003641052171587944, 0.0004065670073032379, 0.0004490287974476814, 0.0004914905875921249, 0.0005339523777365685, 0.000576414167881012, 0.0006188759580254555, 0.000661337748169899, 0.0007037995383143425, 0.000746261328458786, 0.0007887231186032295, 0.000831184908747673, 0.0008736466988921165, 0.0009161084890365601, 0.0009585702791810036, 0.001001032069325447, 0.0010434938594698906, 0.001085955649614334, 0.0011284174397587776, 0.0011708792299032211, 0.0012133410200476646, 0.0012558028101921082, 0.0012982646003365517, 0.0013407263904809952, 0.0013831881806254387, 0.0014256499707698822, 0.0014681117609143257, 0.0015105735510587692, 0.0015530353412032127, 0.0015954971313476562]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 4.0, 8.0, 8.0, 15.0, 12.0, 7.0, 17.0, 10.0, 11.0, 17.0, 13.0, 31.0, 30.0, 22.0, 24.0, 22.0, 39.0, 19.0, 35.0, 37.0, 47.0, 39.0, 35.0, 41.0, 42.0, 32.0, 38.0, 42.0, 25.0, 41.0, 30.0, 25.0, 24.0, 29.0, 17.0, 16.0, 12.0, 21.0, 10.0, 9.0, 11.0, 5.0, 11.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.453125, -7.21649169921875, -6.9798583984375, -6.74322509765625, -6.506591796875, -6.26995849609375, -6.0333251953125, -5.79669189453125, -5.56005859375, -5.32342529296875, -5.0867919921875, -4.85015869140625, -4.613525390625, -4.37689208984375, -4.1402587890625, -3.90362548828125, -3.6669921875, -3.43035888671875, -3.1937255859375, -2.95709228515625, -2.720458984375, -2.48382568359375, -2.2471923828125, -2.01055908203125, -1.77392578125, -1.53729248046875, -1.3006591796875, -1.06402587890625, -0.827392578125, -0.59075927734375, -0.3541259765625, -0.11749267578125, 0.119140625, 0.35577392578125, 0.5924072265625, 0.82904052734375, 1.065673828125, 1.30230712890625, 1.5389404296875, 1.77557373046875, 2.01220703125, 2.24884033203125, 2.4854736328125, 2.72210693359375, 2.958740234375, 3.19537353515625, 3.4320068359375, 3.66864013671875, 3.9052734375, 4.14190673828125, 4.3785400390625, 4.61517333984375, 4.851806640625, 5.08843994140625, 5.3250732421875, 5.56170654296875, 5.79833984375, 6.03497314453125, 6.2716064453125, 6.50823974609375, 6.744873046875, 6.98150634765625, 7.2181396484375, 7.45477294921875, 7.69140625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 7.0, 8.0, 18.0, 26.0, 22.0, 33.0, 44.0, 56.0, 59.0, 89.0, 105.0, 159.0, 185.0, 295.0, 461.0, 859.0, 1561.0, 2860.0, 6062.0, 13895.0, 35847.0, 102981.0, 358826.0, 358114.0, 103382.0, 35623.0, 13920.0, 6124.0, 2902.0, 1511.0, 855.0, 525.0, 322.0, 214.0, 142.0, 99.0, 67.0, 84.0, 45.0, 46.0, 28.0, 21.0, 18.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.634521484375, -9.32373046875, -9.012939453125, -8.7021484375, -8.391357421875, -8.08056640625, -7.769775390625, -7.458984375, -7.148193359375, -6.83740234375, -6.526611328125, -6.2158203125, -5.905029296875, -5.59423828125, -5.283447265625, -4.97265625, -4.661865234375, -4.35107421875, -4.040283203125, -3.7294921875, -3.418701171875, -3.10791015625, -2.797119140625, -2.486328125, -2.175537109375, -1.86474609375, -1.553955078125, -1.2431640625, -0.932373046875, -0.62158203125, -0.310791015625, 0.0, 0.310791015625, 0.62158203125, 0.932373046875, 1.2431640625, 1.553955078125, 1.86474609375, 2.175537109375, 2.486328125, 2.797119140625, 3.10791015625, 3.418701171875, 3.7294921875, 4.040283203125, 4.35107421875, 4.661865234375, 4.97265625, 5.283447265625, 5.59423828125, 5.905029296875, 6.2158203125, 6.526611328125, 6.83740234375, 7.148193359375, 7.458984375, 7.769775390625, 8.08056640625, 8.391357421875, 8.7021484375, 9.012939453125, 9.32373046875, 9.634521484375, 9.9453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 12.0, 19.0, 22.0, 20.0, 26.0, 29.0, 26.0, 43.0, 36.0, 49.0, 58.0, 71.0, 83.0, 112.0, 1523.0, 296.0, 113.0, 93.0, 54.0, 48.0, 44.0, 39.0, 28.0, 25.0, 27.0, 18.0, 24.0, 14.0, 17.0, 6.0, 11.0, 10.0, 7.0, 7.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.515625, -22.777587890625, -22.03955078125, -21.301513671875, -20.5634765625, -19.825439453125, -19.08740234375, -18.349365234375, -17.611328125, -16.873291015625, -16.13525390625, -15.397216796875, -14.6591796875, -13.921142578125, -13.18310546875, -12.445068359375, -11.70703125, -10.968994140625, -10.23095703125, -9.492919921875, -8.7548828125, -8.016845703125, -7.27880859375, -6.540771484375, -5.802734375, -5.064697265625, -4.32666015625, -3.588623046875, -2.8505859375, -2.112548828125, -1.37451171875, -0.636474609375, 0.1015625, 0.839599609375, 1.57763671875, 2.315673828125, 3.0537109375, 3.791748046875, 4.52978515625, 5.267822265625, 6.005859375, 6.743896484375, 7.48193359375, 8.219970703125, 8.9580078125, 9.696044921875, 10.43408203125, 11.172119140625, 11.91015625, 12.648193359375, 13.38623046875, 14.124267578125, 14.8623046875, 15.600341796875, 16.33837890625, 17.076416015625, 17.814453125, 18.552490234375, 19.29052734375, 20.028564453125, 20.7666015625, 21.504638671875, 22.24267578125, 22.980712890625, 23.71875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 8.0, 7.0, 7.0, 9.0, 9.0, 17.0, 24.0, 21.0, 31.0, 31.0, 41.0, 62.0, 73.0, 107.0, 111.0, 176.0, 234.0, 401.0, 870.0, 4010.0, 49684.0, 2580293.0, 487445.0, 18118.0, 2074.0, 643.0, 299.0, 225.0, 145.0, 122.0, 90.0, 61.0, 56.0, 53.0, 37.0, 28.0, 13.0, 12.0, 9.0, 8.0, 6.0, 11.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-30.921875, -29.979736328125, -29.03759765625, -28.095458984375, -27.1533203125, -26.211181640625, -25.26904296875, -24.326904296875, -23.384765625, -22.442626953125, -21.50048828125, -20.558349609375, -19.6162109375, -18.674072265625, -17.73193359375, -16.789794921875, -15.84765625, -14.905517578125, -13.96337890625, -13.021240234375, -12.0791015625, -11.136962890625, -10.19482421875, -9.252685546875, -8.310546875, -7.368408203125, -6.42626953125, -5.484130859375, -4.5419921875, -3.599853515625, -2.65771484375, -1.715576171875, -0.7734375, 0.168701171875, 1.11083984375, 2.052978515625, 2.9951171875, 3.937255859375, 4.87939453125, 5.821533203125, 6.763671875, 7.705810546875, 8.64794921875, 9.590087890625, 10.5322265625, 11.474365234375, 12.41650390625, 13.358642578125, 14.30078125, 15.242919921875, 16.18505859375, 17.127197265625, 18.0693359375, 19.011474609375, 19.95361328125, 20.895751953125, 21.837890625, 22.780029296875, 23.72216796875, 24.664306640625, 25.6064453125, 26.548583984375, 27.49072265625, 28.432861328125, 29.375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 109.0, 499.0, 340.0, 52.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.66531372070312, -65.9568862915039, -62.24845504760742, -58.54002380371094, -54.83159637451172, -51.123165130615234, -47.41473388671875, -43.70630645751953, -39.99787521362305, -36.28944396972656, -32.581016540527344, -28.87258529663086, -25.164155960083008, -21.455726623535156, -17.747295379638672, -14.03886604309082, -10.330436706542969, -6.622006893157959, -2.913577079772949, 0.7948532104492188, 4.50328254699707, 8.211711883544922, 11.920143127441406, 15.628572463989258, 19.33700180053711, 23.04543113708496, 26.753860473632812, 30.462291717529297, 34.17072296142578, 37.879150390625, 41.587581634521484, 45.29601287841797, 49.00444030761719, 52.71287155151367, 56.42129898071289, 60.129730224609375, 63.838157653808594, 67.54658508300781, 71.25502014160156, 74.96344757080078, 78.671875, 82.38030242919922, 86.08873748779297, 89.79716491699219, 93.5055923461914, 97.21401977539062, 100.92245483398438, 104.6308822631836, 108.33931732177734, 112.04774475097656, 115.75617980957031, 119.46460723876953, 123.17303466796875, 126.8814697265625, 130.58990478515625, 134.29832458496094, 138.0067596435547, 141.71519470214844, 145.42361450195312, 149.13204956054688, 152.84048461914062, 156.5489044189453, 160.25733947753906, 163.9657745361328, 167.6741943359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 5.0, 2.0, 8.0, 5.0, 11.0, 11.0, 10.0, 12.0, 19.0, 9.0, 23.0, 17.0, 18.0, 20.0, 26.0, 30.0, 29.0, 30.0, 41.0, 40.0, 44.0, 28.0, 30.0, 31.0, 28.0, 29.0, 40.0, 41.0, 47.0, 34.0, 36.0, 22.0, 30.0, 26.0, 30.0, 23.0, 19.0, 18.0, 14.0, 11.0, 10.0, 11.0, 6.0, 9.0, 5.0, 3.0, 5.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-51.13078308105469, -49.60908889770508, -48.087398529052734, -46.565704345703125, -45.04401397705078, -43.52231979370117, -42.00062561035156, -40.47893524169922, -38.95724105834961, -37.435546875, -35.913856506347656, -34.39216232299805, -32.87046813964844, -31.348777770996094, -29.827083587646484, -28.305391311645508, -26.78369903564453, -25.262006759643555, -23.740314483642578, -22.21862030029297, -20.696928024291992, -19.175235748291016, -17.653541564941406, -16.13184928894043, -14.610157012939453, -13.088464736938477, -11.566771507263184, -10.04507827758789, -8.523386001586914, -7.001693248748779, -5.4800004959106445, -3.9583072662353516, -2.436614990234375, -0.9149222373962402, 0.6067705154418945, 2.1284632682800293, 3.650156021118164, 5.171848773956299, 6.693541526794434, 8.215234756469727, 9.736927032470703, 11.25861930847168, 12.780312538146973, 14.302005767822266, 15.823698043823242, 17.34539031982422, 18.867084503173828, 20.388776779174805, 21.91046905517578, 23.432161331176758, 24.953853607177734, 26.475547790527344, 27.99724006652832, 29.518932342529297, 31.040626525878906, 32.56231689453125, 34.08401107788086, 35.60570526123047, 37.12739562988281, 38.64908981323242, 40.17078399658203, 41.692474365234375, 43.214168548583984, 44.735862731933594, 46.25755310058594]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 0.0, 3.0, 8.0, 6.0, 7.0, 9.0, 13.0, 9.0, 14.0, 20.0, 14.0, 23.0, 28.0, 30.0, 34.0, 20.0, 21.0, 48.0, 31.0, 40.0, 43.0, 38.0, 52.0, 38.0, 36.0, 49.0, 41.0, 34.0, 44.0, 42.0, 30.0, 25.0, 26.0, 24.0, 22.0, 9.0, 7.0, 22.0, 11.0, 10.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7109375, -8.443603515625, -8.17626953125, -7.908935546875, -7.6416015625, -7.374267578125, -7.10693359375, -6.839599609375, -6.572265625, -6.304931640625, -6.03759765625, -5.770263671875, -5.5029296875, -5.235595703125, -4.96826171875, -4.700927734375, -4.43359375, -4.166259765625, -3.89892578125, -3.631591796875, -3.3642578125, -3.096923828125, -2.82958984375, -2.562255859375, -2.294921875, -2.027587890625, -1.76025390625, -1.492919921875, -1.2255859375, -0.958251953125, -0.69091796875, -0.423583984375, -0.15625, 0.111083984375, 0.37841796875, 0.645751953125, 0.9130859375, 1.180419921875, 1.44775390625, 1.715087890625, 1.982421875, 2.249755859375, 2.51708984375, 2.784423828125, 3.0517578125, 3.319091796875, 3.58642578125, 3.853759765625, 4.12109375, 4.388427734375, 4.65576171875, 4.923095703125, 5.1904296875, 5.457763671875, 5.72509765625, 5.992431640625, 6.259765625, 6.527099609375, 6.79443359375, 7.061767578125, 7.3291015625, 7.596435546875, 7.86376953125, 8.131103515625, 8.3984375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 13.0, 13.0, 12.0, 20.0, 15.0, 28.0, 17.0, 41.0, 39.0, 73.0, 159.0, 348.0, 1107.0, 5046.0, 50681.0, 1739928.0, 2310008.0, 77750.0, 6686.0, 1387.0, 417.0, 183.0, 79.0, 46.0, 25.0, 29.0, 16.0, 12.0, 13.0, 20.0, 9.0, 10.0, 12.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.5927734375, -20.794921875, -19.9970703125, -19.19921875, -18.4013671875, -17.603515625, -16.8056640625, -16.0078125, -15.2099609375, -14.412109375, -13.6142578125, -12.81640625, -12.0185546875, -11.220703125, -10.4228515625, -9.625, -8.8271484375, -8.029296875, -7.2314453125, -6.43359375, -5.6357421875, -4.837890625, -4.0400390625, -3.2421875, -2.4443359375, -1.646484375, -0.8486328125, -0.05078125, 0.7470703125, 1.544921875, 2.3427734375, 3.140625, 3.9384765625, 4.736328125, 5.5341796875, 6.33203125, 7.1298828125, 7.927734375, 8.7255859375, 9.5234375, 10.3212890625, 11.119140625, 11.9169921875, 12.71484375, 13.5126953125, 14.310546875, 15.1083984375, 15.90625, 16.7041015625, 17.501953125, 18.2998046875, 19.09765625, 19.8955078125, 20.693359375, 21.4912109375, 22.2890625, 23.0869140625, 23.884765625, 24.6826171875, 25.48046875, 26.2783203125, 27.076171875, 27.8740234375, 28.671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 7.0, 2.0, 13.0, 23.0, 30.0, 28.0, 47.0, 79.0, 100.0, 147.0, 228.0, 334.0, 502.0, 663.0, 560.0, 437.0, 295.0, 194.0, 112.0, 88.0, 61.0, 42.0, 23.0, 16.0, 11.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.3734130859375, -11.926513671875, -11.4796142578125, -11.03271484375, -10.5858154296875, -10.138916015625, -9.6920166015625, -9.2451171875, -8.7982177734375, -8.351318359375, -7.9044189453125, -7.45751953125, -7.0106201171875, -6.563720703125, -6.1168212890625, -5.669921875, -5.2230224609375, -4.776123046875, -4.3292236328125, -3.88232421875, -3.4354248046875, -2.988525390625, -2.5416259765625, -2.0947265625, -1.6478271484375, -1.200927734375, -0.7540283203125, -0.30712890625, 0.1397705078125, 0.586669921875, 1.0335693359375, 1.48046875, 1.9273681640625, 2.374267578125, 2.8211669921875, 3.26806640625, 3.7149658203125, 4.161865234375, 4.6087646484375, 5.0556640625, 5.5025634765625, 5.949462890625, 6.3963623046875, 6.84326171875, 7.2901611328125, 7.737060546875, 8.1839599609375, 8.630859375, 9.0777587890625, 9.524658203125, 9.9715576171875, 10.41845703125, 10.8653564453125, 11.312255859375, 11.7591552734375, 12.2060546875, 12.6529541015625, 13.099853515625, 13.5467529296875, 13.99365234375, 14.4405517578125, 14.887451171875, 15.3343505859375, 15.78125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 12.0, 15.0, 15.0, 26.0, 34.0, 55.0, 106.0, 195.0, 512.0, 1304.0, 5183.0, 41418.0, 1027099.0, 3013372.0, 92669.0, 9083.0, 1839.0, 710.0, 271.0, 135.0, 69.0, 40.0, 28.0, 31.0, 15.0, 16.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.484375, -27.539794921875, -26.59521484375, -25.650634765625, -24.7060546875, -23.761474609375, -22.81689453125, -21.872314453125, -20.927734375, -19.983154296875, -19.03857421875, -18.093994140625, -17.1494140625, -16.204833984375, -15.26025390625, -14.315673828125, -13.37109375, -12.426513671875, -11.48193359375, -10.537353515625, -9.5927734375, -8.648193359375, -7.70361328125, -6.759033203125, -5.814453125, -4.869873046875, -3.92529296875, -2.980712890625, -2.0361328125, -1.091552734375, -0.14697265625, 0.797607421875, 1.7421875, 2.686767578125, 3.63134765625, 4.575927734375, 5.5205078125, 6.465087890625, 7.40966796875, 8.354248046875, 9.298828125, 10.243408203125, 11.18798828125, 12.132568359375, 13.0771484375, 14.021728515625, 14.96630859375, 15.910888671875, 16.85546875, 17.800048828125, 18.74462890625, 19.689208984375, 20.6337890625, 21.578369140625, 22.52294921875, 23.467529296875, 24.412109375, 25.356689453125, 26.30126953125, 27.245849609375, 28.1904296875, 29.135009765625, 30.07958984375, 31.024169921875, 31.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 12.0, 41.0, 81.0, 145.0, 173.0, 210.0, 157.0, 81.0, 67.0, 26.0, 12.0, 3.0, 1.0], "bins": [-129.12672424316406, -126.8286361694336, -124.53054809570312, -122.23246002197266, -119.93437194824219, -117.63627624511719, -115.33818817138672, -113.04010009765625, -110.74201202392578, -108.44392395019531, -106.14583587646484, -103.84774780273438, -101.54965209960938, -99.2515640258789, -96.95347595214844, -94.65538787841797, -92.3572998046875, -90.05921173095703, -87.76112365722656, -85.4630355834961, -83.16494750976562, -80.86685180664062, -78.56876373291016, -76.27067565917969, -73.97258758544922, -71.67449951171875, -69.37641143798828, -67.07832336425781, -64.78022766113281, -62.48214340209961, -60.184051513671875, -57.885963439941406, -55.58788299560547, -53.289794921875, -50.99170684814453, -48.6936149597168, -46.39552688598633, -44.09743881225586, -41.799346923828125, -39.501258850097656, -37.20317077636719, -34.90508270263672, -32.60699462890625, -30.308902740478516, -28.010814666748047, -25.712726593017578, -23.414636611938477, -21.116546630859375, -18.818456649780273, -16.520366668701172, -14.222278594970703, -11.924189567565918, -9.626100540161133, -7.328011512756348, -5.0299224853515625, -2.731832504272461, -0.4337444305419922, 1.864344596862793, 4.162433624267578, 6.460522651672363, 8.758611679077148, 11.056700706481934, 13.354789733886719, 15.65287971496582, 17.95096778869629]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 6.0, 11.0, 7.0, 16.0, 21.0, 23.0, 26.0, 25.0, 23.0, 30.0, 29.0, 43.0, 29.0, 37.0, 40.0, 50.0, 42.0, 42.0, 42.0, 37.0, 53.0, 47.0, 43.0, 40.0, 35.0, 33.0, 26.0, 29.0, 25.0, 22.0, 9.0, 10.0, 9.0, 10.0, 6.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.24957275390625, -42.88689422607422, -41.52421569824219, -40.161537170410156, -38.798858642578125, -37.436180114746094, -36.07350158691406, -34.71082305908203, -33.34814453125, -31.98546600341797, -30.622787475585938, -29.260108947753906, -27.897430419921875, -26.534751892089844, -25.172073364257812, -23.80939483642578, -22.44671630859375, -21.08403778076172, -19.721359252929688, -18.358680725097656, -16.996002197265625, -15.633323669433594, -14.270645141601562, -12.907966613769531, -11.5452880859375, -10.182609558105469, -8.819931030273438, -7.457252502441406, -6.094573974609375, -4.731895446777344, -3.3692169189453125, -2.0065383911132812, -0.64385986328125, 0.7188186645507812, 2.0814971923828125, 3.4441757202148438, 4.806854248046875, 6.169532775878906, 7.5322113037109375, 8.894889831542969, 10.257568359375, 11.620246887207031, 12.982925415039062, 14.345603942871094, 15.708282470703125, 17.070960998535156, 18.433639526367188, 19.79631805419922, 21.15899658203125, 22.52167510986328, 23.884353637695312, 25.247032165527344, 26.609710693359375, 27.972389221191406, 29.335067749023438, 30.69774627685547, 32.0604248046875, 33.42310333251953, 34.78578186035156, 36.148460388183594, 37.511138916015625, 38.873817443847656, 40.23649597167969, 41.59917449951172, 42.96185302734375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 10.0, 9.0, 9.0, 13.0, 15.0, 19.0, 17.0, 27.0, 27.0, 32.0, 30.0, 31.0, 17.0, 25.0, 43.0, 30.0, 32.0, 37.0, 31.0, 39.0, 49.0, 33.0, 36.0, 37.0, 37.0, 31.0, 25.0, 31.0, 23.0, 20.0, 24.0, 17.0, 7.0, 18.0, 19.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.71875, -7.47515869140625, -7.2315673828125, -6.98797607421875, -6.744384765625, -6.50079345703125, -6.2572021484375, -6.01361083984375, -5.77001953125, -5.52642822265625, -5.2828369140625, -5.03924560546875, -4.795654296875, -4.55206298828125, -4.3084716796875, -4.06488037109375, -3.8212890625, -3.57769775390625, -3.3341064453125, -3.09051513671875, -2.846923828125, -2.60333251953125, -2.3597412109375, -2.11614990234375, -1.87255859375, -1.62896728515625, -1.3853759765625, -1.14178466796875, -0.898193359375, -0.65460205078125, -0.4110107421875, -0.16741943359375, 0.076171875, 0.31976318359375, 0.5633544921875, 0.80694580078125, 1.050537109375, 1.29412841796875, 1.5377197265625, 1.78131103515625, 2.02490234375, 2.26849365234375, 2.5120849609375, 2.75567626953125, 2.999267578125, 3.24285888671875, 3.4864501953125, 3.73004150390625, 3.9736328125, 4.21722412109375, 4.4608154296875, 4.70440673828125, 4.947998046875, 5.19158935546875, 5.4351806640625, 5.67877197265625, 5.92236328125, 6.16595458984375, 6.4095458984375, 6.65313720703125, 6.896728515625, 7.14031982421875, 7.3839111328125, 7.62750244140625, 7.87109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 16.0, 19.0, 30.0, 46.0, 57.0, 92.0, 130.0, 194.0, 267.0, 452.0, 596.0, 937.0, 1408.0, 2177.0, 3265.0, 4907.0, 7937.0, 11961.0, 19186.0, 30842.0, 50988.0, 87215.0, 158544.0, 244665.0, 176868.0, 97483.0, 56293.0, 33767.0, 20802.0, 12924.0, 8560.0, 5399.0, 3536.0, 2364.0, 1508.0, 1010.0, 694.0, 426.0, 340.0, 216.0, 138.0, 99.0, 63.0, 47.0, 21.0, 19.0, 13.0, 12.0, 9.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.2119140625, -1.173553466796875, -1.13519287109375, -1.096832275390625, -1.0584716796875, -1.020111083984375, -0.98175048828125, -0.943389892578125, -0.905029296875, -0.866668701171875, -0.82830810546875, -0.789947509765625, -0.7515869140625, -0.713226318359375, -0.67486572265625, -0.636505126953125, -0.59814453125, -0.559783935546875, -0.52142333984375, -0.483062744140625, -0.4447021484375, -0.406341552734375, -0.36798095703125, -0.329620361328125, -0.291259765625, -0.252899169921875, -0.21453857421875, -0.176177978515625, -0.1378173828125, -0.099456787109375, -0.06109619140625, -0.022735595703125, 0.015625, 0.053985595703125, 0.09234619140625, 0.130706787109375, 0.1690673828125, 0.207427978515625, 0.24578857421875, 0.284149169921875, 0.322509765625, 0.360870361328125, 0.39923095703125, 0.437591552734375, 0.4759521484375, 0.514312744140625, 0.55267333984375, 0.591033935546875, 0.62939453125, 0.667755126953125, 0.70611572265625, 0.744476318359375, 0.7828369140625, 0.821197509765625, 0.85955810546875, 0.897918701171875, 0.936279296875, 0.974639892578125, 1.01300048828125, 1.051361083984375, 1.0897216796875, 1.128082275390625, 1.16644287109375, 1.204803466796875, 1.2431640625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 7.0, 10.0, 4.0, 11.0, 11.0, 13.0, 11.0, 16.0, 18.0, 19.0, 20.0, 33.0, 20.0, 29.0, 26.0, 29.0, 36.0, 33.0, 42.0, 47.0, 28.0, 45.0, 1069.0, 42.0, 40.0, 32.0, 34.0, 39.0, 32.0, 23.0, 26.0, 31.0, 24.0, 17.0, 18.0, 11.0, 11.0, 13.0, 11.0, 7.0, 8.0, 8.0, 4.0, 6.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.2998046875, -5.134765625, -4.9697265625, -4.8046875, -4.6396484375, -4.474609375, -4.3095703125, -4.14453125, -3.9794921875, -3.814453125, -3.6494140625, -3.484375, -3.3193359375, -3.154296875, -2.9892578125, -2.82421875, -2.6591796875, -2.494140625, -2.3291015625, -2.1640625, -1.9990234375, -1.833984375, -1.6689453125, -1.50390625, -1.3388671875, -1.173828125, -1.0087890625, -0.84375, -0.6787109375, -0.513671875, -0.3486328125, -0.18359375, -0.0185546875, 0.146484375, 0.3115234375, 0.4765625, 0.6416015625, 0.806640625, 0.9716796875, 1.13671875, 1.3017578125, 1.466796875, 1.6318359375, 1.796875, 1.9619140625, 2.126953125, 2.2919921875, 2.45703125, 2.6220703125, 2.787109375, 2.9521484375, 3.1171875, 3.2822265625, 3.447265625, 3.6123046875, 3.77734375, 3.9423828125, 4.107421875, 4.2724609375, 4.4375, 4.6025390625, 4.767578125, 4.9326171875, 5.09765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 11.0, 12.0, 18.0, 28.0, 40.0, 61.0, 102.0, 111.0, 185.0, 276.0, 393.0, 546.0, 801.0, 1161.0, 1651.0, 2425.0, 3586.0, 5315.0, 8161.0, 12355.0, 19315.0, 30482.0, 48677.0, 82923.0, 149568.0, 1282846.0, 183908.0, 101744.0, 58508.0, 36091.0, 22511.0, 14618.0, 9505.0, 6218.0, 4129.0, 2769.0, 1925.0, 1308.0, 908.0, 577.0, 417.0, 291.0, 216.0, 144.0, 98.0, 66.0, 41.0, 28.0, 29.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0078125, -0.9759979248046875, -0.944183349609375, -0.9123687744140625, -0.88055419921875, -0.8487396240234375, -0.816925048828125, -0.7851104736328125, -0.7532958984375, -0.7214813232421875, -0.689666748046875, -0.6578521728515625, -0.62603759765625, -0.5942230224609375, -0.562408447265625, -0.5305938720703125, -0.498779296875, -0.4669647216796875, -0.435150146484375, -0.4033355712890625, -0.37152099609375, -0.3397064208984375, -0.307891845703125, -0.2760772705078125, -0.2442626953125, -0.2124481201171875, -0.180633544921875, -0.1488189697265625, -0.11700439453125, -0.0851898193359375, -0.053375244140625, -0.0215606689453125, 0.01025390625, 0.0420684814453125, 0.073883056640625, 0.1056976318359375, 0.13751220703125, 0.1693267822265625, 0.201141357421875, 0.2329559326171875, 0.2647705078125, 0.2965850830078125, 0.328399658203125, 0.3602142333984375, 0.39202880859375, 0.4238433837890625, 0.455657958984375, 0.4874725341796875, 0.519287109375, 0.5511016845703125, 0.582916259765625, 0.6147308349609375, 0.64654541015625, 0.6783599853515625, 0.710174560546875, 0.7419891357421875, 0.7738037109375, 0.8056182861328125, 0.837432861328125, 0.8692474365234375, 0.90106201171875, 0.9328765869140625, 0.964691162109375, 0.9965057373046875, 1.0283203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 4.0, 8.0, 13.0, 9.0, 10.0, 11.0, 19.0, 24.0, 34.0, 30.0, 44.0, 54.0, 62.0, 73.0, 75.0, 65.0, 68.0, 60.0, 58.0, 34.0, 48.0, 45.0, 24.0, 35.0, 17.0, 28.0, 12.0, 13.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 3.0], "bins": [-0.00455474853515625, -0.004450559616088867, -0.004346370697021484, -0.0042421817779541016, -0.004137992858886719, -0.004033803939819336, -0.003929615020751953, -0.0038254261016845703, -0.0037212371826171875, -0.0036170482635498047, -0.003512859344482422, -0.003408670425415039, -0.0033044815063476562, -0.0032002925872802734, -0.0030961036682128906, -0.002991914749145508, -0.002887725830078125, -0.002783536911010742, -0.0026793479919433594, -0.0025751590728759766, -0.0024709701538085938, -0.002366781234741211, -0.002262592315673828, -0.0021584033966064453, -0.0020542144775390625, -0.0019500255584716797, -0.0018458366394042969, -0.001741647720336914, -0.0016374588012695312, -0.0015332698822021484, -0.0014290809631347656, -0.0013248920440673828, -0.001220703125, -0.0011165142059326172, -0.0010123252868652344, -0.0009081363677978516, -0.0008039474487304688, -0.0006997585296630859, -0.0005955696105957031, -0.0004913806915283203, -0.0003871917724609375, -0.0002830028533935547, -0.00017881393432617188, -7.462501525878906e-05, 2.956390380859375e-05, 0.00013375282287597656, 0.00023794174194335938, 0.0003421306610107422, 0.000446319580078125, 0.0005505084991455078, 0.0006546974182128906, 0.0007588863372802734, 0.0008630752563476562, 0.0009672641754150391, 0.0010714530944824219, 0.0011756420135498047, 0.0012798309326171875, 0.0013840198516845703, 0.0014882087707519531, 0.001592397689819336, 0.0016965866088867188, 0.0018007755279541016, 0.0019049644470214844, 0.002009153366088867, 0.00211334228515625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 14.0, 10.0, 17.0, 19.0, 26.0, 46.0, 50.0, 63.0, 103.0, 124.0, 212.0, 480.0, 1345.0, 986902.0, 57281.0, 834.0, 364.0, 219.0, 104.0, 83.0, 60.0, 51.0, 32.0, 28.0, 17.0, 17.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04730224609375, -0.04503059387207031, -0.042758941650390625, -0.04048728942871094, -0.03821563720703125, -0.03594398498535156, -0.033672332763671875, -0.03140068054199219, -0.0291290283203125, -0.026857376098632812, -0.024585723876953125, -0.022314071655273438, -0.02004241943359375, -0.017770767211914062, -0.015499114990234375, -0.013227462768554688, -0.010955810546875, -0.008684158325195312, -0.006412506103515625, -0.0041408538818359375, -0.00186920166015625, 0.0004024505615234375, 0.002674102783203125, 0.0049457550048828125, 0.0072174072265625, 0.009489059448242188, 0.011760711669921875, 0.014032363891601562, 0.01630401611328125, 0.018575668334960938, 0.020847320556640625, 0.023118972778320312, 0.025390625, 0.027662277221679688, 0.029933929443359375, 0.03220558166503906, 0.03447723388671875, 0.03674888610839844, 0.039020538330078125, 0.04129219055175781, 0.0435638427734375, 0.04583549499511719, 0.048107147216796875, 0.05037879943847656, 0.05265045166015625, 0.05492210388183594, 0.057193756103515625, 0.05946540832519531, 0.061737060546875, 0.06400871276855469, 0.06628036499023438, 0.06855201721191406, 0.07082366943359375, 0.07309532165527344, 0.07536697387695312, 0.07763862609863281, 0.0799102783203125, 0.08218193054199219, 0.08445358276367188, 0.08672523498535156, 0.08899688720703125, 0.09126853942871094, 0.09354019165039062, 0.09581184387207031, 0.09808349609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 838.0, 159.0, 2.0, 1.0, 1.0], "bins": [-0.03422731161117554, -0.033654142171144485, -0.033080969005823135, -0.032507799565792084, -0.031934626400470734, -0.03136145696043968, -0.03078828565776348, -0.03021511435508728, -0.02964194305241108, -0.02906877174973488, -0.028495600447058678, -0.027922429144382477, -0.027349259704351425, -0.026776088401675224, -0.026202917098999023, -0.025629745796322823, -0.02505657449364662, -0.02448340319097042, -0.02391023188829422, -0.02333706244826317, -0.022763891145586967, -0.022190719842910767, -0.021617548540234566, -0.021044377237558365, -0.020471207797527313, -0.019898036494851112, -0.01932486519217491, -0.01875169575214386, -0.01817852444946766, -0.017605353146791458, -0.017032181844115257, -0.016459010541439056, -0.015885837376117706, -0.015312666073441505, -0.01473949570208788, -0.014166324399411678, -0.013593153096735477, -0.013019982725381851, -0.01244681142270565, -0.01187364012002945, -0.011300469748675823, -0.010727298445999622, -0.010154128074645996, -0.009580956771969795, -0.009007785469293594, -0.008434614166617393, -0.007861443795263767, -0.007288272492587566, -0.00671510212123394, -0.0061419312842190266, -0.005568759981542826, -0.004995589144527912, -0.004422417841851711, -0.0038492470048367977, -0.003276076167821884, -0.0027029048651456833, -0.002129733795300126, -0.0015565627254545689, -0.0009833917720243335, -0.0004102208185940981, 0.00016295025125145912, 0.0007361213210970163, 0.00130929215811193, 0.0018824634607881308, 0.0024556342978030443]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 8.0, 4.0, 4.0, 11.0, 8.0, 17.0, 14.0, 21.0, 23.0, 22.0, 31.0, 27.0, 30.0, 36.0, 48.0, 37.0, 47.0, 41.0, 37.0, 42.0, 42.0, 44.0, 46.0, 40.0, 30.0, 28.0, 35.0, 34.0, 34.0, 15.0, 23.0, 19.0, 20.0, 15.0, 10.0, 10.0, 11.0, 7.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0014938712120056152, -0.0014473311603069305, -0.0014007911086082458, -0.0013542510569095612, -0.0013077110052108765, -0.0012611709535121918, -0.001214630901813507, -0.0011680908501148224, -0.0011215507984161377, -0.001075010746717453, -0.0010284706950187683, -0.0009819306433200836, -0.0009353905916213989, -0.0008888505399227142, -0.0008423104882240295, -0.0007957704365253448, -0.0007492303848266602, -0.0007026903331279755, -0.0006561502814292908, -0.0006096102297306061, -0.0005630701780319214, -0.0005165301263332367, -0.000469990074634552, -0.0004234500229358673, -0.0003769099712371826, -0.0003303699195384979, -0.00028382986783981323, -0.00023728981614112854, -0.00019074976444244385, -0.00014420971274375916, -9.766966104507446e-05, -5.112960934638977e-05, -4.589557647705078e-06, 4.1950494050979614e-05, 8.84905457496643e-05, 0.000135030597448349, 0.0001815706491470337, 0.00022811070084571838, 0.0002746507525444031, 0.00032119080424308777, 0.00036773085594177246, 0.00041427090764045715, 0.00046081095933914185, 0.0005073510110378265, 0.0005538910627365112, 0.0006004311144351959, 0.0006469711661338806, 0.0006935112178325653, 0.00074005126953125, 0.0007865913212299347, 0.0008331313729286194, 0.0008796714246273041, 0.0009262114763259888, 0.0009727515280246735, 0.0010192915797233582, 0.0010658316314220428, 0.0011123716831207275, 0.0011589117348194122, 0.001205451786518097, 0.0012519918382167816, 0.0012985318899154663, 0.001345071941614151, 0.0013916119933128357, 0.0014381520450115204, 0.001484692096710205]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 12.0, 10.0, 9.0, 9.0, 13.0, 15.0, 19.0, 17.0, 27.0, 27.0, 32.0, 30.0, 31.0, 17.0, 25.0, 43.0, 30.0, 32.0, 37.0, 32.0, 38.0, 49.0, 33.0, 36.0, 37.0, 37.0, 31.0, 25.0, 31.0, 24.0, 19.0, 24.0, 17.0, 7.0, 18.0, 19.0, 15.0, 9.0, 7.0, 7.0, 7.0, 7.0, 6.0, 0.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.71875, -7.47515869140625, -7.2315673828125, -6.98797607421875, -6.744384765625, -6.50079345703125, -6.2572021484375, -6.01361083984375, -5.77001953125, -5.52642822265625, -5.2828369140625, -5.03924560546875, -4.795654296875, -4.55206298828125, -4.3084716796875, -4.06488037109375, -3.8212890625, -3.57769775390625, -3.3341064453125, -3.09051513671875, -2.846923828125, -2.60333251953125, -2.3597412109375, -2.11614990234375, -1.87255859375, -1.62896728515625, -1.3853759765625, -1.14178466796875, -0.898193359375, -0.65460205078125, -0.4110107421875, -0.16741943359375, 0.076171875, 0.31976318359375, 0.5633544921875, 0.80694580078125, 1.050537109375, 1.29412841796875, 1.5377197265625, 1.78131103515625, 2.02490234375, 2.26849365234375, 2.5120849609375, 2.75567626953125, 2.999267578125, 3.24285888671875, 3.4864501953125, 3.73004150390625, 3.9736328125, 4.21722412109375, 4.4608154296875, 4.70440673828125, 4.947998046875, 5.19158935546875, 5.4351806640625, 5.67877197265625, 5.92236328125, 6.16595458984375, 6.4095458984375, 6.65313720703125, 6.896728515625, 7.14031982421875, 7.3839111328125, 7.62750244140625, 7.87109375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 12.0, 5.0, 6.0, 12.0, 11.0, 23.0, 32.0, 41.0, 38.0, 65.0, 72.0, 129.0, 177.0, 238.0, 329.0, 542.0, 764.0, 1350.0, 2310.0, 4629.0, 10586.0, 29583.0, 93945.0, 315275.0, 396628.0, 126760.0, 38657.0, 13520.0, 5573.0, 2799.0, 1535.0, 962.0, 635.0, 365.0, 257.0, 165.0, 141.0, 112.0, 76.0, 39.0, 39.0, 35.0, 29.0, 11.0, 15.0, 12.0, 7.0, 5.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.6072998046875, -10.277099609375, -9.9468994140625, -9.61669921875, -9.2864990234375, -8.956298828125, -8.6260986328125, -8.2958984375, -7.9656982421875, -7.635498046875, -7.3052978515625, -6.97509765625, -6.6448974609375, -6.314697265625, -5.9844970703125, -5.654296875, -5.3240966796875, -4.993896484375, -4.6636962890625, -4.33349609375, -4.0032958984375, -3.673095703125, -3.3428955078125, -3.0126953125, -2.6824951171875, -2.352294921875, -2.0220947265625, -1.69189453125, -1.3616943359375, -1.031494140625, -0.7012939453125, -0.37109375, -0.0408935546875, 0.289306640625, 0.6195068359375, 0.94970703125, 1.2799072265625, 1.610107421875, 1.9403076171875, 2.2705078125, 2.6007080078125, 2.930908203125, 3.2611083984375, 3.59130859375, 3.9215087890625, 4.251708984375, 4.5819091796875, 4.912109375, 5.2423095703125, 5.572509765625, 5.9027099609375, 6.23291015625, 6.5631103515625, 6.893310546875, 7.2235107421875, 7.5537109375, 7.8839111328125, 8.214111328125, 8.5443115234375, 8.87451171875, 9.2047119140625, 9.534912109375, 9.8651123046875, 10.1953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 5.0, 12.0, 10.0, 13.0, 24.0, 10.0, 28.0, 16.0, 34.0, 33.0, 43.0, 43.0, 36.0, 58.0, 67.0, 96.0, 236.0, 1555.0, 196.0, 104.0, 60.0, 58.0, 41.0, 46.0, 37.0, 27.0, 37.0, 29.0, 16.0, 18.0, 15.0, 10.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.515625, -21.7236328125, -20.931640625, -20.1396484375, -19.34765625, -18.5556640625, -17.763671875, -16.9716796875, -16.1796875, -15.3876953125, -14.595703125, -13.8037109375, -13.01171875, -12.2197265625, -11.427734375, -10.6357421875, -9.84375, -9.0517578125, -8.259765625, -7.4677734375, -6.67578125, -5.8837890625, -5.091796875, -4.2998046875, -3.5078125, -2.7158203125, -1.923828125, -1.1318359375, -0.33984375, 0.4521484375, 1.244140625, 2.0361328125, 2.828125, 3.6201171875, 4.412109375, 5.2041015625, 5.99609375, 6.7880859375, 7.580078125, 8.3720703125, 9.1640625, 9.9560546875, 10.748046875, 11.5400390625, 12.33203125, 13.1240234375, 13.916015625, 14.7080078125, 15.5, 16.2919921875, 17.083984375, 17.8759765625, 18.66796875, 19.4599609375, 20.251953125, 21.0439453125, 21.8359375, 22.6279296875, 23.419921875, 24.2119140625, 25.00390625, 25.7958984375, 26.587890625, 27.3798828125, 28.171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 15.0, 18.0, 22.0, 32.0, 43.0, 47.0, 56.0, 115.0, 198.0, 282.0, 515.0, 1065.0, 12268.0, 2788796.0, 336438.0, 3876.0, 769.0, 349.0, 227.0, 148.0, 88.0, 95.0, 57.0, 46.0, 36.0, 26.0, 24.0, 17.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.5, -50.99267578125, -49.4853515625, -47.97802734375, -46.470703125, -44.96337890625, -43.4560546875, -41.94873046875, -40.44140625, -38.93408203125, -37.4267578125, -35.91943359375, -34.412109375, -32.90478515625, -31.3974609375, -29.89013671875, -28.3828125, -26.87548828125, -25.3681640625, -23.86083984375, -22.353515625, -20.84619140625, -19.3388671875, -17.83154296875, -16.32421875, -14.81689453125, -13.3095703125, -11.80224609375, -10.294921875, -8.78759765625, -7.2802734375, -5.77294921875, -4.265625, -2.75830078125, -1.2509765625, 0.25634765625, 1.763671875, 3.27099609375, 4.7783203125, 6.28564453125, 7.79296875, 9.30029296875, 10.8076171875, 12.31494140625, 13.822265625, 15.32958984375, 16.8369140625, 18.34423828125, 19.8515625, 21.35888671875, 22.8662109375, 24.37353515625, 25.880859375, 27.38818359375, 28.8955078125, 30.40283203125, 31.91015625, 33.41748046875, 34.9248046875, 36.43212890625, 37.939453125, 39.44677734375, 40.9541015625, 42.46142578125, 43.96875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 133.0, 771.0, 100.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-325.0115661621094, -318.57366943359375, -312.1357727050781, -305.6978759765625, -299.25994873046875, -292.8220520019531, -286.3841552734375, -279.9462585449219, -273.50836181640625, -267.0704650878906, -260.632568359375, -254.1946563720703, -247.7567596435547, -241.31886291503906, -234.88095092773438, -228.44305419921875, -222.00515747070312, -215.5672607421875, -209.12936401367188, -202.6914520263672, -196.25355529785156, -189.81565856933594, -183.37774658203125, -176.93984985351562, -170.501953125, -164.06405639648438, -157.62615966796875, -151.18824768066406, -144.75035095214844, -138.3124542236328, -131.87454223632812, -125.4366455078125, -118.99876403808594, -112.56086730957031, -106.12296295166016, -99.68505859375, -93.24716186523438, -86.80926513671875, -80.3713607788086, -73.93345642089844, -67.49555969238281, -61.05765914916992, -54.61975860595703, -48.18185806274414, -41.74395751953125, -35.30605697631836, -28.86815643310547, -22.430255889892578, -15.992355346679688, -9.554454803466797, -3.1165542602539062, 3.3213462829589844, 9.759246826171875, 16.197147369384766, 22.635047912597656, 29.072948455810547, 35.51084899902344, 41.94874954223633, 48.38665008544922, 54.82455062866211, 61.262451171875, 67.70034790039062, 74.13825225830078, 80.57615661621094, 87.01405334472656]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 7.0, 7.0, 5.0, 12.0, 14.0, 14.0, 18.0, 23.0, 24.0, 24.0, 27.0, 22.0, 34.0, 32.0, 54.0, 43.0, 43.0, 49.0, 51.0, 44.0, 45.0, 39.0, 33.0, 34.0, 40.0, 48.0, 26.0, 25.0, 23.0, 22.0, 24.0, 16.0, 12.0, 12.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-61.96592330932617, -60.257659912109375, -58.54939270019531, -56.841129302978516, -55.13286590576172, -53.424598693847656, -51.71633529663086, -50.00807189941406, -48.2998046875, -46.5915412902832, -44.88327407836914, -43.175010681152344, -41.46674346923828, -39.758480072021484, -38.05021667480469, -36.341949462890625, -34.63368606567383, -32.92542266845703, -31.21715545654297, -29.508892059326172, -27.800626754760742, -26.092361450195312, -24.384098052978516, -22.675832748413086, -20.967567443847656, -19.259302139282227, -17.551036834716797, -15.8427734375, -14.13450813293457, -12.42624282836914, -10.717978477478027, -9.009714126586914, -7.30145263671875, -5.5931878089904785, -3.884922981262207, -2.1766581535339355, -0.46839332580566406, 1.2398719787597656, 2.948136329650879, 4.656400680541992, 6.364665985107422, 8.072931289672852, 9.781195640563965, 11.489459991455078, 13.197725296020508, 14.905990600585938, 16.614253997802734, 18.322519302368164, 20.030784606933594, 21.739049911499023, 23.447315216064453, 25.15557861328125, 26.86384391784668, 28.57210922241211, 30.280372619628906, 31.988637924194336, 33.696903228759766, 35.40516662597656, 37.113433837890625, 38.82169723510742, 40.52996063232422, 42.23822784423828, 43.94649124145508, 45.654754638671875, 47.36302185058594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 10.0, 7.0, 11.0, 7.0, 14.0, 15.0, 11.0, 27.0, 14.0, 24.0, 22.0, 27.0, 28.0, 21.0, 38.0, 27.0, 39.0, 39.0, 35.0, 39.0, 38.0, 50.0, 37.0, 48.0, 38.0, 31.0, 32.0, 37.0, 32.0, 31.0, 19.0, 24.0, 21.0, 12.0, 15.0, 10.0, 14.0, 11.0, 13.0, 10.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.9375, -8.6708984375, -8.404296875, -8.1376953125, -7.87109375, -7.6044921875, -7.337890625, -7.0712890625, -6.8046875, -6.5380859375, -6.271484375, -6.0048828125, -5.73828125, -5.4716796875, -5.205078125, -4.9384765625, -4.671875, -4.4052734375, -4.138671875, -3.8720703125, -3.60546875, -3.3388671875, -3.072265625, -2.8056640625, -2.5390625, -2.2724609375, -2.005859375, -1.7392578125, -1.47265625, -1.2060546875, -0.939453125, -0.6728515625, -0.40625, -0.1396484375, 0.126953125, 0.3935546875, 0.66015625, 0.9267578125, 1.193359375, 1.4599609375, 1.7265625, 1.9931640625, 2.259765625, 2.5263671875, 2.79296875, 3.0595703125, 3.326171875, 3.5927734375, 3.859375, 4.1259765625, 4.392578125, 4.6591796875, 4.92578125, 5.1923828125, 5.458984375, 5.7255859375, 5.9921875, 6.2587890625, 6.525390625, 6.7919921875, 7.05859375, 7.3251953125, 7.591796875, 7.8583984375, 8.125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 8.0, 3.0, 15.0, 13.0, 12.0, 20.0, 20.0, 22.0, 31.0, 51.0, 46.0, 70.0, 87.0, 150.0, 206.0, 255.0, 308.0, 494.0, 3071.0, 4186576.0, 1112.0, 484.0, 313.0, 243.0, 177.0, 140.0, 82.0, 55.0, 53.0, 41.0, 21.0, 17.0, 21.0, 13.0, 14.0, 10.0, 15.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.375, -180.767578125, -174.16015625, -167.552734375, -160.9453125, -154.337890625, -147.73046875, -141.123046875, -134.515625, -127.908203125, -121.30078125, -114.693359375, -108.0859375, -101.478515625, -94.87109375, -88.263671875, -81.65625, -75.048828125, -68.44140625, -61.833984375, -55.2265625, -48.619140625, -42.01171875, -35.404296875, -28.796875, -22.189453125, -15.58203125, -8.974609375, -2.3671875, 4.240234375, 10.84765625, 17.455078125, 24.0625, 30.669921875, 37.27734375, 43.884765625, 50.4921875, 57.099609375, 63.70703125, 70.314453125, 76.921875, 83.529296875, 90.13671875, 96.744140625, 103.3515625, 109.958984375, 116.56640625, 123.173828125, 129.78125, 136.388671875, 142.99609375, 149.603515625, 156.2109375, 162.818359375, 169.42578125, 176.033203125, 182.640625, 189.248046875, 195.85546875, 202.462890625, 209.0703125, 215.677734375, 222.28515625, 228.892578125, 235.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 4.0, 3.0, 8.0, 11.0, 9.0, 13.0, 17.0, 28.0, 48.0, 55.0, 72.0, 109.0, 166.0, 265.0, 424.0, 676.0, 723.0, 532.0, 318.0, 231.0, 118.0, 61.0, 42.0, 47.0, 31.0, 14.0, 18.0, 12.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -18.0645751953125, -17.551025390625, -17.0374755859375, -16.52392578125, -16.0103759765625, -15.496826171875, -14.9832763671875, -14.4697265625, -13.9561767578125, -13.442626953125, -12.9290771484375, -12.41552734375, -11.9019775390625, -11.388427734375, -10.8748779296875, -10.361328125, -9.8477783203125, -9.334228515625, -8.8206787109375, -8.30712890625, -7.7935791015625, -7.280029296875, -6.7664794921875, -6.2529296875, -5.7393798828125, -5.225830078125, -4.7122802734375, -4.19873046875, -3.6851806640625, -3.171630859375, -2.6580810546875, -2.14453125, -1.6309814453125, -1.117431640625, -0.6038818359375, -0.09033203125, 0.4232177734375, 0.936767578125, 1.4503173828125, 1.9638671875, 2.4774169921875, 2.990966796875, 3.5045166015625, 4.01806640625, 4.5316162109375, 5.045166015625, 5.5587158203125, 6.072265625, 6.5858154296875, 7.099365234375, 7.6129150390625, 8.12646484375, 8.6400146484375, 9.153564453125, 9.6671142578125, 10.1806640625, 10.6942138671875, 11.207763671875, 11.7213134765625, 12.23486328125, 12.7484130859375, 13.261962890625, 13.7755126953125, 14.2890625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 7.0, 7.0, 15.0, 21.0, 23.0, 23.0, 31.0, 38.0, 33.0, 55.0, 66.0, 106.0, 282.0, 1729.0, 824935.0, 3363315.0, 2759.0, 317.0, 104.0, 71.0, 51.0, 45.0, 33.0, 21.0, 23.0, 23.0, 22.0, 13.0, 21.0, 14.0, 5.0, 8.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.5, -87.677734375, -84.85546875, -82.033203125, -79.2109375, -76.388671875, -73.56640625, -70.744140625, -67.921875, -65.099609375, -62.27734375, -59.455078125, -56.6328125, -53.810546875, -50.98828125, -48.166015625, -45.34375, -42.521484375, -39.69921875, -36.876953125, -34.0546875, -31.232421875, -28.41015625, -25.587890625, -22.765625, -19.943359375, -17.12109375, -14.298828125, -11.4765625, -8.654296875, -5.83203125, -3.009765625, -0.1875, 2.634765625, 5.45703125, 8.279296875, 11.1015625, 13.923828125, 16.74609375, 19.568359375, 22.390625, 25.212890625, 28.03515625, 30.857421875, 33.6796875, 36.501953125, 39.32421875, 42.146484375, 44.96875, 47.791015625, 50.61328125, 53.435546875, 56.2578125, 59.080078125, 61.90234375, 64.724609375, 67.546875, 70.369140625, 73.19140625, 76.013671875, 78.8359375, 81.658203125, 84.48046875, 87.302734375, 90.125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 9.0, 14.0, 29.0, 63.0, 92.0, 116.0, 157.0, 186.0, 132.0, 93.0, 74.0, 34.0, 7.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.989965438842773, -17.10354232788086, -15.217117309570312, -13.330694198608398, -11.444270133972168, -9.557846069335938, -7.671422958374023, -5.784998893737793, -3.8985748291015625, -2.012151002883911, -0.12572717666625977, 1.7606964111328125, 3.647120475769043, 5.533544540405273, 7.4199676513671875, 9.306391716003418, 11.192815780639648, 13.079239845275879, 14.96566390991211, 16.852087020874023, 18.738510131835938, 20.624935150146484, 22.5113582611084, 24.397781372070312, 26.28420639038086, 28.170629501342773, 30.05705451965332, 31.943477630615234, 33.82990264892578, 35.71632385253906, 37.60274887084961, 39.489173889160156, 41.37559509277344, 43.262020111083984, 45.148441314697266, 47.03486633300781, 48.92129135131836, 50.807716369628906, 52.69413757324219, 54.580562591552734, 56.46698760986328, 58.35341262817383, 60.23983383178711, 62.126258850097656, 64.01268005371094, 65.89910888671875, 67.78553009033203, 69.67195129394531, 71.55838012695312, 73.4448013305664, 75.33123016357422, 77.2176513671875, 79.10407257080078, 80.9905014038086, 82.87692260742188, 84.76334381103516, 86.64976501464844, 88.53618621826172, 90.42261505126953, 92.30903625488281, 94.1954574584961, 96.0818862915039, 97.96830749511719, 99.85472869873047, 101.74115753173828]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 8.0, 16.0, 12.0, 17.0, 14.0, 18.0, 23.0, 27.0, 20.0, 32.0, 30.0, 26.0, 36.0, 42.0, 35.0, 39.0, 31.0, 39.0, 39.0, 35.0, 41.0, 37.0, 44.0, 31.0, 37.0, 26.0, 22.0, 22.0, 23.0, 20.0, 23.0, 19.0, 14.0, 15.0, 13.0, 13.0, 18.0, 3.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-40.918212890625, -39.644020080566406, -38.36982345581055, -37.09563064575195, -35.82143783569336, -34.5472412109375, -33.273048400878906, -31.998855590820312, -30.724660873413086, -29.45046615600586, -28.176273345947266, -26.90207862854004, -25.627883911132812, -24.35369110107422, -23.079496383666992, -21.805301666259766, -20.531108856201172, -19.256914138793945, -17.98272132873535, -16.708526611328125, -15.434332847595215, -14.160139083862305, -12.885944366455078, -11.611750602722168, -10.337556838989258, -9.063363075256348, -7.789168834686279, -6.514974594116211, -5.240780830383301, -3.9665870666503906, -2.6923928260803223, -1.418198585510254, -0.14400482177734375, 1.1301891803741455, 2.4043831825256348, 3.678577184677124, 4.952771186828613, 6.226964950561523, 7.501159191131592, 8.77535343170166, 10.04954719543457, 11.32374095916748, 12.59793472290039, 13.872129440307617, 15.146323204040527, 16.420516967773438, 17.694711685180664, 18.96890640258789, 20.243099212646484, 21.51729393005371, 22.791486740112305, 24.06568145751953, 25.339874267578125, 26.61406898498535, 27.888263702392578, 29.162456512451172, 30.4366512298584, 31.710845947265625, 32.98503875732422, 34.25923156738281, 35.53342819213867, 36.807621002197266, 38.08181381225586, 39.35601043701172, 40.63020324707031]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 6.0, 9.0, 7.0, 14.0, 16.0, 8.0, 29.0, 28.0, 27.0, 31.0, 20.0, 22.0, 36.0, 35.0, 42.0, 44.0, 41.0, 49.0, 36.0, 35.0, 41.0, 43.0, 30.0, 46.0, 35.0, 28.0, 34.0, 26.0, 31.0, 28.0, 17.0, 13.0, 10.0, 12.0, 18.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.9296875, -9.66375732421875, -9.3978271484375, -9.13189697265625, -8.865966796875, -8.60003662109375, -8.3341064453125, -8.06817626953125, -7.80224609375, -7.53631591796875, -7.2703857421875, -7.00445556640625, -6.738525390625, -6.47259521484375, -6.2066650390625, -5.94073486328125, -5.6748046875, -5.40887451171875, -5.1429443359375, -4.87701416015625, -4.611083984375, -4.34515380859375, -4.0792236328125, -3.81329345703125, -3.54736328125, -3.28143310546875, -3.0155029296875, -2.74957275390625, -2.483642578125, -2.21771240234375, -1.9517822265625, -1.68585205078125, -1.419921875, -1.15399169921875, -0.8880615234375, -0.62213134765625, -0.356201171875, -0.09027099609375, 0.1756591796875, 0.44158935546875, 0.70751953125, 0.97344970703125, 1.2393798828125, 1.50531005859375, 1.771240234375, 2.03717041015625, 2.3031005859375, 2.56903076171875, 2.8349609375, 3.10089111328125, 3.3668212890625, 3.63275146484375, 3.898681640625, 4.16461181640625, 4.4305419921875, 4.69647216796875, 4.96240234375, 5.22833251953125, 5.4942626953125, 5.76019287109375, 6.026123046875, 6.29205322265625, 6.5579833984375, 6.82391357421875, 7.08984375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 19.0, 14.0, 29.0, 47.0, 55.0, 106.0, 105.0, 160.0, 242.0, 338.0, 515.0, 769.0, 1170.0, 1698.0, 2534.0, 3855.0, 5837.0, 8971.0, 13851.0, 22825.0, 37156.0, 63818.0, 120234.0, 232038.0, 237563.0, 125167.0, 65966.0, 38607.0, 23305.0, 14673.0, 9191.0, 6052.0, 3748.0, 2579.0, 1663.0, 1156.0, 767.0, 532.0, 381.0, 258.0, 169.0, 112.0, 97.0, 62.0, 32.0, 23.0, 21.0, 10.0, 8.0, 7.0, 9.0, 1.0, 2.0, 1.0, 3.0], "bins": [-1.2861328125, -1.2471923828125, -1.208251953125, -1.1693115234375, -1.13037109375, -1.0914306640625, -1.052490234375, -1.0135498046875, -0.974609375, -0.9356689453125, -0.896728515625, -0.8577880859375, -0.81884765625, -0.7799072265625, -0.740966796875, -0.7020263671875, -0.6630859375, -0.6241455078125, -0.585205078125, -0.5462646484375, -0.50732421875, -0.4683837890625, -0.429443359375, -0.3905029296875, -0.3515625, -0.3126220703125, -0.273681640625, -0.2347412109375, -0.19580078125, -0.1568603515625, -0.117919921875, -0.0789794921875, -0.0400390625, -0.0010986328125, 0.037841796875, 0.0767822265625, 0.11572265625, 0.1546630859375, 0.193603515625, 0.2325439453125, 0.271484375, 0.3104248046875, 0.349365234375, 0.3883056640625, 0.42724609375, 0.4661865234375, 0.505126953125, 0.5440673828125, 0.5830078125, 0.6219482421875, 0.660888671875, 0.6998291015625, 0.73876953125, 0.7777099609375, 0.816650390625, 0.8555908203125, 0.89453125, 0.9334716796875, 0.972412109375, 1.0113525390625, 1.05029296875, 1.0892333984375, 1.128173828125, 1.1671142578125, 1.2060546875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 5.0, 8.0, 14.0, 8.0, 10.0, 13.0, 13.0, 15.0, 18.0, 19.0, 21.0, 19.0, 28.0, 23.0, 26.0, 27.0, 27.0, 34.0, 32.0, 32.0, 45.0, 52.0, 1057.0, 39.0, 34.0, 35.0, 37.0, 27.0, 31.0, 27.0, 33.0, 22.0, 22.0, 21.0, 22.0, 16.0, 14.0, 18.0, 14.0, 14.0, 11.0, 9.0, 4.0, 1.0, 4.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 5.0], "bins": [-4.83984375, -4.69500732421875, -4.5501708984375, -4.40533447265625, -4.260498046875, -4.11566162109375, -3.9708251953125, -3.82598876953125, -3.68115234375, -3.53631591796875, -3.3914794921875, -3.24664306640625, -3.101806640625, -2.95697021484375, -2.8121337890625, -2.66729736328125, -2.5224609375, -2.37762451171875, -2.2327880859375, -2.08795166015625, -1.943115234375, -1.79827880859375, -1.6534423828125, -1.50860595703125, -1.36376953125, -1.21893310546875, -1.0740966796875, -0.92926025390625, -0.784423828125, -0.63958740234375, -0.4947509765625, -0.34991455078125, -0.205078125, -0.06024169921875, 0.0845947265625, 0.22943115234375, 0.374267578125, 0.51910400390625, 0.6639404296875, 0.80877685546875, 0.95361328125, 1.09844970703125, 1.2432861328125, 1.38812255859375, 1.532958984375, 1.67779541015625, 1.8226318359375, 1.96746826171875, 2.1123046875, 2.25714111328125, 2.4019775390625, 2.54681396484375, 2.691650390625, 2.83648681640625, 2.9813232421875, 3.12615966796875, 3.27099609375, 3.41583251953125, 3.5606689453125, 3.70550537109375, 3.850341796875, 3.99517822265625, 4.1400146484375, 4.28485107421875, 4.4296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 29.0, 27.0, 37.0, 81.0, 106.0, 151.0, 230.0, 280.0, 437.0, 559.0, 870.0, 1188.0, 1819.0, 2742.0, 4074.0, 5869.0, 8979.0, 13953.0, 21460.0, 34617.0, 55482.0, 97410.0, 180689.0, 1293192.0, 153727.0, 83459.0, 48787.0, 30271.0, 19365.0, 12322.0, 8167.0, 5441.0, 3562.0, 2450.0, 1618.0, 1092.0, 775.0, 538.0, 407.0, 271.0, 210.0, 118.0, 95.0, 56.0, 44.0, 26.0, 13.0, 9.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.97265625, -0.9406280517578125, -0.908599853515625, -0.8765716552734375, -0.84454345703125, -0.8125152587890625, -0.780487060546875, -0.7484588623046875, -0.7164306640625, -0.6844024658203125, -0.652374267578125, -0.6203460693359375, -0.58831787109375, -0.5562896728515625, -0.524261474609375, -0.4922332763671875, -0.460205078125, -0.4281768798828125, -0.396148681640625, -0.3641204833984375, -0.33209228515625, -0.3000640869140625, -0.268035888671875, -0.2360076904296875, -0.2039794921875, -0.1719512939453125, -0.139923095703125, -0.1078948974609375, -0.07586669921875, -0.0438385009765625, -0.011810302734375, 0.0202178955078125, 0.05224609375, 0.0842742919921875, 0.116302490234375, 0.1483306884765625, 0.18035888671875, 0.2123870849609375, 0.244415283203125, 0.2764434814453125, 0.3084716796875, 0.3404998779296875, 0.372528076171875, 0.4045562744140625, 0.43658447265625, 0.4686126708984375, 0.500640869140625, 0.5326690673828125, 0.564697265625, 0.5967254638671875, 0.628753662109375, 0.6607818603515625, 0.69281005859375, 0.7248382568359375, 0.756866455078125, 0.7888946533203125, 0.8209228515625, 0.8529510498046875, 0.884979248046875, 0.9170074462890625, 0.94903564453125, 0.9810638427734375, 1.013092041015625, 1.0451202392578125, 1.0771484375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 6.0, 9.0, 4.0, 9.0, 15.0, 24.0, 18.0, 20.0, 23.0, 29.0, 50.0, 37.0, 50.0, 69.0, 51.0, 71.0, 64.0, 57.0, 48.0, 50.0, 40.0, 60.0, 33.0, 31.0, 20.0, 21.0, 14.0, 8.0, 11.0, 6.0, 8.0, 9.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0024623870849609375, -0.0023832321166992188, -0.0023040771484375, -0.0022249221801757812, -0.0021457672119140625, -0.0020666122436523438, -0.001987457275390625, -0.0019083023071289062, -0.0018291473388671875, -0.0017499923706054688, -0.00167083740234375, -0.0015916824340820312, -0.0015125274658203125, -0.0014333724975585938, -0.001354217529296875, -0.0012750625610351562, -0.0011959075927734375, -0.0011167526245117188, -0.00103759765625, -0.0009584426879882812, -0.0008792877197265625, -0.0008001327514648438, -0.000720977783203125, -0.0006418228149414062, -0.0005626678466796875, -0.00048351287841796875, -0.00040435791015625, -0.00032520294189453125, -0.0002460479736328125, -0.00016689300537109375, -8.7738037109375e-05, -8.58306884765625e-06, 7.05718994140625e-05, 0.00014972686767578125, 0.0002288818359375, 0.00030803680419921875, 0.0003871917724609375, 0.00046634674072265625, 0.000545501708984375, 0.0006246566772460938, 0.0007038116455078125, 0.0007829666137695312, 0.00086212158203125, 0.0009412765502929688, 0.0010204315185546875, 0.0010995864868164062, 0.001178741455078125, 0.0012578964233398438, 0.0013370513916015625, 0.0014162063598632812, 0.001495361328125, 0.0015745162963867188, 0.0016536712646484375, 0.0017328262329101562, 0.001811981201171875, 0.0018911361694335938, 0.0019702911376953125, 0.0020494461059570312, 0.00212860107421875, 0.0022077560424804688, 0.0022869110107421875, 0.0023660659790039062, 0.002445220947265625, 0.0025243759155273438, 0.0026035308837890625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 1.0, 6.0, 10.0, 10.0, 15.0, 6.0, 16.0, 28.0, 24.0, 35.0, 46.0, 57.0, 97.0, 123.0, 173.0, 240.0, 408.0, 729.0, 4824.0, 999408.0, 39777.0, 978.0, 498.0, 284.0, 177.0, 146.0, 108.0, 72.0, 54.0, 53.0, 39.0, 16.0, 18.0, 11.0, 9.0, 8.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.04962158203125, -0.04810285568237305, -0.046584129333496094, -0.04506540298461914, -0.04354667663574219, -0.042027950286865234, -0.04050922393798828, -0.03899049758911133, -0.037471771240234375, -0.03595304489135742, -0.03443431854248047, -0.032915592193603516, -0.03139686584472656, -0.02987813949584961, -0.028359413146972656, -0.026840686798095703, -0.02532196044921875, -0.023803234100341797, -0.022284507751464844, -0.02076578140258789, -0.019247055053710938, -0.017728328704833984, -0.01620960235595703, -0.014690876007080078, -0.013172149658203125, -0.011653423309326172, -0.010134696960449219, -0.008615970611572266, -0.0070972442626953125, -0.005578517913818359, -0.004059791564941406, -0.002541065216064453, -0.0010223388671875, 0.0004963874816894531, 0.0020151138305664062, 0.0035338401794433594, 0.0050525665283203125, 0.006571292877197266, 0.008090019226074219, 0.009608745574951172, 0.011127471923828125, 0.012646198272705078, 0.014164924621582031, 0.015683650970458984, 0.017202377319335938, 0.01872110366821289, 0.020239830017089844, 0.021758556365966797, 0.02327728271484375, 0.024796009063720703, 0.026314735412597656, 0.02783346176147461, 0.029352188110351562, 0.030870914459228516, 0.03238964080810547, 0.03390836715698242, 0.035427093505859375, 0.03694581985473633, 0.03846454620361328, 0.039983272552490234, 0.04150199890136719, 0.04302072525024414, 0.044539451599121094, 0.04605817794799805, 0.047576904296875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 34.0, 258.0, 543.0, 169.0, 9.0, 0.0, 3.0], "bins": [-0.015030762180685997, -0.01477746944874525, -0.01452417578548193, -0.014270883053541183, -0.014017589390277863, -0.013764296658337116, -0.01351100392639637, -0.013257710263133049, -0.013004417531192303, -0.012751124799251556, -0.012497831135988235, -0.01224453840404749, -0.011991244740784168, -0.011737952008843422, -0.011484658345580101, -0.011231365613639355, -0.010978072881698608, -0.010724780149757862, -0.010471486486494541, -0.010218193754553795, -0.009964900091290474, -0.009711607359349728, -0.009458314627408981, -0.00920502096414566, -0.00895172730088234, -0.008698434568941593, -0.008445140905678272, -0.008191848173737526, -0.007938554510474205, -0.007685261778533459, -0.007431968580931425, -0.0071786753833293915, -0.006925382651388645, -0.0066720894537866116, -0.006418796256184578, -0.006165503524243832, -0.005912210326641798, -0.005658917129039764, -0.005405623931437731, -0.005152330733835697, -0.0048990375362336636, -0.00464574433863163, -0.004392451141029596, -0.004139157943427563, -0.0038858652114868164, -0.003632572013884783, -0.003379278816282749, -0.0031259856186807156, -0.0028726926539093256, -0.002619399456307292, -0.002366106491535902, -0.0021128132939338684, -0.0018595202127471566, -0.0016062271315604448, -0.0013529339339584112, -0.0010996408527716994, -0.0008463477715849876, -0.0005930546903982759, -0.00033976155100390315, -8.646841160953045e-05, 0.00016682466957718134, 0.00042011775076389313, 0.0006734109483659267, 0.0009267040295526385, 0.0011799971107393503]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 7.0, 12.0, 7.0, 13.0, 18.0, 15.0, 29.0, 23.0, 19.0, 21.0, 30.0, 38.0, 32.0, 34.0, 41.0, 44.0, 35.0, 32.0, 52.0, 43.0, 47.0, 48.0, 32.0, 43.0, 36.0, 30.0, 25.0, 40.0, 24.0, 22.0, 19.0, 14.0, 15.0, 16.0, 9.0, 5.0, 8.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0015001893043518066, -0.0014580516144633293, -0.001415913924574852, -0.0013737762346863747, -0.0013316385447978973, -0.00128950085490942, -0.0012473631650209427, -0.0012052254751324654, -0.001163087785243988, -0.0011209500953555107, -0.0010788124054670334, -0.001036674715578556, -0.0009945370256900787, -0.0009523993358016014, -0.0009102616459131241, -0.0008681239560246468, -0.0008259862661361694, -0.0007838485762476921, -0.0007417108863592148, -0.0006995731964707375, -0.0006574355065822601, -0.0006152978166937828, -0.0005731601268053055, -0.0005310224369168282, -0.0004888847470283508, -0.0004467470571398735, -0.0004046093672513962, -0.00036247167736291885, -0.00032033398747444153, -0.0002781962975859642, -0.00023605860769748688, -0.00019392091780900955, -0.00015178322792053223, -0.0001096455380320549, -6.750784814357758e-05, -2.537015825510025e-05, 1.6767531633377075e-05, 5.89052215218544e-05, 0.00010104291141033173, 0.00014318060129880905, 0.00018531829118728638, 0.0002274559810757637, 0.00026959367096424103, 0.00031173136085271835, 0.0003538690507411957, 0.000396006740629673, 0.00043814443051815033, 0.00048028212040662766, 0.000522419810295105, 0.0005645575001835823, 0.0006066951900720596, 0.000648832879960537, 0.0006909705698490143, 0.0007331082597374916, 0.0007752459496259689, 0.0008173836395144463, 0.0008595213294029236, 0.0009016590192914009, 0.0009437967091798782, 0.0009859343990683556, 0.0010280720889568329, 0.0010702097788453102, 0.0011123474687337875, 0.0011544851586222649, 0.0011966228485107422]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 10.0, 6.0, 9.0, 7.0, 14.0, 16.0, 8.0, 29.0, 28.0, 27.0, 31.0, 20.0, 22.0, 36.0, 35.0, 42.0, 44.0, 41.0, 49.0, 36.0, 35.0, 41.0, 43.0, 30.0, 46.0, 35.0, 28.0, 34.0, 26.0, 31.0, 28.0, 17.0, 13.0, 10.0, 12.0, 18.0, 11.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.9296875, -9.66375732421875, -9.3978271484375, -9.13189697265625, -8.865966796875, -8.60003662109375, -8.3341064453125, -8.06817626953125, -7.80224609375, -7.53631591796875, -7.2703857421875, -7.00445556640625, -6.738525390625, -6.47259521484375, -6.2066650390625, -5.94073486328125, -5.6748046875, -5.40887451171875, -5.1429443359375, -4.87701416015625, -4.611083984375, -4.34515380859375, -4.0792236328125, -3.81329345703125, -3.54736328125, -3.28143310546875, -3.0155029296875, -2.74957275390625, -2.483642578125, -2.21771240234375, -1.9517822265625, -1.68585205078125, -1.419921875, -1.15399169921875, -0.8880615234375, -0.62213134765625, -0.356201171875, -0.09027099609375, 0.1756591796875, 0.44158935546875, 0.70751953125, 0.97344970703125, 1.2393798828125, 1.50531005859375, 1.771240234375, 2.03717041015625, 2.3031005859375, 2.56903076171875, 2.8349609375, 3.10089111328125, 3.3668212890625, 3.63275146484375, 3.898681640625, 4.16461181640625, 4.4305419921875, 4.69647216796875, 4.96240234375, 5.22833251953125, 5.4942626953125, 5.76019287109375, 6.026123046875, 6.29205322265625, 6.5579833984375, 6.82391357421875, 7.08984375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 12.0, 15.0, 10.0, 30.0, 40.0, 47.0, 56.0, 83.0, 115.0, 153.0, 203.0, 285.0, 362.0, 415.0, 585.0, 822.0, 996.0, 1602.0, 3100.0, 8499.0, 38525.0, 213550.0, 565462.0, 167967.0, 30173.0, 7128.0, 2723.0, 1479.0, 981.0, 742.0, 563.0, 440.0, 348.0, 272.0, 192.0, 145.0, 120.0, 86.0, 53.0, 40.0, 37.0, 29.0, 19.0, 9.0, 11.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.203125, -13.76513671875, -13.3271484375, -12.88916015625, -12.451171875, -12.01318359375, -11.5751953125, -11.13720703125, -10.69921875, -10.26123046875, -9.8232421875, -9.38525390625, -8.947265625, -8.50927734375, -8.0712890625, -7.63330078125, -7.1953125, -6.75732421875, -6.3193359375, -5.88134765625, -5.443359375, -5.00537109375, -4.5673828125, -4.12939453125, -3.69140625, -3.25341796875, -2.8154296875, -2.37744140625, -1.939453125, -1.50146484375, -1.0634765625, -0.62548828125, -0.1875, 0.25048828125, 0.6884765625, 1.12646484375, 1.564453125, 2.00244140625, 2.4404296875, 2.87841796875, 3.31640625, 3.75439453125, 4.1923828125, 4.63037109375, 5.068359375, 5.50634765625, 5.9443359375, 6.38232421875, 6.8203125, 7.25830078125, 7.6962890625, 8.13427734375, 8.572265625, 9.01025390625, 9.4482421875, 9.88623046875, 10.32421875, 10.76220703125, 11.2001953125, 11.63818359375, 12.076171875, 12.51416015625, 12.9521484375, 13.39013671875, 13.828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 4.0, 7.0, 6.0, 4.0, 7.0, 8.0, 7.0, 11.0, 17.0, 15.0, 17.0, 19.0, 19.0, 37.0, 32.0, 32.0, 34.0, 40.0, 53.0, 90.0, 126.0, 315.0, 1472.0, 161.0, 96.0, 58.0, 56.0, 37.0, 37.0, 35.0, 27.0, 20.0, 19.0, 24.0, 19.0, 14.0, 12.0, 7.0, 11.0, 6.0, 5.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-20.625, -19.984375, -19.34375, -18.703125, -18.0625, -17.421875, -16.78125, -16.140625, -15.5, -14.859375, -14.21875, -13.578125, -12.9375, -12.296875, -11.65625, -11.015625, -10.375, -9.734375, -9.09375, -8.453125, -7.8125, -7.171875, -6.53125, -5.890625, -5.25, -4.609375, -3.96875, -3.328125, -2.6875, -2.046875, -1.40625, -0.765625, -0.125, 0.515625, 1.15625, 1.796875, 2.4375, 3.078125, 3.71875, 4.359375, 5.0, 5.640625, 6.28125, 6.921875, 7.5625, 8.203125, 8.84375, 9.484375, 10.125, 10.765625, 11.40625, 12.046875, 12.6875, 13.328125, 13.96875, 14.609375, 15.25, 15.890625, 16.53125, 17.171875, 17.8125, 18.453125, 19.09375, 19.734375, 20.375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 7.0, 9.0, 9.0, 7.0, 18.0, 17.0, 30.0, 37.0, 46.0, 69.0, 94.0, 131.0, 211.0, 361.0, 670.0, 2060.0, 2540297.0, 598117.0, 1849.0, 660.0, 341.0, 188.0, 110.0, 91.0, 68.0, 51.0, 27.0, 28.0, 16.0, 17.0, 13.0, 6.0, 2.0, 5.0, 3.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.25, -67.9052734375, -65.560546875, -63.2158203125, -60.87109375, -58.5263671875, -56.181640625, -53.8369140625, -51.4921875, -49.1474609375, -46.802734375, -44.4580078125, -42.11328125, -39.7685546875, -37.423828125, -35.0791015625, -32.734375, -30.3896484375, -28.044921875, -25.7001953125, -23.35546875, -21.0107421875, -18.666015625, -16.3212890625, -13.9765625, -11.6318359375, -9.287109375, -6.9423828125, -4.59765625, -2.2529296875, 0.091796875, 2.4365234375, 4.78125, 7.1259765625, 9.470703125, 11.8154296875, 14.16015625, 16.5048828125, 18.849609375, 21.1943359375, 23.5390625, 25.8837890625, 28.228515625, 30.5732421875, 32.91796875, 35.2626953125, 37.607421875, 39.9521484375, 42.296875, 44.6416015625, 46.986328125, 49.3310546875, 51.67578125, 54.0205078125, 56.365234375, 58.7099609375, 61.0546875, 63.3994140625, 65.744140625, 68.0888671875, 70.43359375, 72.7783203125, 75.123046875, 77.4677734375, 79.8125]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 104.0, 611.0, 272.0, 24.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.70269775390625, -81.51537322998047, -76.32804870605469, -71.14073181152344, -65.95340728759766, -60.766082763671875, -55.578758239746094, -50.39143753051758, -45.2041130065918, -40.016788482666016, -34.8294677734375, -29.64214324951172, -24.45482063293457, -19.267498016357422, -14.08017349243164, -8.892852783203125, -3.7055282592773438, 1.481794834136963, 6.6691179275512695, 11.856441497802734, 17.043764114379883, 22.23108673095703, 27.418411254882812, 32.60573196411133, 37.79305648803711, 42.98038101196289, 48.167701721191406, 53.35502624511719, 58.54235076904297, 63.729671478271484, 68.9169921875, 74.10431671142578, 79.29164123535156, 84.47896575927734, 89.66629028320312, 94.85360717773438, 100.04093170166016, 105.22825622558594, 110.41558074951172, 115.6029052734375, 120.79022216796875, 125.97754669189453, 131.1648712158203, 136.35218811035156, 141.53952026367188, 146.72683715820312, 151.91415405273438, 157.1014862060547, 162.288818359375, 167.47613525390625, 172.66346740722656, 177.8507843017578, 183.03811645507812, 188.22543334960938, 193.41275024414062, 198.60008239746094, 203.7873992919922, 208.97471618652344, 214.16204833984375, 219.349365234375, 224.5366973876953, 229.72401428222656, 234.91134643554688, 240.09866333007812, 245.28598022460938]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 12.0, 10.0, 10.0, 10.0, 13.0, 13.0, 23.0, 23.0, 22.0, 27.0, 32.0, 33.0, 44.0, 43.0, 39.0, 30.0, 37.0, 34.0, 46.0, 54.0, 46.0, 36.0, 37.0, 42.0, 38.0, 30.0, 27.0, 24.0, 25.0, 24.0, 16.0, 26.0, 13.0, 13.0, 16.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-70.62963104248047, -68.70393371582031, -66.77824401855469, -64.85254669189453, -62.92685317993164, -61.00115966796875, -59.07546615600586, -57.14977264404297, -55.22407531738281, -53.29838180541992, -51.37268829345703, -49.446990966796875, -47.521297454833984, -45.595603942871094, -43.6699104309082, -41.74421691894531, -39.81852340698242, -37.89282989501953, -35.96713638305664, -34.04144287109375, -32.115745544433594, -30.190052032470703, -28.264358520507812, -26.338665008544922, -24.4129695892334, -22.487276077270508, -20.561580657958984, -18.635887145996094, -16.710193634033203, -14.78449821472168, -12.858804702758789, -10.933110237121582, -9.007415771484375, -7.081721305847168, -5.156027317047119, -3.2303333282470703, -1.3046388626098633, 0.6210556030273438, 2.5467491149902344, 4.472443580627441, 6.398138046264648, 8.323832511901855, 10.249526977539062, 12.175220489501953, 14.10091495513916, 16.026609420776367, 17.952302932739258, 19.87799835205078, 21.803691864013672, 23.729385375976562, 25.655080795288086, 27.580774307250977, 29.5064697265625, 31.43216323852539, 33.35785675048828, 35.28355026245117, 37.20924377441406, 39.13493728637695, 41.060630798339844, 42.986328125, 44.91202163696289, 46.83771514892578, 48.76340866088867, 50.68910217285156, 52.61479949951172]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 8.0, 4.0, 12.0, 14.0, 14.0, 11.0, 13.0, 15.0, 11.0, 20.0, 22.0, 29.0, 27.0, 34.0, 27.0, 27.0, 41.0, 42.0, 37.0, 49.0, 36.0, 41.0, 43.0, 39.0, 34.0, 30.0, 26.0, 28.0, 22.0, 36.0, 31.0, 19.0, 16.0, 25.0, 25.0, 14.0, 15.0, 9.0, 13.0, 9.0, 2.0, 5.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-8.734375, -8.4910888671875, -8.247802734375, -8.0045166015625, -7.76123046875, -7.5179443359375, -7.274658203125, -7.0313720703125, -6.7880859375, -6.5447998046875, -6.301513671875, -6.0582275390625, -5.81494140625, -5.5716552734375, -5.328369140625, -5.0850830078125, -4.841796875, -4.5985107421875, -4.355224609375, -4.1119384765625, -3.86865234375, -3.6253662109375, -3.382080078125, -3.1387939453125, -2.8955078125, -2.6522216796875, -2.408935546875, -2.1656494140625, -1.92236328125, -1.6790771484375, -1.435791015625, -1.1925048828125, -0.94921875, -0.7059326171875, -0.462646484375, -0.2193603515625, 0.02392578125, 0.2672119140625, 0.510498046875, 0.7537841796875, 0.9970703125, 1.2403564453125, 1.483642578125, 1.7269287109375, 1.97021484375, 2.2135009765625, 2.456787109375, 2.7000732421875, 2.943359375, 3.1866455078125, 3.429931640625, 3.6732177734375, 3.91650390625, 4.1597900390625, 4.403076171875, 4.6463623046875, 4.8896484375, 5.1329345703125, 5.376220703125, 5.6195068359375, 5.86279296875, 6.1060791015625, 6.349365234375, 6.5926513671875, 6.8359375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 11.0, 5.0, 5.0, 16.0, 25.0, 18.0, 23.0, 36.0, 42.0, 41.0, 55.0, 73.0, 103.0, 135.0, 203.0, 350.0, 629.0, 1620.0, 4959.0, 25966.0, 442687.0, 2952451.0, 715213.0, 39665.0, 6184.0, 1795.0, 768.0, 395.0, 225.0, 140.0, 107.0, 63.0, 71.0, 38.0, 45.0, 22.0, 24.0, 14.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.489990234375, -18.80810546875, -18.126220703125, -17.4443359375, -16.762451171875, -16.08056640625, -15.398681640625, -14.716796875, -14.034912109375, -13.35302734375, -12.671142578125, -11.9892578125, -11.307373046875, -10.62548828125, -9.943603515625, -9.26171875, -8.579833984375, -7.89794921875, -7.216064453125, -6.5341796875, -5.852294921875, -5.17041015625, -4.488525390625, -3.806640625, -3.124755859375, -2.44287109375, -1.760986328125, -1.0791015625, -0.397216796875, 0.28466796875, 0.966552734375, 1.6484375, 2.330322265625, 3.01220703125, 3.694091796875, 4.3759765625, 5.057861328125, 5.73974609375, 6.421630859375, 7.103515625, 7.785400390625, 8.46728515625, 9.149169921875, 9.8310546875, 10.512939453125, 11.19482421875, 11.876708984375, 12.55859375, 13.240478515625, 13.92236328125, 14.604248046875, 15.2861328125, 15.968017578125, 16.64990234375, 17.331787109375, 18.013671875, 18.695556640625, 19.37744140625, 20.059326171875, 20.7412109375, 21.423095703125, 22.10498046875, 22.786865234375, 23.46875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 14.0, 13.0, 16.0, 36.0, 34.0, 50.0, 71.0, 85.0, 103.0, 145.0, 195.0, 292.0, 424.0, 548.0, 553.0, 391.0, 271.0, 207.0, 186.0, 111.0, 81.0, 69.0, 52.0, 28.0, 27.0, 21.0, 16.0, 12.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.59375, -18.1181640625, -17.642578125, -17.1669921875, -16.69140625, -16.2158203125, -15.740234375, -15.2646484375, -14.7890625, -14.3134765625, -13.837890625, -13.3623046875, -12.88671875, -12.4111328125, -11.935546875, -11.4599609375, -10.984375, -10.5087890625, -10.033203125, -9.5576171875, -9.08203125, -8.6064453125, -8.130859375, -7.6552734375, -7.1796875, -6.7041015625, -6.228515625, -5.7529296875, -5.27734375, -4.8017578125, -4.326171875, -3.8505859375, -3.375, -2.8994140625, -2.423828125, -1.9482421875, -1.47265625, -0.9970703125, -0.521484375, -0.0458984375, 0.4296875, 0.9052734375, 1.380859375, 1.8564453125, 2.33203125, 2.8076171875, 3.283203125, 3.7587890625, 4.234375, 4.7099609375, 5.185546875, 5.6611328125, 6.13671875, 6.6123046875, 7.087890625, 7.5634765625, 8.0390625, 8.5146484375, 8.990234375, 9.4658203125, 9.94140625, 10.4169921875, 10.892578125, 11.3681640625, 11.84375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 11.0, 13.0, 22.0, 28.0, 45.0, 79.0, 146.0, 299.0, 751.0, 2681.0, 45325.0, 3944409.0, 194252.0, 4319.0, 1056.0, 390.0, 193.0, 86.0, 67.0, 28.0, 27.0, 23.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.84375, -60.2431640625, -58.642578125, -57.0419921875, -55.44140625, -53.8408203125, -52.240234375, -50.6396484375, -49.0390625, -47.4384765625, -45.837890625, -44.2373046875, -42.63671875, -41.0361328125, -39.435546875, -37.8349609375, -36.234375, -34.6337890625, -33.033203125, -31.4326171875, -29.83203125, -28.2314453125, -26.630859375, -25.0302734375, -23.4296875, -21.8291015625, -20.228515625, -18.6279296875, -17.02734375, -15.4267578125, -13.826171875, -12.2255859375, -10.625, -9.0244140625, -7.423828125, -5.8232421875, -4.22265625, -2.6220703125, -1.021484375, 0.5791015625, 2.1796875, 3.7802734375, 5.380859375, 6.9814453125, 8.58203125, 10.1826171875, 11.783203125, 13.3837890625, 14.984375, 16.5849609375, 18.185546875, 19.7861328125, 21.38671875, 22.9873046875, 24.587890625, 26.1884765625, 27.7890625, 29.3896484375, 30.990234375, 32.5908203125, 34.19140625, 35.7919921875, 37.392578125, 38.9931640625, 40.59375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 66.0, 928.0, 22.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-255.44949340820312, -234.90330505371094, -214.3571014404297, -193.8109130859375, -173.26470947265625, -152.71852111816406, -132.17233276367188, -111.62612915039062, -91.07994079589844, -70.53374481201172, -49.987552642822266, -29.441360473632812, -8.895164489746094, 11.651031494140625, 32.19721984863281, 52.74342346191406, 73.28961181640625, 93.83580780029297, 114.38200378417969, 134.92819213867188, 155.47439575195312, 176.0205841064453, 196.5667724609375, 217.11297607421875, 237.65916442871094, 258.2053527832031, 278.7515563964844, 299.2977294921875, 319.84393310546875, 340.39013671875, 360.93634033203125, 381.4825439453125, 402.02874755859375, 422.574951171875, 443.1211242675781, 463.6673278808594, 484.2135314941406, 504.75970458984375, 525.305908203125, 545.8521118164062, 566.3983154296875, 586.9445190429688, 607.49072265625, 628.036865234375, 648.5830688476562, 669.1292724609375, 689.6754760742188, 710.2216796875, 730.767822265625, 751.3140258789062, 771.8602294921875, 792.4063720703125, 812.9525756835938, 833.498779296875, 854.0449829101562, 874.5911865234375, 895.1373901367188, 915.68359375, 936.2297973632812, 956.7760009765625, 977.3221435546875, 997.8683471679688, 1018.41455078125, 1038.960693359375, 1059.5069580078125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 4.0, 12.0, 18.0, 14.0, 17.0, 22.0, 22.0, 23.0, 37.0, 31.0, 32.0, 40.0, 46.0, 47.0, 30.0, 51.0, 44.0, 40.0, 49.0, 48.0, 29.0, 40.0, 37.0, 28.0, 35.0, 26.0, 29.0, 18.0, 20.0, 25.0, 12.0, 11.0, 10.0, 13.0, 9.0, 8.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.12510681152344, -52.422367095947266, -50.71963119506836, -49.01689147949219, -47.314151763916016, -45.611412048339844, -43.90867614746094, -42.205936431884766, -40.503196716308594, -38.80045700073242, -37.097721099853516, -35.394981384277344, -33.69224166870117, -31.989503860473633, -30.286766052246094, -28.584026336669922, -26.881290435791016, -25.178552627563477, -23.475812911987305, -21.773075103759766, -20.070335388183594, -18.367597579956055, -16.664859771728516, -14.96212100982666, -13.259382247924805, -11.55664348602295, -9.853904724121094, -8.151166915893555, -6.448428153991699, -4.745689392089844, -3.0429515838623047, -1.3402128219604492, 0.36252593994140625, 2.0652644634246826, 3.768002986907959, 5.470741271972656, 7.173480033874512, 8.876218795776367, 10.578956604003906, 12.281695365905762, 13.984434127807617, 15.687172889709473, 17.389911651611328, 19.092649459838867, 20.795387268066406, 22.498126983642578, 24.200864791870117, 25.903602600097656, 27.606342315673828, 29.309080123901367, 31.01181983947754, 32.71455764770508, 34.41729736328125, 36.120033264160156, 37.82277297973633, 39.5255126953125, 41.228248596191406, 42.93098831176758, 44.633724212646484, 46.336463928222656, 48.03920364379883, 49.741943359375, 51.444679260253906, 53.14741897583008, 54.85015869140625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 7.0, 6.0, 16.0, 19.0, 10.0, 19.0, 18.0, 23.0, 31.0, 31.0, 37.0, 25.0, 30.0, 35.0, 25.0, 43.0, 38.0, 39.0, 34.0, 38.0, 34.0, 35.0, 32.0, 38.0, 28.0, 24.0, 30.0, 34.0, 28.0, 27.0, 26.0, 17.0, 15.0, 13.0, 6.0, 10.0, 11.0, 11.0, 3.0, 8.0, 2.0, 0.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.0947265625, -5.900390625, -5.7060546875, -5.51171875, -5.3173828125, -5.123046875, -4.9287109375, -4.734375, -4.5400390625, -4.345703125, -4.1513671875, -3.95703125, -3.7626953125, -3.568359375, -3.3740234375, -3.1796875, -2.9853515625, -2.791015625, -2.5966796875, -2.40234375, -2.2080078125, -2.013671875, -1.8193359375, -1.625, -1.4306640625, -1.236328125, -1.0419921875, -0.84765625, -0.6533203125, -0.458984375, -0.2646484375, -0.0703125, 0.1240234375, 0.318359375, 0.5126953125, 0.70703125, 0.9013671875, 1.095703125, 1.2900390625, 1.484375, 1.6787109375, 1.873046875, 2.0673828125, 2.26171875, 2.4560546875, 2.650390625, 2.8447265625, 3.0390625, 3.2333984375, 3.427734375, 3.6220703125, 3.81640625, 4.0107421875, 4.205078125, 4.3994140625, 4.59375, 4.7880859375, 4.982421875, 5.1767578125, 5.37109375, 5.5654296875, 5.759765625, 5.9541015625, 6.1484375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 7.0, 13.0, 13.0, 13.0, 30.0, 40.0, 58.0, 96.0, 97.0, 172.0, 257.0, 355.0, 540.0, 839.0, 1230.0, 1794.0, 2704.0, 4144.0, 6283.0, 9665.0, 14809.0, 24173.0, 40022.0, 72024.0, 135111.0, 241710.0, 217100.0, 116577.0, 62148.0, 35808.0, 21592.0, 13486.0, 8656.0, 5741.0, 3668.0, 2500.0, 1607.0, 1095.0, 733.0, 515.0, 346.0, 227.0, 157.0, 127.0, 86.0, 59.0, 33.0, 27.0, 18.0, 16.0, 8.0, 9.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.99169921875, -0.962432861328125, -0.93316650390625, -0.903900146484375, -0.8746337890625, -0.845367431640625, -0.81610107421875, -0.786834716796875, -0.757568359375, -0.728302001953125, -0.69903564453125, -0.669769287109375, -0.6405029296875, -0.611236572265625, -0.58197021484375, -0.552703857421875, -0.5234375, -0.494171142578125, -0.46490478515625, -0.435638427734375, -0.4063720703125, -0.377105712890625, -0.34783935546875, -0.318572998046875, -0.289306640625, -0.260040283203125, -0.23077392578125, -0.201507568359375, -0.1722412109375, -0.142974853515625, -0.11370849609375, -0.084442138671875, -0.05517578125, -0.025909423828125, 0.00335693359375, 0.032623291015625, 0.0618896484375, 0.091156005859375, 0.12042236328125, 0.149688720703125, 0.178955078125, 0.208221435546875, 0.23748779296875, 0.266754150390625, 0.2960205078125, 0.325286865234375, 0.35455322265625, 0.383819580078125, 0.4130859375, 0.442352294921875, 0.47161865234375, 0.500885009765625, 0.5301513671875, 0.559417724609375, 0.58868408203125, 0.617950439453125, 0.647216796875, 0.676483154296875, 0.70574951171875, 0.735015869140625, 0.7642822265625, 0.793548583984375, 0.82281494140625, 0.852081298828125, 0.88134765625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 8.0, 20.0, 21.0, 28.0, 24.0, 26.0, 29.0, 31.0, 42.0, 50.0, 45.0, 41.0, 51.0, 36.0, 1076.0, 51.0, 47.0, 49.0, 34.0, 44.0, 34.0, 30.0, 28.0, 31.0, 30.0, 28.0, 12.0, 16.0, 11.0, 11.0, 3.0, 6.0, 6.0, 4.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.057861328125, -4.89306640625, -4.728271484375, -4.5634765625, -4.398681640625, -4.23388671875, -4.069091796875, -3.904296875, -3.739501953125, -3.57470703125, -3.409912109375, -3.2451171875, -3.080322265625, -2.91552734375, -2.750732421875, -2.5859375, -2.421142578125, -2.25634765625, -2.091552734375, -1.9267578125, -1.761962890625, -1.59716796875, -1.432373046875, -1.267578125, -1.102783203125, -0.93798828125, -0.773193359375, -0.6083984375, -0.443603515625, -0.27880859375, -0.114013671875, 0.05078125, 0.215576171875, 0.38037109375, 0.545166015625, 0.7099609375, 0.874755859375, 1.03955078125, 1.204345703125, 1.369140625, 1.533935546875, 1.69873046875, 1.863525390625, 2.0283203125, 2.193115234375, 2.35791015625, 2.522705078125, 2.6875, 2.852294921875, 3.01708984375, 3.181884765625, 3.3466796875, 3.511474609375, 3.67626953125, 3.841064453125, 4.005859375, 4.170654296875, 4.33544921875, 4.500244140625, 4.6650390625, 4.829833984375, 4.99462890625, 5.159423828125, 5.32421875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 4.0, 9.0, 13.0, 24.0, 32.0, 49.0, 65.0, 114.0, 166.0, 230.0, 368.0, 530.0, 848.0, 1229.0, 1824.0, 2943.0, 4540.0, 7182.0, 11775.0, 19017.0, 31536.0, 53413.0, 96875.0, 192010.0, 1316835.0, 157571.0, 80839.0, 45822.0, 27084.0, 16408.0, 9932.0, 6278.0, 3993.0, 2621.0, 1668.0, 1077.0, 744.0, 471.0, 352.0, 216.0, 136.0, 94.0, 72.0, 39.0, 30.0, 12.0, 12.0, 10.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.96240234375, -0.9335479736328125, -0.904693603515625, -0.8758392333984375, -0.84698486328125, -0.8181304931640625, -0.789276123046875, -0.7604217529296875, -0.7315673828125, -0.7027130126953125, -0.673858642578125, -0.6450042724609375, -0.61614990234375, -0.5872955322265625, -0.558441162109375, -0.5295867919921875, -0.500732421875, -0.4718780517578125, -0.443023681640625, -0.4141693115234375, -0.38531494140625, -0.3564605712890625, -0.327606201171875, -0.2987518310546875, -0.2698974609375, -0.2410430908203125, -0.212188720703125, -0.1833343505859375, -0.15447998046875, -0.1256256103515625, -0.096771240234375, -0.0679168701171875, -0.0390625, -0.0102081298828125, 0.018646240234375, 0.0475006103515625, 0.07635498046875, 0.1052093505859375, 0.134063720703125, 0.1629180908203125, 0.1917724609375, 0.2206268310546875, 0.249481201171875, 0.2783355712890625, 0.30718994140625, 0.3360443115234375, 0.364898681640625, 0.3937530517578125, 0.422607421875, 0.4514617919921875, 0.480316162109375, 0.5091705322265625, 0.53802490234375, 0.5668792724609375, 0.595733642578125, 0.6245880126953125, 0.6534423828125, 0.6822967529296875, 0.711151123046875, 0.7400054931640625, 0.76885986328125, 0.7977142333984375, 0.826568603515625, 0.8554229736328125, 0.88427734375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 3.0, 8.0, 8.0, 11.0, 10.0, 16.0, 25.0, 18.0, 27.0, 22.0, 29.0, 32.0, 54.0, 51.0, 53.0, 55.0, 43.0, 55.0, 58.0, 54.0, 44.0, 39.0, 36.0, 35.0, 27.0, 22.0, 21.0, 20.0, 19.0, 21.0, 14.0, 9.0, 9.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0017480850219726562, -0.0016879290342330933, -0.0016277730464935303, -0.0015676170587539673, -0.0015074610710144043, -0.0014473050832748413, -0.0013871490955352783, -0.0013269931077957153, -0.0012668371200561523, -0.0012066811323165894, -0.0011465251445770264, -0.0010863691568374634, -0.0010262131690979004, -0.0009660571813583374, -0.0009059011936187744, -0.0008457452058792114, -0.0007855892181396484, -0.0007254332304000854, -0.0006652772426605225, -0.0006051212549209595, -0.0005449652671813965, -0.0004848092794418335, -0.0004246532917022705, -0.0003644973039627075, -0.00030434131622314453, -0.00024418532848358154, -0.00018402934074401855, -0.00012387335300445557, -6.371736526489258e-05, -3.56137752532959e-06, 5.65946102142334e-05, 0.00011675059795379639, 0.00017690658569335938, 0.00023706257343292236, 0.00029721856117248535, 0.00035737454891204834, 0.00041753053665161133, 0.0004776865243911743, 0.0005378425121307373, 0.0005979984998703003, 0.0006581544876098633, 0.0007183104753494263, 0.0007784664630889893, 0.0008386224508285522, 0.0008987784385681152, 0.0009589344263076782, 0.0010190904140472412, 0.0010792464017868042, 0.0011394023895263672, 0.0011995583772659302, 0.0012597143650054932, 0.0013198703527450562, 0.0013800263404846191, 0.0014401823282241821, 0.0015003383159637451, 0.001560494303703308, 0.001620650291442871, 0.001680806279182434, 0.001740962266921997, 0.00180111825466156, 0.001861274242401123, 0.001921430230140686, 0.001981586217880249, 0.002041742205619812, 0.002101898193359375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 8.0, 4.0, 5.0, 13.0, 14.0, 12.0, 17.0, 25.0, 35.0, 42.0, 67.0, 68.0, 93.0, 132.0, 139.0, 277.0, 393.0, 699.0, 2378.0, 932495.0, 108628.0, 1244.0, 553.0, 352.0, 217.0, 150.0, 113.0, 83.0, 72.0, 42.0, 30.0, 29.0, 22.0, 15.0, 11.0, 11.0, 13.0, 10.0, 9.0, 2.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.044708251953125, -0.04345989227294922, -0.04221153259277344, -0.040963172912597656, -0.039714813232421875, -0.038466453552246094, -0.03721809387207031, -0.03596973419189453, -0.03472137451171875, -0.03347301483154297, -0.03222465515136719, -0.030976295471191406, -0.029727935791015625, -0.028479576110839844, -0.027231216430664062, -0.02598285675048828, -0.0247344970703125, -0.02348613739013672, -0.022237777709960938, -0.020989418029785156, -0.019741058349609375, -0.018492698669433594, -0.017244338989257812, -0.01599597930908203, -0.01474761962890625, -0.013499259948730469, -0.012250900268554688, -0.011002540588378906, -0.009754180908203125, -0.008505821228027344, -0.0072574615478515625, -0.006009101867675781, -0.0047607421875, -0.0035123825073242188, -0.0022640228271484375, -0.0010156631469726562, 0.000232696533203125, 0.0014810562133789062, 0.0027294158935546875, 0.003977775573730469, 0.00522613525390625, 0.006474494934082031, 0.0077228546142578125, 0.008971214294433594, 0.010219573974609375, 0.011467933654785156, 0.012716293334960938, 0.013964653015136719, 0.0152130126953125, 0.01646137237548828, 0.017709732055664062, 0.018958091735839844, 0.020206451416015625, 0.021454811096191406, 0.022703170776367188, 0.02395153045654297, 0.02519989013671875, 0.02644824981689453, 0.027696609497070312, 0.028944969177246094, 0.030193328857421875, 0.031441688537597656, 0.03269004821777344, 0.03393840789794922, 0.035186767578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 38.0, 577.0, 383.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011961775831878185, -0.01168915443122387, -0.011416533961892128, -0.011143912561237812, -0.01087129209190607, -0.010598670691251755, -0.010326050221920013, -0.010053428821265697, -0.009780808351933956, -0.00950818695127964, -0.009235566481947899, -0.008962945081293583, -0.008690324611961842, -0.008417703211307526, -0.008145082741975784, -0.007872461341321468, -0.00759984040632844, -0.007327219471335411, -0.007054598536342382, -0.006781977601349354, -0.006509356666356325, -0.0062367357313632965, -0.0059641143307089806, -0.005691493861377239, -0.005418872460722923, -0.005146251525729895, -0.004873630590736866, -0.004601009655743837, -0.004328388720750809, -0.00405576778575778, -0.0037831466179341078, -0.003510525682941079, -0.003237904980778694, -0.0029652840457856655, -0.002692663110792637, -0.0024200421757996082, -0.0021474212408065796, -0.0018748001893982291, -0.0016021791379898787, -0.00132955820299685, -0.0010569372680038214, -0.0007843163330107927, -0.0005116953398101032, -0.00023907434660941362, 3.354658838361502e-05, 0.00030616752337664366, 0.0005787885747849941, 0.0008514095097780228, 0.0011240304447710514, 0.00139665137976408, 0.0016692723147571087, 0.0019418933661654592, 0.002214514184743166, 0.0024871351197361946, 0.002759756287559867, 0.0030323772225528955, 0.003304998157545924, 0.003577619092538953, 0.0038502400275319815, 0.004122861195355654, 0.004395482130348682, 0.004668103065341711, 0.00494072400033474, 0.005213344935327768, 0.005485965870320797]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 8.0, 1.0, 8.0, 6.0, 8.0, 9.0, 16.0, 16.0, 22.0, 16.0, 26.0, 26.0, 37.0, 31.0, 33.0, 35.0, 29.0, 41.0, 29.0, 35.0, 43.0, 47.0, 55.0, 42.0, 39.0, 48.0, 21.0, 49.0, 28.0, 25.0, 27.0, 22.0, 26.0, 19.0, 14.0, 10.0, 18.0, 7.0, 8.0, 13.0, 10.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009658932685852051, -0.0009272890165448189, -0.0008886847645044327, -0.0008500805124640465, -0.0008114762604236603, -0.0007728720083832741, -0.0007342677563428879, -0.0006956635043025017, -0.0006570592522621155, -0.0006184550002217293, -0.0005798507481813431, -0.0005412464961409569, -0.0005026422441005707, -0.0004640379920601845, -0.0004254337400197983, -0.0003868294879794121, -0.0003482252359390259, -0.0003096209838986397, -0.0002710167318582535, -0.00023241247981786728, -0.00019380822777748108, -0.00015520397573709488, -0.00011659972369670868, -7.799547165632248e-05, -3.939121961593628e-05, -7.869675755500793e-07, 3.781728446483612e-05, 7.642153650522232e-05, 0.00011502578854560852, 0.00015363004058599472, 0.00019223429262638092, 0.00023083854466676712, 0.0002694427967071533, 0.0003080470487475395, 0.0003466513007879257, 0.0003852555528283119, 0.0004238598048686981, 0.0004624640569090843, 0.0005010683089494705, 0.0005396725609898567, 0.0005782768130302429, 0.0006168810650706291, 0.0006554853171110153, 0.0006940895691514015, 0.0007326938211917877, 0.0007712980732321739, 0.0008099023252725601, 0.0008485065773129463, 0.0008871108293533325, 0.0009257150813937187, 0.0009643193334341049, 0.0010029235854744911, 0.0010415278375148773, 0.0010801320895552635, 0.0011187363415956497, 0.001157340593636036, 0.0011959448456764221, 0.0012345490977168083, 0.0012731533497571945, 0.0013117576017975807, 0.001350361853837967, 0.0013889661058783531, 0.0014275703579187393, 0.0014661746099591255, 0.0015047788619995117]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 8.0, 7.0, 7.0, 5.0, 13.0, 7.0, 6.0, 16.0, 19.0, 10.0, 19.0, 18.0, 23.0, 31.0, 31.0, 37.0, 25.0, 30.0, 35.0, 25.0, 43.0, 38.0, 39.0, 34.0, 38.0, 34.0, 35.0, 32.0, 38.0, 28.0, 24.0, 30.0, 34.0, 28.0, 27.0, 26.0, 17.0, 15.0, 13.0, 6.0, 10.0, 11.0, 11.0, 3.0, 7.0, 3.0, 0.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.2890625, -6.0947265625, -5.900390625, -5.7060546875, -5.51171875, -5.3173828125, -5.123046875, -4.9287109375, -4.734375, -4.5400390625, -4.345703125, -4.1513671875, -3.95703125, -3.7626953125, -3.568359375, -3.3740234375, -3.1796875, -2.9853515625, -2.791015625, -2.5966796875, -2.40234375, -2.2080078125, -2.013671875, -1.8193359375, -1.625, -1.4306640625, -1.236328125, -1.0419921875, -0.84765625, -0.6533203125, -0.458984375, -0.2646484375, -0.0703125, 0.1240234375, 0.318359375, 0.5126953125, 0.70703125, 0.9013671875, 1.095703125, 1.2900390625, 1.484375, 1.6787109375, 1.873046875, 2.0673828125, 2.26171875, 2.4560546875, 2.650390625, 2.8447265625, 3.0390625, 3.2333984375, 3.427734375, 3.6220703125, 3.81640625, 4.0107421875, 4.205078125, 4.3994140625, 4.59375, 4.7880859375, 4.982421875, 5.1767578125, 5.37109375, 5.5654296875, 5.759765625, 5.9541015625, 6.1484375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 9.0, 4.0, 17.0, 21.0, 30.0, 38.0, 51.0, 81.0, 102.0, 105.0, 163.0, 233.0, 307.0, 423.0, 666.0, 868.0, 1246.0, 1838.0, 2869.0, 6120.0, 21018.0, 156219.0, 681606.0, 139995.0, 19743.0, 5770.0, 2902.0, 1892.0, 1132.0, 828.0, 612.0, 450.0, 324.0, 219.0, 189.0, 128.0, 95.0, 75.0, 36.0, 22.0, 19.0, 28.0, 15.0, 17.0, 8.0, 8.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-15.984375, -15.4921875, -15.0, -14.5078125, -14.015625, -13.5234375, -13.03125, -12.5390625, -12.046875, -11.5546875, -11.0625, -10.5703125, -10.078125, -9.5859375, -9.09375, -8.6015625, -8.109375, -7.6171875, -7.125, -6.6328125, -6.140625, -5.6484375, -5.15625, -4.6640625, -4.171875, -3.6796875, -3.1875, -2.6953125, -2.203125, -1.7109375, -1.21875, -0.7265625, -0.234375, 0.2578125, 0.75, 1.2421875, 1.734375, 2.2265625, 2.71875, 3.2109375, 3.703125, 4.1953125, 4.6875, 5.1796875, 5.671875, 6.1640625, 6.65625, 7.1484375, 7.640625, 8.1328125, 8.625, 9.1171875, 9.609375, 10.1015625, 10.59375, 11.0859375, 11.578125, 12.0703125, 12.5625, 13.0546875, 13.546875, 14.0390625, 14.53125, 15.0234375, 15.515625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 3.0, 3.0, 10.0, 13.0, 13.0, 12.0, 24.0, 14.0, 18.0, 28.0, 35.0, 38.0, 33.0, 38.0, 57.0, 72.0, 109.0, 227.0, 1587.0, 238.0, 93.0, 46.0, 37.0, 31.0, 34.0, 35.0, 29.0, 23.0, 23.0, 19.0, 20.0, 14.0, 13.0, 10.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-18.515625, -17.94482421875, -17.3740234375, -16.80322265625, -16.232421875, -15.66162109375, -15.0908203125, -14.52001953125, -13.94921875, -13.37841796875, -12.8076171875, -12.23681640625, -11.666015625, -11.09521484375, -10.5244140625, -9.95361328125, -9.3828125, -8.81201171875, -8.2412109375, -7.67041015625, -7.099609375, -6.52880859375, -5.9580078125, -5.38720703125, -4.81640625, -4.24560546875, -3.6748046875, -3.10400390625, -2.533203125, -1.96240234375, -1.3916015625, -0.82080078125, -0.25, 0.32080078125, 0.8916015625, 1.46240234375, 2.033203125, 2.60400390625, 3.1748046875, 3.74560546875, 4.31640625, 4.88720703125, 5.4580078125, 6.02880859375, 6.599609375, 7.17041015625, 7.7412109375, 8.31201171875, 8.8828125, 9.45361328125, 10.0244140625, 10.59521484375, 11.166015625, 11.73681640625, 12.3076171875, 12.87841796875, 13.44921875, 14.02001953125, 14.5908203125, 15.16162109375, 15.732421875, 16.30322265625, 16.8740234375, 17.44482421875, 18.015625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 2.0, 6.0, 10.0, 13.0, 5.0, 12.0, 17.0, 26.0, 31.0, 31.0, 38.0, 58.0, 71.0, 90.0, 140.0, 189.0, 319.0, 609.0, 1575.0, 39710.0, 3096200.0, 4163.0, 980.0, 459.0, 242.0, 179.0, 117.0, 84.0, 58.0, 72.0, 40.0, 32.0, 26.0, 17.0, 12.0, 15.0, 8.0, 14.0, 7.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-54.5625, -52.87255859375, -51.1826171875, -49.49267578125, -47.802734375, -46.11279296875, -44.4228515625, -42.73291015625, -41.04296875, -39.35302734375, -37.6630859375, -35.97314453125, -34.283203125, -32.59326171875, -30.9033203125, -29.21337890625, -27.5234375, -25.83349609375, -24.1435546875, -22.45361328125, -20.763671875, -19.07373046875, -17.3837890625, -15.69384765625, -14.00390625, -12.31396484375, -10.6240234375, -8.93408203125, -7.244140625, -5.55419921875, -3.8642578125, -2.17431640625, -0.484375, 1.20556640625, 2.8955078125, 4.58544921875, 6.275390625, 7.96533203125, 9.6552734375, 11.34521484375, 13.03515625, 14.72509765625, 16.4150390625, 18.10498046875, 19.794921875, 21.48486328125, 23.1748046875, 24.86474609375, 26.5546875, 28.24462890625, 29.9345703125, 31.62451171875, 33.314453125, 35.00439453125, 36.6943359375, 38.38427734375, 40.07421875, 41.76416015625, 43.4541015625, 45.14404296875, 46.833984375, 48.52392578125, 50.2138671875, 51.90380859375, 53.59375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 19.0, 82.0, 253.0, 365.0, 225.0, 43.0, 14.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.48968505859375, -102.51563262939453, -99.54158782958984, -96.56753540039062, -93.59349060058594, -90.61943817138672, -87.6453857421875, -84.67134094238281, -81.6972885131836, -78.72323608398438, -75.74919128417969, -72.77513885498047, -69.80109405517578, -66.82704162597656, -63.85299301147461, -60.878944396972656, -57.9048957824707, -54.93084716796875, -51.9567985534668, -48.982749938964844, -46.008697509765625, -43.03464889526367, -40.06060028076172, -37.0865478515625, -34.11250305175781, -31.13845443725586, -28.164403915405273, -25.19035530090332, -22.216304779052734, -19.24225616455078, -16.268207550048828, -13.294157028198242, -10.320106506347656, -7.346056938171387, -4.372007846832275, -1.397958755493164, 1.5760908126831055, 4.550140380859375, 7.524188995361328, 10.498239517211914, 13.472288131713867, 16.44633674621582, 19.420387268066406, 22.39443588256836, 25.368484497070312, 28.3425350189209, 31.31658363342285, 34.29063415527344, 37.26468276977539, 40.238731384277344, 43.2127799987793, 46.18682861328125, 49.16088104248047, 52.13492965698242, 55.108978271484375, 58.083030700683594, 61.05707550048828, 64.0311279296875, 67.00517272949219, 69.9792251586914, 72.9532699584961, 75.92732238769531, 78.9013671875, 81.87541961669922, 84.84947204589844]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 4.0, 4.0, 12.0, 19.0, 14.0, 13.0, 14.0, 22.0, 21.0, 33.0, 34.0, 25.0, 36.0, 40.0, 34.0, 42.0, 45.0, 34.0, 56.0, 41.0, 45.0, 51.0, 44.0, 43.0, 26.0, 33.0, 30.0, 24.0, 28.0, 24.0, 25.0, 13.0, 16.0, 10.0, 4.0, 5.0, 6.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-59.913509368896484, -58.10139083862305, -56.28927230834961, -54.477149963378906, -52.66503143310547, -50.85291290283203, -49.040794372558594, -47.228675842285156, -45.41655731201172, -43.60443878173828, -41.792320251464844, -39.980201721191406, -38.1680793762207, -36.355960845947266, -34.54384231567383, -32.73172378540039, -30.91960334777832, -29.107484817504883, -27.295364379882812, -25.483245849609375, -23.671127319335938, -21.8590087890625, -20.04688835144043, -18.234769821166992, -16.422649383544922, -14.610529899597168, -12.79841136932373, -10.986291885375977, -9.174173355102539, -7.362053871154785, -5.549934387207031, -3.7378158569335938, -1.9256973266601562, -0.113578200340271, 1.6985409259796143, 3.510660171508789, 5.322779178619385, 7.1348981857299805, 8.947017669677734, 10.759136199951172, 12.571255683898926, 14.38337516784668, 16.195493698120117, 18.007614135742188, 19.819732666015625, 21.631851196289062, 23.4439697265625, 25.256088256835938, 27.068208694458008, 28.880327224731445, 30.692447662353516, 32.50456619262695, 34.31668472290039, 36.12880325317383, 37.94092559814453, 39.75304412841797, 41.565162658691406, 43.377281188964844, 45.18939971923828, 47.00151824951172, 48.81364059448242, 50.62575912475586, 52.4378776550293, 54.249996185302734, 56.06211471557617]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 9.0, 5.0, 7.0, 13.0, 13.0, 14.0, 22.0, 18.0, 27.0, 35.0, 27.0, 18.0, 25.0, 31.0, 35.0, 35.0, 48.0, 40.0, 28.0, 34.0, 26.0, 41.0, 32.0, 37.0, 28.0, 40.0, 34.0, 22.0, 33.0, 27.0, 30.0, 15.0, 28.0, 17.0, 14.0, 16.0, 12.0, 10.0, 12.0, 6.0, 3.0, 4.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.35546875, -6.15106201171875, -5.9466552734375, -5.74224853515625, -5.537841796875, -5.33343505859375, -5.1290283203125, -4.92462158203125, -4.72021484375, -4.51580810546875, -4.3114013671875, -4.10699462890625, -3.902587890625, -3.69818115234375, -3.4937744140625, -3.28936767578125, -3.0849609375, -2.88055419921875, -2.6761474609375, -2.47174072265625, -2.267333984375, -2.06292724609375, -1.8585205078125, -1.65411376953125, -1.44970703125, -1.24530029296875, -1.0408935546875, -0.83648681640625, -0.632080078125, -0.42767333984375, -0.2232666015625, -0.01885986328125, 0.185546875, 0.38995361328125, 0.5943603515625, 0.79876708984375, 1.003173828125, 1.20758056640625, 1.4119873046875, 1.61639404296875, 1.82080078125, 2.02520751953125, 2.2296142578125, 2.43402099609375, 2.638427734375, 2.84283447265625, 3.0472412109375, 3.25164794921875, 3.4560546875, 3.66046142578125, 3.8648681640625, 4.06927490234375, 4.273681640625, 4.47808837890625, 4.6824951171875, 4.88690185546875, 5.09130859375, 5.29571533203125, 5.5001220703125, 5.70452880859375, 5.908935546875, 6.11334228515625, 6.3177490234375, 6.52215576171875, 6.7265625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 6.0, 12.0, 13.0, 14.0, 24.0, 34.0, 46.0, 79.0, 108.0, 131.0, 175.0, 241.0, 368.0, 517.0, 716.0, 1126.0, 1638.0, 2727.0, 4618.0, 9205.0, 21567.0, 72090.0, 315362.0, 1094449.0, 1680991.0, 728873.0, 181559.0, 44781.0, 15179.0, 6974.0, 3886.0, 2314.0, 1395.0, 923.0, 600.0, 439.0, 324.0, 219.0, 159.0, 122.0, 86.0, 65.0, 40.0, 35.0, 14.0, 9.0, 11.0, 9.0, 5.0, 6.0, 0.0, 3.0, 1.0, 2.0], "bins": [-9.4453125, -9.1700439453125, -8.894775390625, -8.6195068359375, -8.34423828125, -8.0689697265625, -7.793701171875, -7.5184326171875, -7.2431640625, -6.9678955078125, -6.692626953125, -6.4173583984375, -6.14208984375, -5.8668212890625, -5.591552734375, -5.3162841796875, -5.041015625, -4.7657470703125, -4.490478515625, -4.2152099609375, -3.93994140625, -3.6646728515625, -3.389404296875, -3.1141357421875, -2.8388671875, -2.5635986328125, -2.288330078125, -2.0130615234375, -1.73779296875, -1.4625244140625, -1.187255859375, -0.9119873046875, -0.63671875, -0.3614501953125, -0.086181640625, 0.1890869140625, 0.46435546875, 0.7396240234375, 1.014892578125, 1.2901611328125, 1.5654296875, 1.8406982421875, 2.115966796875, 2.3912353515625, 2.66650390625, 2.9417724609375, 3.217041015625, 3.4923095703125, 3.767578125, 4.0428466796875, 4.318115234375, 4.5933837890625, 4.86865234375, 5.1439208984375, 5.419189453125, 5.6944580078125, 5.9697265625, 6.2449951171875, 6.520263671875, 6.7955322265625, 7.07080078125, 7.3460693359375, 7.621337890625, 7.8966064453125, 8.171875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 19.0, 30.0, 49.0, 89.0, 156.0, 262.0, 459.0, 716.0, 843.0, 560.0, 359.0, 203.0, 131.0, 73.0, 54.0, 22.0, 18.0, 3.0, 7.0, 7.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.805419921875, -13.15771484375, -12.510009765625, -11.8623046875, -11.214599609375, -10.56689453125, -9.919189453125, -9.271484375, -8.623779296875, -7.97607421875, -7.328369140625, -6.6806640625, -6.032958984375, -5.38525390625, -4.737548828125, -4.08984375, -3.442138671875, -2.79443359375, -2.146728515625, -1.4990234375, -0.851318359375, -0.20361328125, 0.444091796875, 1.091796875, 1.739501953125, 2.38720703125, 3.034912109375, 3.6826171875, 4.330322265625, 4.97802734375, 5.625732421875, 6.2734375, 6.921142578125, 7.56884765625, 8.216552734375, 8.8642578125, 9.511962890625, 10.15966796875, 10.807373046875, 11.455078125, 12.102783203125, 12.75048828125, 13.398193359375, 14.0458984375, 14.693603515625, 15.34130859375, 15.989013671875, 16.63671875, 17.284423828125, 17.93212890625, 18.579833984375, 19.2275390625, 19.875244140625, 20.52294921875, 21.170654296875, 21.818359375, 22.466064453125, 23.11376953125, 23.761474609375, 24.4091796875, 25.056884765625, 25.70458984375, 26.352294921875, 27.0]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 8.0, 10.0, 6.0, 31.0, 38.0, 72.0, 124.0, 275.0, 579.0, 1417.0, 5360.0, 2686681.0, 1492535.0, 4670.0, 1364.0, 560.0, 242.0, 143.0, 53.0, 36.0, 21.0, 12.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.09375, -61.51513671875, -59.9365234375, -58.35791015625, -56.779296875, -55.20068359375, -53.6220703125, -52.04345703125, -50.46484375, -48.88623046875, -47.3076171875, -45.72900390625, -44.150390625, -42.57177734375, -40.9931640625, -39.41455078125, -37.8359375, -36.25732421875, -34.6787109375, -33.10009765625, -31.521484375, -29.94287109375, -28.3642578125, -26.78564453125, -25.20703125, -23.62841796875, -22.0498046875, -20.47119140625, -18.892578125, -17.31396484375, -15.7353515625, -14.15673828125, -12.578125, -10.99951171875, -9.4208984375, -7.84228515625, -6.263671875, -4.68505859375, -3.1064453125, -1.52783203125, 0.05078125, 1.62939453125, 3.2080078125, 4.78662109375, 6.365234375, 7.94384765625, 9.5224609375, 11.10107421875, 12.6796875, 14.25830078125, 15.8369140625, 17.41552734375, 18.994140625, 20.57275390625, 22.1513671875, 23.72998046875, 25.30859375, 26.88720703125, 28.4658203125, 30.04443359375, 31.623046875, 33.20166015625, 34.7802734375, 36.35888671875, 37.9375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 68.0, 689.0, 252.0, 2.0, 0.0, 2.0], "bins": [-572.313232421875, -562.7169799804688, -553.1207275390625, -543.5244750976562, -533.92822265625, -524.3319702148438, -514.7357177734375, -505.13946533203125, -495.543212890625, -485.94696044921875, -476.3507080078125, -466.75445556640625, -457.158203125, -447.56195068359375, -437.9656982421875, -428.36944580078125, -418.7732238769531, -409.1769714355469, -399.5807189941406, -389.9844665527344, -380.3882141113281, -370.7919616699219, -361.1957092285156, -351.5994873046875, -342.00323486328125, -332.406982421875, -322.81072998046875, -313.2144775390625, -303.61822509765625, -294.02197265625, -284.42572021484375, -274.8294677734375, -265.2332458496094, -255.63699340820312, -246.04074096679688, -236.44448852539062, -226.84823608398438, -217.25198364257812, -207.65574645996094, -198.0594940185547, -188.46324157714844, -178.8669891357422, -169.27073669433594, -159.6744842529297, -150.0782470703125, -140.48199462890625, -130.8857421875, -121.28948974609375, -111.6932373046875, -102.09698486328125, -92.500732421875, -82.90448760986328, -73.30823516845703, -63.71198272705078, -54.1157341003418, -44.51948547363281, -34.92323303222656, -25.326982498168945, -15.730731964111328, -6.134481430053711, 3.4617691040039062, 13.058021545410156, 22.65427017211914, 32.250518798828125, 41.846771240234375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 11.0, 7.0, 10.0, 14.0, 22.0, 27.0, 29.0, 16.0, 26.0, 33.0, 39.0, 43.0, 54.0, 49.0, 20.0, 51.0, 42.0, 60.0, 59.0, 47.0, 46.0, 42.0, 38.0, 34.0, 27.0, 26.0, 22.0, 30.0, 20.0, 15.0, 7.0, 5.0, 4.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-59.777099609375, -58.08835220336914, -56.39960479736328, -54.71086120605469, -53.02211380004883, -51.33336639404297, -49.64461898803711, -47.95587158203125, -46.267127990722656, -44.5783805847168, -42.88963317871094, -41.200889587402344, -39.512142181396484, -37.823394775390625, -36.134647369384766, -34.445899963378906, -32.75715255737305, -31.068405151367188, -29.37965965270996, -27.6909122467041, -26.002166748046875, -24.313419342041016, -22.624671936035156, -20.935924530029297, -19.24717903137207, -17.55843162536621, -15.869686126708984, -14.180938720703125, -12.492192268371582, -10.803445816040039, -9.11469841003418, -7.425951957702637, -5.737205505371094, -4.048459053039551, -2.3597121238708496, -0.6709651947021484, 1.0177812576293945, 2.7065277099609375, 4.395275115966797, 6.08402156829834, 7.772768020629883, 9.461514472961426, 11.150260925292969, 12.839008331298828, 14.527754783630371, 16.216501235961914, 17.905248641967773, 19.593994140625, 21.28274154663086, 22.97148895263672, 24.660234451293945, 26.348981857299805, 28.03772735595703, 29.72647476196289, 31.41522216796875, 33.10396957397461, 34.79271697998047, 36.48146438598633, 38.17021179199219, 39.85895538330078, 41.54770278930664, 43.2364501953125, 44.92519760131836, 46.61394500732422, 48.30268859863281]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 7.0, 11.0, 15.0, 17.0, 15.0, 15.0, 20.0, 13.0, 28.0, 29.0, 31.0, 32.0, 30.0, 44.0, 33.0, 34.0, 35.0, 42.0, 33.0, 33.0, 39.0, 38.0, 39.0, 34.0, 43.0, 30.0, 25.0, 19.0, 29.0, 19.0, 24.0, 15.0, 23.0, 20.0, 8.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-5.18359375, -5.02191162109375, -4.8602294921875, -4.69854736328125, -4.536865234375, -4.37518310546875, -4.2135009765625, -4.05181884765625, -3.89013671875, -3.72845458984375, -3.5667724609375, -3.40509033203125, -3.243408203125, -3.08172607421875, -2.9200439453125, -2.75836181640625, -2.5966796875, -2.43499755859375, -2.2733154296875, -2.11163330078125, -1.949951171875, -1.78826904296875, -1.6265869140625, -1.46490478515625, -1.30322265625, -1.14154052734375, -0.9798583984375, -0.81817626953125, -0.656494140625, -0.49481201171875, -0.3331298828125, -0.17144775390625, -0.009765625, 0.15191650390625, 0.3135986328125, 0.47528076171875, 0.636962890625, 0.79864501953125, 0.9603271484375, 1.12200927734375, 1.28369140625, 1.44537353515625, 1.6070556640625, 1.76873779296875, 1.930419921875, 2.09210205078125, 2.2537841796875, 2.41546630859375, 2.5771484375, 2.73883056640625, 2.9005126953125, 3.06219482421875, 3.223876953125, 3.38555908203125, 3.5472412109375, 3.70892333984375, 3.87060546875, 4.03228759765625, 4.1939697265625, 4.35565185546875, 4.517333984375, 4.67901611328125, 4.8406982421875, 5.00238037109375, 5.1640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 3.0, 9.0, 11.0, 20.0, 19.0, 25.0, 49.0, 78.0, 104.0, 147.0, 226.0, 290.0, 424.0, 636.0, 883.0, 1204.0, 1724.0, 2552.0, 3515.0, 5090.0, 7600.0, 11518.0, 17491.0, 27830.0, 45550.0, 77357.0, 143757.0, 242942.0, 194204.0, 103851.0, 58858.0, 35076.0, 21881.0, 13976.0, 9203.0, 6233.0, 4265.0, 2950.0, 2166.0, 1421.0, 1026.0, 687.0, 475.0, 338.0, 277.0, 185.0, 135.0, 72.0, 71.0, 50.0, 33.0, 20.0, 19.0, 16.0, 7.0, 2.0, 2.0, 4.0], "bins": [-0.7373046875, -0.7154541015625, -0.693603515625, -0.6717529296875, -0.64990234375, -0.6280517578125, -0.606201171875, -0.5843505859375, -0.5625, -0.5406494140625, -0.518798828125, -0.4969482421875, -0.47509765625, -0.4532470703125, -0.431396484375, -0.4095458984375, -0.3876953125, -0.3658447265625, -0.343994140625, -0.3221435546875, -0.30029296875, -0.2784423828125, -0.256591796875, -0.2347412109375, -0.212890625, -0.1910400390625, -0.169189453125, -0.1473388671875, -0.12548828125, -0.1036376953125, -0.081787109375, -0.0599365234375, -0.0380859375, -0.0162353515625, 0.005615234375, 0.0274658203125, 0.04931640625, 0.0711669921875, 0.093017578125, 0.1148681640625, 0.13671875, 0.1585693359375, 0.180419921875, 0.2022705078125, 0.22412109375, 0.2459716796875, 0.267822265625, 0.2896728515625, 0.3115234375, 0.3333740234375, 0.355224609375, 0.3770751953125, 0.39892578125, 0.4207763671875, 0.442626953125, 0.4644775390625, 0.486328125, 0.5081787109375, 0.530029296875, 0.5518798828125, 0.57373046875, 0.5955810546875, 0.617431640625, 0.6392822265625, 0.6611328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 5.0, 7.0, 7.0, 7.0, 15.0, 20.0, 17.0, 15.0, 23.0, 28.0, 30.0, 27.0, 37.0, 37.0, 45.0, 43.0, 42.0, 37.0, 46.0, 1069.0, 42.0, 30.0, 30.0, 28.0, 33.0, 31.0, 31.0, 29.0, 28.0, 25.0, 18.0, 24.0, 10.0, 17.0, 9.0, 13.0, 12.0, 7.0, 4.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.34765625, -3.240570068359375, -3.13348388671875, -3.026397705078125, -2.9193115234375, -2.812225341796875, -2.70513916015625, -2.598052978515625, -2.490966796875, -2.383880615234375, -2.27679443359375, -2.169708251953125, -2.0626220703125, -1.955535888671875, -1.84844970703125, -1.741363525390625, -1.63427734375, -1.527191162109375, -1.42010498046875, -1.313018798828125, -1.2059326171875, -1.098846435546875, -0.99176025390625, -0.884674072265625, -0.777587890625, -0.670501708984375, -0.56341552734375, -0.456329345703125, -0.3492431640625, -0.242156982421875, -0.13507080078125, -0.027984619140625, 0.0791015625, 0.186187744140625, 0.29327392578125, 0.400360107421875, 0.5074462890625, 0.614532470703125, 0.72161865234375, 0.828704833984375, 0.935791015625, 1.042877197265625, 1.14996337890625, 1.257049560546875, 1.3641357421875, 1.471221923828125, 1.57830810546875, 1.685394287109375, 1.79248046875, 1.899566650390625, 2.00665283203125, 2.113739013671875, 2.2208251953125, 2.327911376953125, 2.43499755859375, 2.542083740234375, 2.649169921875, 2.756256103515625, 2.86334228515625, 2.970428466796875, 3.0775146484375, 3.184600830078125, 3.29168701171875, 3.398773193359375, 3.505859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 9.0, 9.0, 17.0, 31.0, 36.0, 68.0, 85.0, 133.0, 157.0, 228.0, 355.0, 469.0, 672.0, 1089.0, 1483.0, 2191.0, 3192.0, 4766.0, 7217.0, 11068.0, 16962.0, 27024.0, 44358.0, 75640.0, 138781.0, 1286648.0, 202179.0, 109386.0, 60815.0, 36375.0, 22621.0, 14592.0, 9336.0, 5961.0, 4172.0, 2822.0, 1822.0, 1350.0, 971.0, 634.0, 428.0, 303.0, 229.0, 164.0, 84.0, 69.0, 37.0, 30.0, 31.0, 20.0, 7.0, 8.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.693359375, -0.6728515625, -0.65234375, -0.6318359375, -0.611328125, -0.5908203125, -0.5703125, -0.5498046875, -0.529296875, -0.5087890625, -0.48828125, -0.4677734375, -0.447265625, -0.4267578125, -0.40625, -0.3857421875, -0.365234375, -0.3447265625, -0.32421875, -0.3037109375, -0.283203125, -0.2626953125, -0.2421875, -0.2216796875, -0.201171875, -0.1806640625, -0.16015625, -0.1396484375, -0.119140625, -0.0986328125, -0.078125, -0.0576171875, -0.037109375, -0.0166015625, 0.00390625, 0.0244140625, 0.044921875, 0.0654296875, 0.0859375, 0.1064453125, 0.126953125, 0.1474609375, 0.16796875, 0.1884765625, 0.208984375, 0.2294921875, 0.25, 0.2705078125, 0.291015625, 0.3115234375, 0.33203125, 0.3525390625, 0.373046875, 0.3935546875, 0.4140625, 0.4345703125, 0.455078125, 0.4755859375, 0.49609375, 0.5166015625, 0.537109375, 0.5576171875, 0.578125, 0.5986328125, 0.619140625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 0.0, 4.0, 2.0, 7.0, 8.0, 7.0, 13.0, 7.0, 12.0, 16.0, 23.0, 26.0, 20.0, 26.0, 18.0, 41.0, 39.0, 42.0, 50.0, 47.0, 49.0, 61.0, 45.0, 49.0, 41.0, 55.0, 44.0, 40.0, 35.0, 35.0, 28.0, 14.0, 21.0, 21.0, 22.0, 12.0, 7.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00131988525390625, -0.0012701302766799927, -0.0012203752994537354, -0.001170620322227478, -0.0011208653450012207, -0.0010711103677749634, -0.001021355390548706, -0.0009716004133224487, -0.0009218454360961914, -0.0008720904588699341, -0.0008223354816436768, -0.0007725805044174194, -0.0007228255271911621, -0.0006730705499649048, -0.0006233155727386475, -0.0005735605955123901, -0.0005238056182861328, -0.0004740506410598755, -0.00042429566383361816, -0.00037454068660736084, -0.0003247857093811035, -0.0002750307321548462, -0.00022527575492858887, -0.00017552077770233154, -0.00012576580047607422, -7.60108232498169e-05, -2.625584602355957e-05, 2.3499131202697754e-05, 7.325410842895508e-05, 0.0001230090856552124, 0.00017276406288146973, 0.00022251904010772705, 0.0002722740173339844, 0.0003220289945602417, 0.000371783971786499, 0.00042153894901275635, 0.00047129392623901367, 0.000521048903465271, 0.0005708038806915283, 0.0006205588579177856, 0.000670313835144043, 0.0007200688123703003, 0.0007698237895965576, 0.0008195787668228149, 0.0008693337440490723, 0.0009190887212753296, 0.0009688436985015869, 0.0010185986757278442, 0.0010683536529541016, 0.0011181086301803589, 0.0011678636074066162, 0.0012176185846328735, 0.0012673735618591309, 0.0013171285390853882, 0.0013668835163116455, 0.0014166384935379028, 0.0014663934707641602, 0.0015161484479904175, 0.0015659034252166748, 0.0016156584024429321, 0.0016654133796691895, 0.0017151683568954468, 0.001764923334121704, 0.0018146783113479614, 0.0018644332885742188]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 5.0, 14.0, 18.0, 24.0, 29.0, 39.0, 53.0, 55.0, 69.0, 112.0, 133.0, 199.0, 257.0, 380.0, 612.0, 1264.0, 307306.0, 734440.0, 1467.0, 641.0, 384.0, 260.0, 178.0, 144.0, 99.0, 91.0, 58.0, 46.0, 45.0, 31.0, 25.0, 20.0, 11.0, 8.0, 12.0, 9.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.027557373046875, -0.026670217514038086, -0.025783061981201172, -0.024895906448364258, -0.024008750915527344, -0.02312159538269043, -0.022234439849853516, -0.0213472843170166, -0.020460128784179688, -0.019572973251342773, -0.01868581771850586, -0.017798662185668945, -0.01691150665283203, -0.016024351119995117, -0.015137195587158203, -0.014250040054321289, -0.013362884521484375, -0.012475728988647461, -0.011588573455810547, -0.010701417922973633, -0.009814262390136719, -0.008927106857299805, -0.00803995132446289, -0.0071527957916259766, -0.0062656402587890625, -0.0053784847259521484, -0.004491329193115234, -0.0036041736602783203, -0.0027170181274414062, -0.0018298625946044922, -0.0009427070617675781, -5.555152893066406e-05, 0.00083160400390625, 0.001718759536743164, 0.002605915069580078, 0.003493070602416992, 0.004380226135253906, 0.00526738166809082, 0.006154537200927734, 0.0070416927337646484, 0.007928848266601562, 0.008816003799438477, 0.00970315933227539, 0.010590314865112305, 0.011477470397949219, 0.012364625930786133, 0.013251781463623047, 0.014138936996459961, 0.015026092529296875, 0.01591324806213379, 0.016800403594970703, 0.017687559127807617, 0.01857471466064453, 0.019461870193481445, 0.02034902572631836, 0.021236181259155273, 0.022123336791992188, 0.0230104923248291, 0.023897647857666016, 0.02478480339050293, 0.025671958923339844, 0.026559114456176758, 0.027446269989013672, 0.028333425521850586, 0.0292205810546875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 31.0, 149.0, 338.0, 315.0, 133.0, 30.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002386812586337328, -0.0023185203317552805, -0.0022502278443425894, -0.002181935589760542, -0.002113643102347851, -0.0020453508477658033, -0.0019770583603531122, -0.0019087661057710648, -0.0018404737347736955, -0.0017721813637763262, -0.0017038889927789569, -0.0016355966217815876, -0.0015673043671995401, -0.001499011879786849, -0.0014307196252048016, -0.0013624272542074323, -0.001294134883210063, -0.0012258425122126937, -0.0011575501412153244, -0.0010892577702179551, -0.0010209653992205858, -0.0009526730864308774, -0.0008843807736411691, -0.0008160884026437998, -0.0007477960316464305, -0.0006795036606490612, -0.0006112112896516919, -0.0005429189768619835, -0.00047462660586461425, -0.00040633423486724496, -0.0003380418929737061, -0.0002697495510801673, -0.00020145741291344166, -0.0001331650564679876, -6.487270002253354e-05, 3.419656422920525e-06, 7.171201286837459e-05, 0.00014000438386574388, 0.0002082967257592827, 0.00027658906765282154, 0.00034488143865019083, 0.0004131738096475601, 0.00048146615154109895, 0.0005497584934346378, 0.0006180508644320071, 0.0006863432354293764, 0.0007546355482190847, 0.000822927919216454, 0.0008912202902138233, 0.0009595126612111926, 0.001027805032208562, 0.0010960974032059312, 0.0011643897742033005, 0.001232682028785348, 0.0013009743997827172, 0.0013692667707800865, 0.0014375591417774558, 0.001505851512774825, 0.0015741438837721944, 0.0016424362547695637, 0.0017107285093516111, 0.0017790209967643023, 0.0018473132513463497, 0.001915605622343719, 0.0019838979933410883]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 6.0, 9.0, 13.0, 8.0, 15.0, 17.0, 16.0, 20.0, 27.0, 30.0, 24.0, 26.0, 29.0, 40.0, 36.0, 37.0, 52.0, 38.0, 36.0, 45.0, 28.0, 40.0, 44.0, 35.0, 36.0, 32.0, 24.0, 34.0, 21.0, 30.0, 22.0, 20.0, 16.0, 15.0, 19.0, 16.0, 8.0, 7.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007917284965515137, -0.000765705481171608, -0.0007396824657917023, -0.0007136594504117966, -0.0006876364350318909, -0.0006616134196519852, -0.0006355904042720795, -0.0006095673888921738, -0.0005835443735122681, -0.0005575213581323624, -0.0005314983427524567, -0.000505475327372551, -0.00047945231199264526, -0.00045342929661273956, -0.00042740628123283386, -0.00040138326585292816, -0.00037536025047302246, -0.00034933723509311676, -0.00032331421971321106, -0.00029729120433330536, -0.00027126818895339966, -0.00024524517357349396, -0.00021922215819358826, -0.00019319914281368256, -0.00016717612743377686, -0.00014115311205387115, -0.00011513009667396545, -8.910708129405975e-05, -6.308406591415405e-05, -3.706105053424835e-05, -1.1038035154342651e-05, 1.498498022556305e-05, 4.100799560546875e-05, 6.703101098537445e-05, 9.305402636528015e-05, 0.00011907704174518585, 0.00014510005712509155, 0.00017112307250499725, 0.00019714608788490295, 0.00022316910326480865, 0.00024919211864471436, 0.00027521513402462006, 0.00030123814940452576, 0.00032726116478443146, 0.00035328418016433716, 0.00037930719554424286, 0.00040533021092414856, 0.00043135322630405426, 0.00045737624168395996, 0.00048339925706386566, 0.0005094222724437714, 0.0005354452878236771, 0.0005614683032035828, 0.0005874913185834885, 0.0006135143339633942, 0.0006395373493432999, 0.0006655603647232056, 0.0006915833801031113, 0.000717606395483017, 0.0007436294108629227, 0.0007696524262428284, 0.0007956754416227341, 0.0008216984570026398, 0.0008477214723825455, 0.0008737444877624512]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 8.0, 7.0, 11.0, 15.0, 17.0, 15.0, 15.0, 20.0, 13.0, 28.0, 29.0, 31.0, 32.0, 30.0, 44.0, 33.0, 34.0, 35.0, 42.0, 33.0, 33.0, 39.0, 38.0, 39.0, 34.0, 43.0, 30.0, 25.0, 19.0, 29.0, 19.0, 24.0, 15.0, 23.0, 20.0, 8.0, 9.0, 9.0, 8.0, 7.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0], "bins": [-5.18359375, -5.02191162109375, -4.8602294921875, -4.69854736328125, -4.536865234375, -4.37518310546875, -4.2135009765625, -4.05181884765625, -3.89013671875, -3.72845458984375, -3.5667724609375, -3.40509033203125, -3.243408203125, -3.08172607421875, -2.9200439453125, -2.75836181640625, -2.5966796875, -2.43499755859375, -2.2733154296875, -2.11163330078125, -1.949951171875, -1.78826904296875, -1.6265869140625, -1.46490478515625, -1.30322265625, -1.14154052734375, -0.9798583984375, -0.81817626953125, -0.656494140625, -0.49481201171875, -0.3331298828125, -0.17144775390625, -0.009765625, 0.15191650390625, 0.3135986328125, 0.47528076171875, 0.636962890625, 0.79864501953125, 0.9603271484375, 1.12200927734375, 1.28369140625, 1.44537353515625, 1.6070556640625, 1.76873779296875, 1.930419921875, 2.09210205078125, 2.2537841796875, 2.41546630859375, 2.5771484375, 2.73883056640625, 2.9005126953125, 3.06219482421875, 3.223876953125, 3.38555908203125, 3.5472412109375, 3.70892333984375, 3.87060546875, 4.03228759765625, 4.1939697265625, 4.35565185546875, 4.517333984375, 4.67901611328125, 4.8406982421875, 5.00238037109375, 5.1640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 16.0, 30.0, 28.0, 53.0, 63.0, 79.0, 102.0, 138.0, 188.0, 255.0, 451.0, 635.0, 1093.0, 1865.0, 3850.0, 9967.0, 31448.0, 144473.0, 612458.0, 183214.0, 37003.0, 11409.0, 4286.0, 2108.0, 1123.0, 688.0, 445.0, 296.0, 222.0, 129.0, 101.0, 72.0, 50.0, 39.0, 37.0, 19.0, 23.0, 10.0, 18.0, 10.0, 4.0, 8.0, 2.0, 3.0, 7.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.9295654296875, -8.616943359375, -8.3043212890625, -7.99169921875, -7.6790771484375, -7.366455078125, -7.0538330078125, -6.7412109375, -6.4285888671875, -6.115966796875, -5.8033447265625, -5.49072265625, -5.1781005859375, -4.865478515625, -4.5528564453125, -4.240234375, -3.9276123046875, -3.614990234375, -3.3023681640625, -2.98974609375, -2.6771240234375, -2.364501953125, -2.0518798828125, -1.7392578125, -1.4266357421875, -1.114013671875, -0.8013916015625, -0.48876953125, -0.1761474609375, 0.136474609375, 0.4490966796875, 0.76171875, 1.0743408203125, 1.386962890625, 1.6995849609375, 2.01220703125, 2.3248291015625, 2.637451171875, 2.9500732421875, 3.2626953125, 3.5753173828125, 3.887939453125, 4.2005615234375, 4.51318359375, 4.8258056640625, 5.138427734375, 5.4510498046875, 5.763671875, 6.0762939453125, 6.388916015625, 6.7015380859375, 7.01416015625, 7.3267822265625, 7.639404296875, 7.9520263671875, 8.2646484375, 8.5772705078125, 8.889892578125, 9.2025146484375, 9.51513671875, 9.8277587890625, 10.140380859375, 10.4530029296875, 10.765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 7.0, 13.0, 13.0, 15.0, 12.0, 17.0, 21.0, 28.0, 30.0, 33.0, 42.0, 57.0, 82.0, 125.0, 1651.0, 441.0, 90.0, 58.0, 50.0, 55.0, 44.0, 41.0, 23.0, 20.0, 16.0, 12.0, 10.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-18.5625, -17.98046875, -17.3984375, -16.81640625, -16.234375, -15.65234375, -15.0703125, -14.48828125, -13.90625, -13.32421875, -12.7421875, -12.16015625, -11.578125, -10.99609375, -10.4140625, -9.83203125, -9.25, -8.66796875, -8.0859375, -7.50390625, -6.921875, -6.33984375, -5.7578125, -5.17578125, -4.59375, -4.01171875, -3.4296875, -2.84765625, -2.265625, -1.68359375, -1.1015625, -0.51953125, 0.0625, 0.64453125, 1.2265625, 1.80859375, 2.390625, 2.97265625, 3.5546875, 4.13671875, 4.71875, 5.30078125, 5.8828125, 6.46484375, 7.046875, 7.62890625, 8.2109375, 8.79296875, 9.375, 9.95703125, 10.5390625, 11.12109375, 11.703125, 12.28515625, 12.8671875, 13.44921875, 14.03125, 14.61328125, 15.1953125, 15.77734375, 16.359375, 16.94140625, 17.5234375, 18.10546875, 18.6875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 12.0, 10.0, 18.0, 16.0, 26.0, 35.0, 40.0, 64.0, 113.0, 226.0, 430.0, 1158.0, 203593.0, 2937381.0, 1407.0, 506.0, 273.0, 136.0, 67.0, 41.0, 21.0, 25.0, 24.0, 16.0, 14.0, 10.0, 9.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.34375, -52.6494140625, -50.955078125, -49.2607421875, -47.56640625, -45.8720703125, -44.177734375, -42.4833984375, -40.7890625, -39.0947265625, -37.400390625, -35.7060546875, -34.01171875, -32.3173828125, -30.623046875, -28.9287109375, -27.234375, -25.5400390625, -23.845703125, -22.1513671875, -20.45703125, -18.7626953125, -17.068359375, -15.3740234375, -13.6796875, -11.9853515625, -10.291015625, -8.5966796875, -6.90234375, -5.2080078125, -3.513671875, -1.8193359375, -0.125, 1.5693359375, 3.263671875, 4.9580078125, 6.65234375, 8.3466796875, 10.041015625, 11.7353515625, 13.4296875, 15.1240234375, 16.818359375, 18.5126953125, 20.20703125, 21.9013671875, 23.595703125, 25.2900390625, 26.984375, 28.6787109375, 30.373046875, 32.0673828125, 33.76171875, 35.4560546875, 37.150390625, 38.8447265625, 40.5390625, 42.2333984375, 43.927734375, 45.6220703125, 47.31640625, 49.0107421875, 50.705078125, 52.3994140625, 54.09375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 50.0, 182.0, 464.0, 257.0, 46.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.63360595703125, -14.008525848388672, -12.38344669342041, -10.758367538452148, -9.13328742980957, -7.508207321166992, -5.8831281661987305, -4.258049011230469, -2.6329689025878906, -1.0078892707824707, 0.6171903610229492, 2.242269992828369, 3.867349624633789, 5.492429733276367, 7.117508888244629, 8.74258804321289, 10.367668151855469, 11.992748260498047, 13.617827415466309, 15.24290657043457, 16.86798667907715, 18.493066787719727, 20.118144989013672, 21.74322509765625, 23.368305206298828, 24.993385314941406, 26.618465423583984, 28.24354362487793, 29.868623733520508, 31.493703842163086, 33.11878204345703, 34.74386215209961, 36.36894226074219, 37.994022369384766, 39.619102478027344, 41.24418258666992, 42.8692626953125, 44.49433898925781, 46.11941909790039, 47.74449920654297, 49.36957931518555, 50.994659423828125, 52.6197395324707, 54.24481964111328, 55.869895935058594, 57.49497985839844, 59.12005615234375, 60.74513626098633, 62.370216369628906, 63.995296478271484, 65.62037658691406, 67.24545288085938, 68.87053680419922, 70.49561309814453, 72.12069702148438, 73.74577331542969, 75.370849609375, 76.99592590332031, 78.62100982666016, 80.24608612060547, 81.87117004394531, 83.49624633789062, 85.12133026123047, 86.74640655517578, 88.37149047851562]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 14.0, 16.0, 10.0, 27.0, 33.0, 40.0, 37.0, 46.0, 38.0, 56.0, 49.0, 44.0, 48.0, 63.0, 61.0, 57.0, 44.0, 55.0, 39.0, 27.0, 39.0, 32.0, 25.0, 20.0, 18.0, 9.0, 12.0, 10.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.127288818359375, -33.85502243041992, -32.582759857177734, -31.31049346923828, -30.03822898864746, -28.76596450805664, -27.493698120117188, -26.221433639526367, -24.949169158935547, -23.676904678344727, -22.404640197753906, -21.132373809814453, -19.860109329223633, -18.587844848632812, -17.31557846069336, -16.04331398010254, -14.771049499511719, -13.498785018920898, -12.226519584655762, -10.954254150390625, -9.681989669799805, -8.409725189208984, -7.137459754943848, -5.865194320678711, -4.592929840087891, -3.320664882659912, -2.0483999252319336, -0.7761349678039551, 0.49612998962402344, 1.768394947052002, 3.0406599044799805, 4.312925338745117, 5.585186004638672, 6.85745096206665, 8.129715919494629, 9.401981353759766, 10.674245834350586, 11.946510314941406, 13.218775749206543, 14.49104118347168, 15.7633056640625, 17.03557014465332, 18.30783462524414, 19.580101013183594, 20.852365493774414, 22.124629974365234, 23.396896362304688, 24.669160842895508, 25.941425323486328, 27.21368980407715, 28.48595428466797, 29.758220672607422, 31.030485153198242, 32.30274963378906, 33.575016021728516, 34.84728240966797, 36.119544982910156, 37.39181137084961, 38.6640739440918, 39.93634033203125, 41.20860290527344, 42.48086929321289, 43.753135681152344, 45.02539825439453, 46.297664642333984]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 1.0, 8.0, 11.0, 10.0, 14.0, 13.0, 23.0, 27.0, 22.0, 30.0, 29.0, 37.0, 27.0, 49.0, 57.0, 51.0, 43.0, 44.0, 39.0, 43.0, 42.0, 56.0, 47.0, 33.0, 27.0, 32.0, 43.0, 28.0, 21.0, 18.0, 14.0, 13.0, 6.0, 3.0, 9.0, 5.0, 5.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.046875, -5.815673828125, -5.58447265625, -5.353271484375, -5.1220703125, -4.890869140625, -4.65966796875, -4.428466796875, -4.197265625, -3.966064453125, -3.73486328125, -3.503662109375, -3.2724609375, -3.041259765625, -2.81005859375, -2.578857421875, -2.34765625, -2.116455078125, -1.88525390625, -1.654052734375, -1.4228515625, -1.191650390625, -0.96044921875, -0.729248046875, -0.498046875, -0.266845703125, -0.03564453125, 0.195556640625, 0.4267578125, 0.657958984375, 0.88916015625, 1.120361328125, 1.3515625, 1.582763671875, 1.81396484375, 2.045166015625, 2.2763671875, 2.507568359375, 2.73876953125, 2.969970703125, 3.201171875, 3.432373046875, 3.66357421875, 3.894775390625, 4.1259765625, 4.357177734375, 4.58837890625, 4.819580078125, 5.05078125, 5.281982421875, 5.51318359375, 5.744384765625, 5.9755859375, 6.206787109375, 6.43798828125, 6.669189453125, 6.900390625, 7.131591796875, 7.36279296875, 7.593994140625, 7.8251953125, 8.056396484375, 8.28759765625, 8.518798828125, 8.75]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 12.0, 9.0, 19.0, 13.0, 31.0, 30.0, 41.0, 64.0, 77.0, 105.0, 137.0, 202.0, 275.0, 471.0, 687.0, 1201.0, 4167.0, 226606.0, 3923754.0, 31036.0, 2425.0, 976.0, 579.0, 401.0, 244.0, 178.0, 119.0, 101.0, 91.0, 52.0, 44.0, 27.0, 25.0, 27.0, 18.0, 15.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.1875, -36.73828125, -35.2890625, -33.83984375, -32.390625, -30.94140625, -29.4921875, -28.04296875, -26.59375, -25.14453125, -23.6953125, -22.24609375, -20.796875, -19.34765625, -17.8984375, -16.44921875, -15.0, -13.55078125, -12.1015625, -10.65234375, -9.203125, -7.75390625, -6.3046875, -4.85546875, -3.40625, -1.95703125, -0.5078125, 0.94140625, 2.390625, 3.83984375, 5.2890625, 6.73828125, 8.1875, 9.63671875, 11.0859375, 12.53515625, 13.984375, 15.43359375, 16.8828125, 18.33203125, 19.78125, 21.23046875, 22.6796875, 24.12890625, 25.578125, 27.02734375, 28.4765625, 29.92578125, 31.375, 32.82421875, 34.2734375, 35.72265625, 37.171875, 38.62109375, 40.0703125, 41.51953125, 42.96875, 44.41796875, 45.8671875, 47.31640625, 48.765625, 50.21484375, 51.6640625, 53.11328125, 54.5625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 8.0, 13.0, 21.0, 29.0, 31.0, 77.0, 130.0, 180.0, 313.0, 456.0, 670.0, 653.0, 524.0, 333.0, 225.0, 127.0, 89.0, 63.0, 33.0, 18.0, 15.0, 11.0, 12.0, 4.0, 10.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.89404296875, -9.4990234375, -9.10400390625, -8.708984375, -8.31396484375, -7.9189453125, -7.52392578125, -7.12890625, -6.73388671875, -6.3388671875, -5.94384765625, -5.548828125, -5.15380859375, -4.7587890625, -4.36376953125, -3.96875, -3.57373046875, -3.1787109375, -2.78369140625, -2.388671875, -1.99365234375, -1.5986328125, -1.20361328125, -0.80859375, -0.41357421875, -0.0185546875, 0.37646484375, 0.771484375, 1.16650390625, 1.5615234375, 1.95654296875, 2.3515625, 2.74658203125, 3.1416015625, 3.53662109375, 3.931640625, 4.32666015625, 4.7216796875, 5.11669921875, 5.51171875, 5.90673828125, 6.3017578125, 6.69677734375, 7.091796875, 7.48681640625, 7.8818359375, 8.27685546875, 8.671875, 9.06689453125, 9.4619140625, 9.85693359375, 10.251953125, 10.64697265625, 11.0419921875, 11.43701171875, 11.83203125, 12.22705078125, 12.6220703125, 13.01708984375, 13.412109375, 13.80712890625, 14.2021484375, 14.59716796875, 14.9921875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 13.0, 14.0, 32.0, 47.0, 93.0, 204.0, 524.0, 1460.0, 5838.0, 36938.0, 836389.0, 3186583.0, 110482.0, 11732.0, 2579.0, 781.0, 291.0, 133.0, 59.0, 36.0, 23.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6796875, -15.1239013671875, -14.568115234375, -14.0123291015625, -13.45654296875, -12.9007568359375, -12.344970703125, -11.7891845703125, -11.2333984375, -10.6776123046875, -10.121826171875, -9.5660400390625, -9.01025390625, -8.4544677734375, -7.898681640625, -7.3428955078125, -6.787109375, -6.2313232421875, -5.675537109375, -5.1197509765625, -4.56396484375, -4.0081787109375, -3.452392578125, -2.8966064453125, -2.3408203125, -1.7850341796875, -1.229248046875, -0.6734619140625, -0.11767578125, 0.4381103515625, 0.993896484375, 1.5496826171875, 2.10546875, 2.6612548828125, 3.217041015625, 3.7728271484375, 4.32861328125, 4.8843994140625, 5.440185546875, 5.9959716796875, 6.5517578125, 7.1075439453125, 7.663330078125, 8.2191162109375, 8.77490234375, 9.3306884765625, 9.886474609375, 10.4422607421875, 10.998046875, 11.5538330078125, 12.109619140625, 12.6654052734375, 13.22119140625, 13.7769775390625, 14.332763671875, 14.8885498046875, 15.4443359375, 16.0001220703125, 16.555908203125, 17.1116943359375, 17.66748046875, 18.2232666015625, 18.779052734375, 19.3348388671875, 19.890625]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 15.0, 20.0, 36.0, 92.0, 130.0, 178.0, 160.0, 138.0, 96.0, 60.0, 26.0, 26.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.20745086669922, -50.938514709472656, -47.669578552246094, -44.40064239501953, -41.13170623779297, -37.862770080566406, -34.593833923339844, -31.32489776611328, -28.05596160888672, -24.787025451660156, -21.518089294433594, -18.24915313720703, -14.980216979980469, -11.711280822753906, -8.442344665527344, -5.173408508300781, -1.9044723510742188, 1.3644638061523438, 4.633399963378906, 7.902336120605469, 11.171272277832031, 14.440208435058594, 17.709144592285156, 20.97808074951172, 24.24701690673828, 27.515953063964844, 30.784889221191406, 34.05382537841797, 37.32276153564453, 40.591697692871094, 43.860633850097656, 47.12957000732422, 50.39851379394531, 53.667449951171875, 56.93638610839844, 60.205322265625, 63.47425842285156, 66.74319458007812, 70.01213073730469, 73.28106689453125, 76.55000305175781, 79.81893920898438, 83.08787536621094, 86.3568115234375, 89.62574768066406, 92.89468383789062, 96.16361999511719, 99.43255615234375, 102.70149230957031, 105.97042846679688, 109.23936462402344, 112.50830078125, 115.77723693847656, 119.04617309570312, 122.31510925292969, 125.58404541015625, 128.8529815673828, 132.12191772460938, 135.39085388183594, 138.6597900390625, 141.92872619628906, 145.19766235351562, 148.4665985107422, 151.73553466796875, 155.0044708251953]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 3.0, 5.0, 2.0, 4.0, 3.0, 6.0, 4.0, 10.0, 10.0, 6.0, 6.0, 20.0, 27.0, 19.0, 23.0, 23.0, 30.0, 38.0, 35.0, 36.0, 39.0, 35.0, 40.0, 36.0, 44.0, 46.0, 43.0, 37.0, 25.0, 39.0, 27.0, 29.0, 33.0, 34.0, 31.0, 19.0, 25.0, 23.0, 18.0, 20.0, 13.0, 8.0, 4.0, 5.0, 8.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0], "bins": [-42.063720703125, -40.90061950683594, -39.737518310546875, -38.57441711425781, -37.41131591796875, -36.24821090698242, -35.08510971069336, -33.9220085144043, -32.758907318115234, -31.595806121826172, -30.43270492553711, -29.269601821899414, -28.10650062561035, -26.94339942932129, -25.780296325683594, -24.61719512939453, -23.45409393310547, -22.290992736816406, -21.127891540527344, -19.96478843688965, -18.801687240600586, -17.638586044311523, -16.475482940673828, -15.312381744384766, -14.149280548095703, -12.98617935180664, -11.823077201843262, -10.659975051879883, -9.49687385559082, -8.333772659301758, -7.170670509338379, -6.007568359375, -4.8444671630859375, -3.681365489959717, -2.518263816833496, -1.3551621437072754, -0.1920604705810547, 0.971041202545166, 2.1341428756713867, 3.2972450256347656, 4.460346221923828, 5.623447895050049, 6.7865495681762695, 7.94965124130249, 9.112752914428711, 10.275854110717773, 11.438956260681152, 12.602058410644531, 13.765159606933594, 14.928260803222656, 16.09136199951172, 17.254465103149414, 18.417566299438477, 19.58066749572754, 20.743770599365234, 21.906871795654297, 23.06997299194336, 24.233074188232422, 25.396175384521484, 26.55927848815918, 27.722379684448242, 28.885480880737305, 30.048583984375, 31.211685180664062, 32.374786376953125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 6.0, 8.0, 8.0, 13.0, 12.0, 17.0, 30.0, 24.0, 29.0, 48.0, 38.0, 33.0, 38.0, 47.0, 45.0, 39.0, 41.0, 54.0, 49.0, 49.0, 36.0, 43.0, 34.0, 35.0, 36.0, 25.0, 23.0, 26.0, 24.0, 16.0, 8.0, 11.0, 7.0, 10.0, 8.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-81.625, -79.52294921875, -77.4208984375, -75.31884765625, -73.216796875, -71.11474609375, -69.0126953125, -66.91064453125, -64.80859375, -62.70654296875, -60.6044921875, -58.50244140625, -56.400390625, -54.29833984375, -52.1962890625, -50.09423828125, -47.9921875, -45.89013671875, -43.7880859375, -41.68603515625, -39.583984375, -37.48193359375, -35.3798828125, -33.27783203125, -31.17578125, -29.07373046875, -26.9716796875, -24.86962890625, -22.767578125, -20.66552734375, -18.5634765625, -16.46142578125, -14.359375, -12.25732421875, -10.1552734375, -8.05322265625, -5.951171875, -3.84912109375, -1.7470703125, 0.35498046875, 2.45703125, 4.55908203125, 6.6611328125, 8.76318359375, 10.865234375, 12.96728515625, 15.0693359375, 17.17138671875, 19.2734375, 21.37548828125, 23.4775390625, 25.57958984375, 27.681640625, 29.78369140625, 31.8857421875, 33.98779296875, 36.08984375, 38.19189453125, 40.2939453125, 42.39599609375, 44.498046875, 46.60009765625, 48.7021484375, 50.80419921875, 52.90625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 10.0, 18.0, 14.0, 32.0, 54.0, 67.0, 96.0, 152.0, 209.0, 323.0, 442.0, 622.0, 909.0, 1446.0, 2093.0, 3199.0, 4563.0, 6971.0, 10482.0, 16616.0, 26390.0, 44190.0, 77391.0, 143717.0, 234219.0, 201818.0, 112405.0, 61888.0, 35822.0, 21905.0, 13622.0, 8877.0, 5826.0, 3951.0, 2606.0, 1750.0, 1224.0, 860.0, 569.0, 396.0, 249.0, 177.0, 124.0, 85.0, 57.0, 54.0, 27.0, 17.0, 9.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.7734375, -6.55352783203125, -6.3336181640625, -6.11370849609375, -5.893798828125, -5.67388916015625, -5.4539794921875, -5.23406982421875, -5.01416015625, -4.79425048828125, -4.5743408203125, -4.35443115234375, -4.134521484375, -3.91461181640625, -3.6947021484375, -3.47479248046875, -3.2548828125, -3.03497314453125, -2.8150634765625, -2.59515380859375, -2.375244140625, -2.15533447265625, -1.9354248046875, -1.71551513671875, -1.49560546875, -1.27569580078125, -1.0557861328125, -0.83587646484375, -0.615966796875, -0.39605712890625, -0.1761474609375, 0.04376220703125, 0.263671875, 0.48358154296875, 0.7034912109375, 0.92340087890625, 1.143310546875, 1.36322021484375, 1.5831298828125, 1.80303955078125, 2.02294921875, 2.24285888671875, 2.4627685546875, 2.68267822265625, 2.902587890625, 3.12249755859375, 3.3424072265625, 3.56231689453125, 3.7822265625, 4.00213623046875, 4.2220458984375, 4.44195556640625, 4.661865234375, 4.88177490234375, 5.1016845703125, 5.32159423828125, 5.54150390625, 5.76141357421875, 5.9813232421875, 6.20123291015625, 6.421142578125, 6.64105224609375, 6.8609619140625, 7.08087158203125, 7.30078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 15.0, 15.0, 20.0, 17.0, 16.0, 26.0, 24.0, 27.0, 27.0, 32.0, 30.0, 57.0, 52.0, 50.0, 39.0, 1079.0, 52.0, 44.0, 32.0, 39.0, 37.0, 47.0, 22.0, 28.0, 26.0, 27.0, 20.0, 18.0, 21.0, 17.0, 8.0, 7.0, 5.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.4443359375, -36.138671875, -34.8330078125, -33.52734375, -32.2216796875, -30.916015625, -29.6103515625, -28.3046875, -26.9990234375, -25.693359375, -24.3876953125, -23.08203125, -21.7763671875, -20.470703125, -19.1650390625, -17.859375, -16.5537109375, -15.248046875, -13.9423828125, -12.63671875, -11.3310546875, -10.025390625, -8.7197265625, -7.4140625, -6.1083984375, -4.802734375, -3.4970703125, -2.19140625, -0.8857421875, 0.419921875, 1.7255859375, 3.03125, 4.3369140625, 5.642578125, 6.9482421875, 8.25390625, 9.5595703125, 10.865234375, 12.1708984375, 13.4765625, 14.7822265625, 16.087890625, 17.3935546875, 18.69921875, 20.0048828125, 21.310546875, 22.6162109375, 23.921875, 25.2275390625, 26.533203125, 27.8388671875, 29.14453125, 30.4501953125, 31.755859375, 33.0615234375, 34.3671875, 35.6728515625, 36.978515625, 38.2841796875, 39.58984375, 40.8955078125, 42.201171875, 43.5068359375, 44.8125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 6.0, 5.0, 9.0, 23.0, 52.0, 42.0, 58.0, 100.0, 121.0, 211.0, 288.0, 430.0, 576.0, 842.0, 1238.0, 1806.0, 2688.0, 3880.0, 5711.0, 8710.0, 12860.0, 20017.0, 31006.0, 48289.0, 81736.0, 150304.0, 1291970.0, 180584.0, 96526.0, 55521.0, 34871.0, 22244.0, 14539.0, 9595.0, 6478.0, 4317.0, 2899.0, 1983.0, 1374.0, 1008.0, 696.0, 480.0, 306.0, 217.0, 175.0, 120.0, 72.0, 50.0, 32.0, 19.0, 15.0, 21.0, 10.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.29296875, -6.08758544921875, -5.8822021484375, -5.67681884765625, -5.471435546875, -5.26605224609375, -5.0606689453125, -4.85528564453125, -4.64990234375, -4.44451904296875, -4.2391357421875, -4.03375244140625, -3.828369140625, -3.62298583984375, -3.4176025390625, -3.21221923828125, -3.0068359375, -2.80145263671875, -2.5960693359375, -2.39068603515625, -2.185302734375, -1.97991943359375, -1.7745361328125, -1.56915283203125, -1.36376953125, -1.15838623046875, -0.9530029296875, -0.74761962890625, -0.542236328125, -0.33685302734375, -0.1314697265625, 0.07391357421875, 0.279296875, 0.48468017578125, 0.6900634765625, 0.89544677734375, 1.100830078125, 1.30621337890625, 1.5115966796875, 1.71697998046875, 1.92236328125, 2.12774658203125, 2.3331298828125, 2.53851318359375, 2.743896484375, 2.94927978515625, 3.1546630859375, 3.36004638671875, 3.5654296875, 3.77081298828125, 3.9761962890625, 4.18157958984375, 4.386962890625, 4.59234619140625, 4.7977294921875, 5.00311279296875, 5.20849609375, 5.41387939453125, 5.6192626953125, 5.82464599609375, 6.030029296875, 6.23541259765625, 6.4407958984375, 6.64617919921875, 6.8515625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 6.0, 4.0, 10.0, 6.0, 17.0, 7.0, 15.0, 19.0, 24.0, 33.0, 34.0, 40.0, 70.0, 75.0, 84.0, 93.0, 91.0, 75.0, 61.0, 46.0, 36.0, 33.0, 24.0, 18.0, 17.0, 14.0, 8.0, 8.0, 10.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.027679443359375, -0.02662801742553711, -0.02557659149169922, -0.024525165557861328, -0.023473739624023438, -0.022422313690185547, -0.021370887756347656, -0.020319461822509766, -0.019268035888671875, -0.018216609954833984, -0.017165184020996094, -0.016113758087158203, -0.015062332153320312, -0.014010906219482422, -0.012959480285644531, -0.01190805435180664, -0.01085662841796875, -0.00980520248413086, -0.008753776550292969, -0.007702350616455078, -0.0066509246826171875, -0.005599498748779297, -0.004548072814941406, -0.0034966468811035156, -0.002445220947265625, -0.0013937950134277344, -0.00034236907958984375, 0.0007090568542480469, 0.0017604827880859375, 0.002811908721923828, 0.0038633346557617188, 0.004914760589599609, 0.0059661865234375, 0.007017612457275391, 0.008069038391113281, 0.009120464324951172, 0.010171890258789062, 0.011223316192626953, 0.012274742126464844, 0.013326168060302734, 0.014377593994140625, 0.015429019927978516, 0.016480445861816406, 0.017531871795654297, 0.018583297729492188, 0.019634723663330078, 0.02068614959716797, 0.02173757553100586, 0.02278900146484375, 0.02384042739868164, 0.02489185333251953, 0.025943279266357422, 0.026994705200195312, 0.028046131134033203, 0.029097557067871094, 0.030148983001708984, 0.031200408935546875, 0.032251834869384766, 0.033303260803222656, 0.03435468673706055, 0.03540611267089844, 0.03645753860473633, 0.03750896453857422, 0.03856039047241211, 0.03961181640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 5.0, 7.0, 6.0, 7.0, 10.0, 18.0, 21.0, 22.0, 49.0, 61.0, 78.0, 129.0, 204.0, 341.0, 602.0, 1261.0, 3811.0, 16075.0, 104197.0, 616194.0, 260882.0, 33900.0, 6635.0, 2028.0, 835.0, 396.0, 264.0, 144.0, 111.0, 74.0, 52.0, 37.0, 25.0, 11.0, 18.0, 14.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.277099609375, -0.26955223083496094, -0.2620048522949219, -0.2544574737548828, -0.24691009521484375, -0.2393627166748047, -0.23181533813476562, -0.22426795959472656, -0.2167205810546875, -0.20917320251464844, -0.20162582397460938, -0.1940784454345703, -0.18653106689453125, -0.1789836883544922, -0.17143630981445312, -0.16388893127441406, -0.156341552734375, -0.14879417419433594, -0.14124679565429688, -0.1336994171142578, -0.12615203857421875, -0.11860466003417969, -0.11105728149414062, -0.10350990295410156, -0.0959625244140625, -0.08841514587402344, -0.08086776733398438, -0.07332038879394531, -0.06577301025390625, -0.05822563171386719, -0.050678253173828125, -0.04313087463378906, -0.03558349609375, -0.028036117553710938, -0.020488739013671875, -0.012941360473632812, -0.00539398193359375, 0.0021533966064453125, 0.009700775146484375, 0.017248153686523438, 0.0247955322265625, 0.03234291076660156, 0.039890289306640625, 0.04743766784667969, 0.05498504638671875, 0.06253242492675781, 0.07007980346679688, 0.07762718200683594, 0.085174560546875, 0.09272193908691406, 0.10026931762695312, 0.10781669616699219, 0.11536407470703125, 0.12291145324707031, 0.13045883178710938, 0.13800621032714844, 0.1455535888671875, 0.15310096740722656, 0.16064834594726562, 0.1681957244873047, 0.17574310302734375, 0.1832904815673828, 0.19083786010742188, 0.19838523864746094, 0.2059326171875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 11.0, 16.0, 39.0, 58.0, 141.0, 178.0, 189.0, 155.0, 102.0, 62.0, 29.0, 13.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07190457731485367, -0.07035074383020401, -0.06879691034555435, -0.0672430694103241, -0.06568923592567444, -0.06413540244102478, -0.06258156895637512, -0.061027731746435165, -0.05947389826178551, -0.05792006477713585, -0.05636622756719589, -0.054812394082546234, -0.05325855687260628, -0.05170472338795662, -0.05015088617801666, -0.048597052693367004, -0.047043219208717346, -0.04548938572406769, -0.04393554851412773, -0.04238171502947807, -0.040827877819538116, -0.03927404433488846, -0.0377202108502388, -0.03616637364029884, -0.03461253643035889, -0.03305870294570923, -0.03150486573576927, -0.029951032251119614, -0.028397196903824806, -0.02684336155653, -0.02528952620923519, -0.023735690861940384, -0.022181859239935875, -0.020628023892641068, -0.01907418854534626, -0.017520353198051453, -0.015966519713401794, -0.014412684366106987, -0.01285884901881218, -0.011305014602839947, -0.00975117925554514, -0.008197343908250332, -0.006643509492278099, -0.005089674144983292, -0.0035358392633497715, -0.0019820043817162514, -0.00042816903442144394, 0.0011256653815507889, 0.0026795007288455963, 0.0042333356104791164, 0.0057871704921126366, 0.007341005839407444, 0.008894840255379677, 0.010448675602674484, 0.012002510949969292, 0.013556345365941525, 0.015110180713236332, 0.016664015129208565, 0.018217850476503372, 0.01977168582379818, 0.021325521171092987, 0.022879354655742645, 0.024433191865682602, 0.02598702535033226, 0.027540860697627068]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 13.0, 5.0, 9.0, 14.0, 7.0, 17.0, 12.0, 14.0, 24.0, 31.0, 21.0, 30.0, 34.0, 34.0, 34.0, 35.0, 40.0, 36.0, 43.0, 41.0, 44.0, 47.0, 39.0, 42.0, 46.0, 28.0, 25.0, 33.0, 27.0, 13.0, 26.0, 13.0, 20.0, 19.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013593435287475586, -0.013115603476762772, -0.012637771666049957, -0.012159939855337143, -0.011682108044624329, -0.011204276233911514, -0.0107264444231987, -0.010248612612485886, -0.009770780801773071, -0.009292948991060257, -0.008815117180347443, -0.008337285369634628, -0.007859453558921814, -0.007381621748209, -0.006903789937496185, -0.006425958126783371, -0.005948126316070557, -0.005470294505357742, -0.004992462694644928, -0.004514630883932114, -0.004036799073219299, -0.003558967262506485, -0.0030811354517936707, -0.0026033036410808563, -0.002125471830368042, -0.0016476400196552277, -0.0011698082089424133, -0.000691976398229599, -0.00021414458751678467, 0.00026368722319602966, 0.000741519033908844, 0.0012193508446216583, 0.0016971826553344727, 0.002175014466047287, 0.0026528462767601013, 0.0031306780874729156, 0.00360850989818573, 0.004086341708898544, 0.004564173519611359, 0.005042005330324173, 0.005519837141036987, 0.005997668951749802, 0.006475500762462616, 0.00695333257317543, 0.007431164383888245, 0.007908996194601059, 0.008386828005313873, 0.008864659816026688, 0.009342491626739502, 0.009820323437452316, 0.01029815524816513, 0.010775987058877945, 0.01125381886959076, 0.011731650680303574, 0.012209482491016388, 0.012687314301729202, 0.013165146112442017, 0.013642977923154831, 0.014120809733867645, 0.01459864154458046, 0.015076473355293274, 0.015554305166006088, 0.016032136976718903, 0.016509968787431717, 0.01698780059814453]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 8.0, 8.0, 13.0, 12.0, 17.0, 30.0, 23.0, 30.0, 48.0, 38.0, 36.0, 35.0, 47.0, 45.0, 39.0, 43.0, 53.0, 49.0, 48.0, 37.0, 42.0, 34.0, 35.0, 35.0, 27.0, 22.0, 26.0, 24.0, 16.0, 8.0, 11.0, 7.0, 10.0, 8.0, 2.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-81.6875, -79.5830078125, -77.478515625, -75.3740234375, -73.26953125, -71.1650390625, -69.060546875, -66.9560546875, -64.8515625, -62.7470703125, -60.642578125, -58.5380859375, -56.43359375, -54.3291015625, -52.224609375, -50.1201171875, -48.015625, -45.9111328125, -43.806640625, -41.7021484375, -39.59765625, -37.4931640625, -35.388671875, -33.2841796875, -31.1796875, -29.0751953125, -26.970703125, -24.8662109375, -22.76171875, -20.6572265625, -18.552734375, -16.4482421875, -14.34375, -12.2392578125, -10.134765625, -8.0302734375, -5.92578125, -3.8212890625, -1.716796875, 0.3876953125, 2.4921875, 4.5966796875, 6.701171875, 8.8056640625, 10.91015625, 13.0146484375, 15.119140625, 17.2236328125, 19.328125, 21.4326171875, 23.537109375, 25.6416015625, 27.74609375, 29.8505859375, 31.955078125, 34.0595703125, 36.1640625, 38.2685546875, 40.373046875, 42.4775390625, 44.58203125, 46.6865234375, 48.791015625, 50.8955078125, 53.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 7.0, 8.0, 16.0, 15.0, 18.0, 26.0, 24.0, 32.0, 56.0, 79.0, 100.0, 186.0, 225.0, 422.0, 720.0, 1158.0, 2120.0, 4237.0, 9434.0, 27848.0, 118959.0, 544028.0, 260591.0, 50619.0, 14899.0, 5843.0, 2890.0, 1574.0, 854.0, 522.0, 336.0, 232.0, 118.0, 81.0, 63.0, 51.0, 35.0, 30.0, 27.0, 17.0, 4.0, 5.0, 8.0, 5.0, 11.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.03125, -15.555908203125, -15.08056640625, -14.605224609375, -14.1298828125, -13.654541015625, -13.17919921875, -12.703857421875, -12.228515625, -11.753173828125, -11.27783203125, -10.802490234375, -10.3271484375, -9.851806640625, -9.37646484375, -8.901123046875, -8.42578125, -7.950439453125, -7.47509765625, -6.999755859375, -6.5244140625, -6.049072265625, -5.57373046875, -5.098388671875, -4.623046875, -4.147705078125, -3.67236328125, -3.197021484375, -2.7216796875, -2.246337890625, -1.77099609375, -1.295654296875, -0.8203125, -0.344970703125, 0.13037109375, 0.605712890625, 1.0810546875, 1.556396484375, 2.03173828125, 2.507080078125, 2.982421875, 3.457763671875, 3.93310546875, 4.408447265625, 4.8837890625, 5.359130859375, 5.83447265625, 6.309814453125, 6.78515625, 7.260498046875, 7.73583984375, 8.211181640625, 8.6865234375, 9.161865234375, 9.63720703125, 10.112548828125, 10.587890625, 11.063232421875, 11.53857421875, 12.013916015625, 12.4892578125, 12.964599609375, 13.43994140625, 13.915283203125, 14.390625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 15.0, 23.0, 43.0, 48.0, 97.0, 115.0, 147.0, 2148.0, 125.0, 98.0, 84.0, 47.0, 31.0, 15.0, 2.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.0, -229.861328125, -222.72265625, -215.583984375, -208.4453125, -201.306640625, -194.16796875, -187.029296875, -179.890625, -172.751953125, -165.61328125, -158.474609375, -151.3359375, -144.197265625, -137.05859375, -129.919921875, -122.78125, -115.642578125, -108.50390625, -101.365234375, -94.2265625, -87.087890625, -79.94921875, -72.810546875, -65.671875, -58.533203125, -51.39453125, -44.255859375, -37.1171875, -29.978515625, -22.83984375, -15.701171875, -8.5625, -1.423828125, 5.71484375, 12.853515625, 19.9921875, 27.130859375, 34.26953125, 41.408203125, 48.546875, 55.685546875, 62.82421875, 69.962890625, 77.1015625, 84.240234375, 91.37890625, 98.517578125, 105.65625, 112.794921875, 119.93359375, 127.072265625, 134.2109375, 141.349609375, 148.48828125, 155.626953125, 162.765625, 169.904296875, 177.04296875, 184.181640625, 191.3203125, 198.458984375, 205.59765625, 212.736328125, 219.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 10.0, 7.0, 16.0, 16.0, 21.0, 48.0, 113.0, 199.0, 387.0, 922.0, 2918.0, 37296.0, 3060608.0, 38402.0, 2942.0, 947.0, 381.0, 209.0, 113.0, 43.0, 29.0, 27.0, 14.0, 7.0, 1.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.6875, -41.33251953125, -39.9775390625, -38.62255859375, -37.267578125, -35.91259765625, -34.5576171875, -33.20263671875, -31.84765625, -30.49267578125, -29.1376953125, -27.78271484375, -26.427734375, -25.07275390625, -23.7177734375, -22.36279296875, -21.0078125, -19.65283203125, -18.2978515625, -16.94287109375, -15.587890625, -14.23291015625, -12.8779296875, -11.52294921875, -10.16796875, -8.81298828125, -7.4580078125, -6.10302734375, -4.748046875, -3.39306640625, -2.0380859375, -0.68310546875, 0.671875, 2.02685546875, 3.3818359375, 4.73681640625, 6.091796875, 7.44677734375, 8.8017578125, 10.15673828125, 11.51171875, 12.86669921875, 14.2216796875, 15.57666015625, 16.931640625, 18.28662109375, 19.6416015625, 20.99658203125, 22.3515625, 23.70654296875, 25.0615234375, 26.41650390625, 27.771484375, 29.12646484375, 30.4814453125, 31.83642578125, 33.19140625, 34.54638671875, 35.9013671875, 37.25634765625, 38.611328125, 39.96630859375, 41.3212890625, 42.67626953125, 44.03125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 4.0, 7.0, 17.0, 46.0, 88.0, 193.0, 283.0, 213.0, 83.0, 29.0, 13.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.46654510498047, -94.00914001464844, -86.5517349243164, -79.09432983398438, -71.63692474365234, -64.17951965332031, -56.72211837768555, -49.264713287353516, -41.807308197021484, -34.34990310668945, -26.892498016357422, -19.435094833374023, -11.977689743041992, -4.520286560058594, 2.9371185302734375, 10.394523620605469, 17.8519287109375, 25.30933380126953, 32.76673889160156, 40.224143981933594, 47.681549072265625, 55.13895034790039, 62.59635543823242, 70.05375671386719, 77.51116943359375, 84.96857452392578, 92.42597961425781, 99.88338470458984, 107.34078979492188, 114.79818725585938, 122.25559997558594, 129.71299743652344, 137.17039489746094, 144.62779235839844, 152.085205078125, 159.5426025390625, 167.00001525878906, 174.45741271972656, 181.91482543945312, 189.37222290039062, 196.8296356201172, 204.2870330810547, 211.74444580078125, 219.20184326171875, 226.6592559814453, 234.1166534423828, 241.57406616210938, 249.03146362304688, 256.4888610839844, 263.9462585449219, 271.4036560058594, 278.861083984375, 286.3184814453125, 293.77587890625, 301.2332763671875, 308.6907043457031, 316.1481018066406, 323.6054992675781, 331.0628967285156, 338.52032470703125, 345.97772216796875, 353.43511962890625, 360.89251708984375, 368.3499450683594, 375.8073425292969]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 4.0, 11.0, 8.0, 16.0, 12.0, 21.0, 17.0, 22.0, 26.0, 31.0, 25.0, 24.0, 43.0, 29.0, 38.0, 47.0, 42.0, 38.0, 46.0, 55.0, 39.0, 38.0, 42.0, 21.0, 35.0, 35.0, 31.0, 33.0, 27.0, 16.0, 21.0, 13.0, 18.0, 17.0, 15.0, 8.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.51020812988281, -104.12420654296875, -100.73821258544922, -97.35221099853516, -93.9662094116211, -90.58021545410156, -87.1942138671875, -83.80821228027344, -80.4222183227539, -77.03621673583984, -73.65022277832031, -70.26422119140625, -66.87821960449219, -63.492225646972656, -60.106224060058594, -56.7202262878418, -53.334224700927734, -49.94822692871094, -46.562225341796875, -43.17622756958008, -39.79022979736328, -36.40422821044922, -33.01823043823242, -29.632232666015625, -26.246232986450195, -22.860233306884766, -19.47423553466797, -16.08823585510254, -12.702237129211426, -9.316238403320312, -5.930238723754883, -2.544240951538086, 0.8417587280273438, 4.227757453918457, 7.6137566566467285, 10.999755859375, 14.385754585266113, 17.771753311157227, 21.157752990722656, 24.543750762939453, 27.929750442504883, 31.315750122070312, 34.70174789428711, 38.087745666503906, 41.47374725341797, 44.859745025634766, 48.24574279785156, 51.631744384765625, 55.01774215698242, 58.40373992919922, 61.78974151611328, 65.17573547363281, 68.56173706054688, 71.94773864746094, 75.333740234375, 78.71973419189453, 82.1057357788086, 85.49173736572266, 88.87773132324219, 92.26373291015625, 95.64973449707031, 99.03572845458984, 102.4217300415039, 105.80772399902344, 109.1937255859375]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 9.0, 15.0, 33.0, 57.0, 78.0, 125.0, 206.0, 278.0, 379.0, 613.0, 953.0, 1889.0, 1040796.0, 1104.0, 625.0, 434.0, 310.0, 229.0, 165.0, 105.0, 63.0, 46.0, 18.0, 16.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-71.52371215820312, -69.69764709472656, -67.87158966064453, -66.0455322265625, -64.21946716308594, -62.39340591430664, -60.567344665527344, -58.74128341674805, -56.91522216796875, -55.08916091918945, -53.263099670410156, -51.43703842163086, -49.61097717285156, -47.784915924072266, -45.95885467529297, -44.13279342651367, -42.306732177734375, -40.48067092895508, -38.65460968017578, -36.828548431396484, -35.00248718261719, -33.17642593383789, -31.350364685058594, -29.524303436279297, -27.6982421875, -25.872180938720703, -24.046119689941406, -22.22005844116211, -20.393997192382812, -18.567935943603516, -16.74187469482422, -14.915813446044922, -13.089752197265625, -11.263690948486328, -9.437629699707031, -7.611568450927734, -5.7855072021484375, -3.9594459533691406, -2.1333847045898438, -0.3073234558105469, 1.51873779296875, 3.344799041748047, 5.170860290527344, 6.996921539306641, 8.822982788085938, 10.649044036865234, 12.475105285644531, 14.301166534423828, 16.127227783203125, 17.953289031982422, 19.77935028076172, 21.605411529541016, 23.431472778320312, 25.25753402709961, 27.083595275878906, 28.909656524658203, 30.7357177734375, 32.5617790222168, 34.387840270996094, 36.21390151977539, 38.03996276855469, 39.866024017333984, 41.69208526611328, 43.51814651489258, 45.344207763671875]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 6.0, 6.0, 11.0, 9.0, 20.0, 47.0, 135.0, 44084.0, 51419584.0, 106.0, 45.0, 32.0, 11.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3738.0, -3582.353759765625, -3426.70751953125, -3271.061279296875, -3115.4150390625, -2959.768798828125, -2804.12255859375, -2648.4765625, -2492.830078125, -2337.183837890625, -2181.53759765625, -2025.891357421875, -1870.2451171875, -1714.598876953125, -1558.9527587890625, -1403.3065185546875, -1247.660400390625, -1092.01416015625, -936.367919921875, -780.7217407226562, -625.0755004882812, -469.42926025390625, -313.7830810546875, -158.1368408203125, -2.4906005859375, 153.15562438964844, 308.8018493652344, 464.44805908203125, 620.0942993164062, 775.7405395507812, 931.38671875, 1087.032958984375, 1242.67919921875, 1398.325439453125, 1553.9716796875, 1709.617919921875, 1865.26416015625, 2020.910400390625, 2176.556640625, 2332.20263671875, 2487.84912109375, 2643.495361328125, 2799.1416015625, 2954.787841796875, 3110.43408203125, 3266.080322265625, 3421.7265625, 3577.37255859375, 3733.018798828125, 3888.6650390625, 4044.311279296875, 4199.95751953125, 4355.603515625, 4511.25, 4666.89599609375, 4822.54248046875, 4978.1884765625, 5133.83447265625, 5289.48095703125, 5445.126953125, 5600.7734375, 5756.41943359375, 5912.06591796875, 6067.7119140625, 6223.3583984375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 8.0, 16.0, 21.0, 24.0, 41.0, 81.0, 124.0, 151.0, 216.0, 361.0, 467.0, 720.0, 1025.0, 1452.0, 2191.0, 3210.0, 4492.0, 6664.0, 9964.0, 14955.0, 22921.0, 35894.0, 56951.0, 92879.0, 158900.0, 292016.0, 620144.0, 3797450.0, 528428.0, 260328.0, 144165.0, 85236.0, 51846.0, 32885.0, 21479.0, 13939.0, 9217.0, 6369.0, 4406.0, 2906.0, 2043.0, 1484.0, 978.0, 735.0, 565.0, 332.0, 221.0, 164.0, 125.0, 87.0, 56.0, 36.0, 21.0, 14.0, 13.0, 9.0, 10.0, 3.0, 1.0, 2.0], "bins": [-3.087890625, -2.989593505859375, -2.89129638671875, -2.792999267578125, -2.6947021484375, -2.596405029296875, -2.49810791015625, -2.399810791015625, -2.301513671875, -2.203216552734375, -2.10491943359375, -2.006622314453125, -1.9083251953125, -1.810028076171875, -1.71173095703125, -1.613433837890625, -1.51513671875, -1.416839599609375, -1.31854248046875, -1.220245361328125, -1.1219482421875, -1.023651123046875, -0.92535400390625, -0.827056884765625, -0.728759765625, -0.630462646484375, -0.53216552734375, -0.433868408203125, -0.3355712890625, -0.237274169921875, -0.13897705078125, -0.040679931640625, 0.0576171875, 0.155914306640625, 0.25421142578125, 0.352508544921875, 0.4508056640625, 0.549102783203125, 0.64739990234375, 0.745697021484375, 0.843994140625, 0.942291259765625, 1.04058837890625, 1.138885498046875, 1.2371826171875, 1.335479736328125, 1.43377685546875, 1.532073974609375, 1.63037109375, 1.728668212890625, 1.82696533203125, 1.925262451171875, 2.0235595703125, 2.121856689453125, 2.22015380859375, 2.318450927734375, 2.416748046875, 2.515045166015625, 2.61334228515625, 2.711639404296875, 2.8099365234375, 2.908233642578125, 3.00653076171875, 3.104827880859375, 3.203125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 14.0, 15.0, 4.0, 18.0, 24.0, 18.0, 29.0, 29.0, 26.0, 32.0, 26.0, 29.0, 33.0, 34.0, 54.0, 88.0, 377.0, 637.0, 84.0, 28.0, 40.0, 44.0, 33.0, 33.0, 38.0, 19.0, 22.0, 32.0, 20.0, 16.0, 15.0, 11.0, 16.0, 16.0, 6.0, 5.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0], "bins": [-15.171875, -14.774658203125, -14.37744140625, -13.980224609375, -13.5830078125, -13.185791015625, -12.78857421875, -12.391357421875, -11.994140625, -11.596923828125, -11.19970703125, -10.802490234375, -10.4052734375, -10.008056640625, -9.61083984375, -9.213623046875, -8.81640625, -8.419189453125, -8.02197265625, -7.624755859375, -7.2275390625, -6.830322265625, -6.43310546875, -6.035888671875, -5.638671875, -5.241455078125, -4.84423828125, -4.447021484375, -4.0498046875, -3.652587890625, -3.25537109375, -2.858154296875, -2.4609375, -2.063720703125, -1.66650390625, -1.269287109375, -0.8720703125, -0.474853515625, -0.07763671875, 0.319580078125, 0.716796875, 1.114013671875, 1.51123046875, 1.908447265625, 2.3056640625, 2.702880859375, 3.10009765625, 3.497314453125, 3.89453125, 4.291748046875, 4.68896484375, 5.086181640625, 5.4833984375, 5.880615234375, 6.27783203125, 6.675048828125, 7.072265625, 7.469482421875, 7.86669921875, 8.263916015625, 8.6611328125, 9.058349609375, 9.45556640625, 9.852783203125, 10.25]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 14.0, 5.0, 8.0, 9.0, 9.0, 25.0, 40.0, 62.0, 63.0, 110.0, 146.0, 242.0, 359.0, 566.0, 880.0, 1373.0, 2292.0, 3680.0, 6089.0, 10063.0, 17544.0, 30879.0, 55932.0, 106812.0, 214971.0, 503150.0, 4047304.0, 733867.0, 269354.0, 130454.0, 67825.0, 36782.0, 20477.0, 11741.0, 7091.0, 4230.0, 2497.0, 1599.0, 1090.0, 636.0, 414.0, 275.0, 159.0, 110.0, 78.0, 39.0, 29.0, 36.0, 12.0, 8.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 2.0], "bins": [-5.30078125, -5.14324951171875, -4.9857177734375, -4.82818603515625, -4.670654296875, -4.51312255859375, -4.3555908203125, -4.19805908203125, -4.04052734375, -3.88299560546875, -3.7254638671875, -3.56793212890625, -3.410400390625, -3.25286865234375, -3.0953369140625, -2.93780517578125, -2.7802734375, -2.62274169921875, -2.4652099609375, -2.30767822265625, -2.150146484375, -1.99261474609375, -1.8350830078125, -1.67755126953125, -1.52001953125, -1.36248779296875, -1.2049560546875, -1.04742431640625, -0.889892578125, -0.73236083984375, -0.5748291015625, -0.41729736328125, -0.259765625, -0.10223388671875, 0.0552978515625, 0.21282958984375, 0.370361328125, 0.52789306640625, 0.6854248046875, 0.84295654296875, 1.00048828125, 1.15802001953125, 1.3155517578125, 1.47308349609375, 1.630615234375, 1.78814697265625, 1.9456787109375, 2.10321044921875, 2.2607421875, 2.41827392578125, 2.5758056640625, 2.73333740234375, 2.890869140625, 3.04840087890625, 3.2059326171875, 3.36346435546875, 3.52099609375, 3.67852783203125, 3.8360595703125, 3.99359130859375, 4.151123046875, 4.30865478515625, 4.4661865234375, 4.62371826171875, 4.78125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 6.0, 12.0, 13.0, 11.0, 10.0, 16.0, 16.0, 20.0, 31.0, 19.0, 23.0, 41.0, 44.0, 38.0, 48.0, 55.0, 83.0, 286.0, 674.0, 109.0, 47.0, 52.0, 46.0, 33.0, 37.0, 33.0, 38.0, 30.0, 21.0, 24.0, 17.0, 17.0, 16.0, 5.0, 16.0, 4.0, 7.0, 4.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.578125, -8.2965087890625, -8.014892578125, -7.7332763671875, -7.45166015625, -7.1700439453125, -6.888427734375, -6.6068115234375, -6.3251953125, -6.0435791015625, -5.761962890625, -5.4803466796875, -5.19873046875, -4.9171142578125, -4.635498046875, -4.3538818359375, -4.072265625, -3.7906494140625, -3.509033203125, -3.2274169921875, -2.94580078125, -2.6641845703125, -2.382568359375, -2.1009521484375, -1.8193359375, -1.5377197265625, -1.256103515625, -0.9744873046875, -0.69287109375, -0.4112548828125, -0.129638671875, 0.1519775390625, 0.43359375, 0.7152099609375, 0.996826171875, 1.2784423828125, 1.56005859375, 1.8416748046875, 2.123291015625, 2.4049072265625, 2.6865234375, 2.9681396484375, 3.249755859375, 3.5313720703125, 3.81298828125, 4.0946044921875, 4.376220703125, 4.6578369140625, 4.939453125, 5.2210693359375, 5.502685546875, 5.7843017578125, 6.06591796875, 6.3475341796875, 6.629150390625, 6.9107666015625, 7.1923828125, 7.4739990234375, 7.755615234375, 8.0372314453125, 8.31884765625, 8.6004638671875, 8.882080078125, 9.1636962890625, 9.4453125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 10.0, 8.0, 11.0, 20.0, 26.0, 20.0, 21.0, 48.0, 52.0, 68.0, 92.0, 82.0, 151.0, 191.0, 218.0, 275.0, 419.0, 542.0, 709.0, 952.0, 1341.0, 2153.0, 3316.0, 5494.0, 10757.0, 22427.0, 62965.0, 2998295.0, 3066450.0, 63480.0, 23367.0, 10816.0, 5686.0, 3423.0, 2183.0, 1364.0, 984.0, 718.0, 603.0, 398.0, 272.0, 225.0, 177.0, 136.0, 113.0, 88.0, 72.0, 47.0, 44.0, 38.0, 33.0, 14.0, 11.0, 13.0, 15.0, 3.0, 2.0, 3.0, 3.0, 3.0], "bins": [-13.546875, -13.12353515625, -12.7001953125, -12.27685546875, -11.853515625, -11.43017578125, -11.0068359375, -10.58349609375, -10.16015625, -9.73681640625, -9.3134765625, -8.89013671875, -8.466796875, -8.04345703125, -7.6201171875, -7.19677734375, -6.7734375, -6.35009765625, -5.9267578125, -5.50341796875, -5.080078125, -4.65673828125, -4.2333984375, -3.81005859375, -3.38671875, -2.96337890625, -2.5400390625, -2.11669921875, -1.693359375, -1.27001953125, -0.8466796875, -0.42333984375, 0.0, 0.42333984375, 0.8466796875, 1.27001953125, 1.693359375, 2.11669921875, 2.5400390625, 2.96337890625, 3.38671875, 3.81005859375, 4.2333984375, 4.65673828125, 5.080078125, 5.50341796875, 5.9267578125, 6.35009765625, 6.7734375, 7.19677734375, 7.6201171875, 8.04345703125, 8.466796875, 8.89013671875, 9.3134765625, 9.73681640625, 10.16015625, 10.58349609375, 11.0068359375, 11.43017578125, 11.853515625, 12.27685546875, 12.7001953125, 13.12353515625, 13.546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 10.0, 7.0, 13.0, 13.0, 15.0, 13.0, 14.0, 24.0, 22.0, 21.0, 22.0, 25.0, 22.0, 33.0, 37.0, 46.0, 78.0, 116.0, 243.0, 506.0, 177.0, 91.0, 71.0, 47.0, 36.0, 48.0, 41.0, 25.0, 23.0, 24.0, 20.0, 17.0, 17.0, 13.0, 11.0, 16.0, 8.0, 6.0, 8.0, 6.0, 6.0, 8.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.40625, -6.22637939453125, -6.0465087890625, -5.86663818359375, -5.686767578125, -5.50689697265625, -5.3270263671875, -5.14715576171875, -4.96728515625, -4.78741455078125, -4.6075439453125, -4.42767333984375, -4.247802734375, -4.06793212890625, -3.8880615234375, -3.70819091796875, -3.5283203125, -3.34844970703125, -3.1685791015625, -2.98870849609375, -2.808837890625, -2.62896728515625, -2.4490966796875, -2.26922607421875, -2.08935546875, -1.90948486328125, -1.7296142578125, -1.54974365234375, -1.369873046875, -1.19000244140625, -1.0101318359375, -0.83026123046875, -0.650390625, -0.47052001953125, -0.2906494140625, -0.11077880859375, 0.069091796875, 0.24896240234375, 0.4288330078125, 0.60870361328125, 0.78857421875, 0.96844482421875, 1.1483154296875, 1.32818603515625, 1.508056640625, 1.68792724609375, 1.8677978515625, 2.04766845703125, 2.2275390625, 2.40740966796875, 2.5872802734375, 2.76715087890625, 2.947021484375, 3.12689208984375, 3.3067626953125, 3.48663330078125, 3.66650390625, 3.84637451171875, 4.0262451171875, 4.20611572265625, 4.385986328125, 4.56585693359375, 4.7457275390625, 4.92559814453125, 5.10546875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 6.0, 4.0, 10.0, 14.0, 41.0, 106.0, 341.0, 353.0, 85.0, 31.0, 9.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.273681640625, -61.02841567993164, -59.78315353393555, -58.53788757324219, -57.292625427246094, -56.047359466552734, -54.802093505859375, -53.55683135986328, -52.31156539916992, -51.06629943847656, -49.82103729248047, -48.57577133178711, -47.33050537109375, -46.085243225097656, -44.8399772644043, -43.59471130371094, -42.349449157714844, -41.104183197021484, -39.85892105102539, -38.61365509033203, -37.36839294433594, -36.12312698364258, -34.87786102294922, -33.632598876953125, -32.387332916259766, -31.14206886291504, -29.896804809570312, -28.651538848876953, -27.406274795532227, -26.1610107421875, -24.91574478149414, -23.670480728149414, -22.425214767456055, -21.179950714111328, -19.93468475341797, -18.689420700073242, -17.444156646728516, -16.19889259338379, -14.953627586364746, -13.708362579345703, -12.463098526000977, -11.21783447265625, -9.972569465637207, -8.727304458618164, -7.4820404052734375, -6.236775875091553, -4.991511344909668, -3.746246337890625, -2.5009822845458984, -1.2557177543640137, -0.010453224182128906, 1.2348113059997559, 2.4800758361816406, 3.7253403663635254, 4.97060489654541, 6.215869903564453, 7.46113395690918, 8.706398010253906, 9.95166301727295, 11.196928024291992, 12.442192077636719, 13.687456130981445, 14.932721138000488, 16.17798614501953, 17.423250198364258]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 9.0, 12.0, 10.0, 11.0, 12.0, 21.0, 18.0, 29.0, 24.0, 21.0, 25.0, 23.0, 31.0, 32.0, 35.0, 39.0, 48.0, 38.0, 39.0, 45.0, 47.0, 36.0, 49.0, 38.0, 40.0, 38.0, 37.0, 27.0, 22.0, 26.0, 23.0, 14.0, 9.0, 13.0, 14.0, 11.0, 3.0, 7.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.506961822509766, -8.229288101196289, -7.951613903045654, -7.673940181732178, -7.396266460418701, -7.118592262268066, -6.84091854095459, -6.563244819641113, -6.285571098327637, -6.00789737701416, -5.730223178863525, -5.452549457550049, -5.174875736236572, -4.8972015380859375, -4.619527816772461, -4.341854095458984, -4.06417989730835, -3.786505937576294, -3.5088322162628174, -3.2311582565307617, -2.953484535217285, -2.6758105754852295, -2.398136615753174, -2.1204628944396973, -1.8427889347076416, -1.5651150941848755, -1.2874412536621094, -1.0097672939300537, -0.7320934534072876, -0.4544196128845215, -0.17674565315246582, 0.10092818737030029, 0.3786020278930664, 0.6562758684158325, 0.9339497685432434, 1.2116236686706543, 1.4892975091934204, 1.7669713497161865, 2.044645309448242, 2.3223190307617188, 2.5999929904937744, 2.87766695022583, 3.1553406715393066, 3.4330146312713623, 3.710688591003418, 3.9883623123168945, 4.266036033630371, 4.543710231781006, 4.821383953094482, 5.099057674407959, 5.376731872558594, 5.65440559387207, 5.932079315185547, 6.209753036499023, 6.487427234649658, 6.765100955963135, 7.0427751541137695, 7.320448875427246, 7.598123073577881, 7.875796794891357, 8.153470993041992, 8.431144714355469, 8.708818435668945, 8.986492156982422, 9.264165878295898]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 12.0, 18.0, 23.0, 54.0, 72.0, 87.0, 165.0, 255.0, 438.0, 692.0, 1353.0, 2765.0, 6494.0, 19200.0, 119560.0, 3969088.0, 51699.0, 12588.0, 4720.0, 2175.0, 1100.0, 609.0, 374.0, 239.0, 150.0, 95.0, 67.0, 45.0, 41.0, 22.0, 15.0, 15.0, 7.0, 8.0, 4.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1680908203125, -0.1602039337158203, -0.15231704711914062, -0.14443016052246094, -0.13654327392578125, -0.12865638732910156, -0.12076950073242188, -0.11288261413574219, -0.1049957275390625, -0.09710884094238281, -0.08922195434570312, -0.08133506774902344, -0.07344818115234375, -0.06556129455566406, -0.057674407958984375, -0.04978752136230469, -0.041900634765625, -0.03401374816894531, -0.026126861572265625, -0.018239974975585938, -0.01035308837890625, -0.0024662017822265625, 0.005420684814453125, 0.013307571411132812, 0.0211944580078125, 0.029081344604492188, 0.036968231201171875, 0.04485511779785156, 0.05274200439453125, 0.06062889099121094, 0.06851577758789062, 0.07640266418457031, 0.08428955078125, 0.09217643737792969, 0.10006332397460938, 0.10795021057128906, 0.11583709716796875, 0.12372398376464844, 0.13161087036132812, 0.1394977569580078, 0.1473846435546875, 0.1552715301513672, 0.16315841674804688, 0.17104530334472656, 0.17893218994140625, 0.18681907653808594, 0.19470596313476562, 0.2025928497314453, 0.210479736328125, 0.2183666229248047, 0.22625350952148438, 0.23414039611816406, 0.24202728271484375, 0.24991416931152344, 0.2578010559082031, 0.2656879425048828, 0.2735748291015625, 0.2814617156982422, 0.2893486022949219, 0.29723548889160156, 0.30512237548828125, 0.31300926208496094, 0.3208961486816406, 0.3287830352783203, 0.336669921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 13.0, 7.0, 11.0, 18.0, 24.0, 142.0, 653.0, 32.0, 18.0, 9.0, 11.0, 9.0, 13.0, 2.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0281982421875, -0.026807308197021484, -0.02541637420654297, -0.024025440216064453, -0.022634506225585938, -0.021243572235107422, -0.019852638244628906, -0.01846170425415039, -0.017070770263671875, -0.01567983627319336, -0.014288902282714844, -0.012897968292236328, -0.011507034301757812, -0.010116100311279297, -0.008725166320800781, -0.007334232330322266, -0.00594329833984375, -0.004552364349365234, -0.0031614303588867188, -0.0017704963684082031, -0.0003795623779296875, 0.0010113716125488281, 0.0024023056030273438, 0.0037932395935058594, 0.005184173583984375, 0.006575107574462891, 0.007966041564941406, 0.009356975555419922, 0.010747909545898438, 0.012138843536376953, 0.013529777526855469, 0.014920711517333984, 0.0163116455078125, 0.017702579498291016, 0.01909351348876953, 0.020484447479248047, 0.021875381469726562, 0.023266315460205078, 0.024657249450683594, 0.02604818344116211, 0.027439117431640625, 0.02883005142211914, 0.030220985412597656, 0.03161191940307617, 0.03300285339355469, 0.0343937873840332, 0.03578472137451172, 0.037175655364990234, 0.03856658935546875, 0.039957523345947266, 0.04134845733642578, 0.0427393913269043, 0.04413032531738281, 0.04552125930786133, 0.046912193298339844, 0.04830312728881836, 0.049694061279296875, 0.05108499526977539, 0.052475929260253906, 0.05386686325073242, 0.05525779724121094, 0.05664873123168945, 0.05803966522216797, 0.059430599212646484, 0.060821533203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 8.0, 8.0, 16.0, 30.0, 40.0, 51.0, 74.0, 111.0, 204.0, 321.0, 568.0, 885.0, 1808.0, 3456.0, 7550.0, 19259.0, 60975.0, 328875.0, 3197429.0, 467160.0, 71311.0, 20100.0, 7324.0, 3208.0, 1529.0, 753.0, 433.0, 270.0, 167.0, 114.0, 77.0, 48.0, 25.0, 24.0, 14.0, 12.0, 6.0, 6.0, 1.0, 3.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16162109375, -0.1561565399169922, -0.15069198608398438, -0.14522743225097656, -0.13976287841796875, -0.13429832458496094, -0.12883377075195312, -0.12336921691894531, -0.1179046630859375, -0.11244010925292969, -0.10697555541992188, -0.10151100158691406, -0.09604644775390625, -0.09058189392089844, -0.08511734008789062, -0.07965278625488281, -0.074188232421875, -0.06872367858886719, -0.06325912475585938, -0.05779457092285156, -0.05233001708984375, -0.04686546325683594, -0.041400909423828125, -0.03593635559082031, -0.0304718017578125, -0.025007247924804688, -0.019542694091796875, -0.014078140258789062, -0.00861358642578125, -0.0031490325927734375, 0.002315521240234375, 0.0077800750732421875, 0.01324462890625, 0.018709182739257812, 0.024173736572265625, 0.029638290405273438, 0.03510284423828125, 0.04056739807128906, 0.046031951904296875, 0.05149650573730469, 0.0569610595703125, 0.06242561340332031, 0.06789016723632812, 0.07335472106933594, 0.07881927490234375, 0.08428382873535156, 0.08974838256835938, 0.09521293640136719, 0.100677490234375, 0.10614204406738281, 0.11160659790039062, 0.11707115173339844, 0.12253570556640625, 0.12800025939941406, 0.13346481323242188, 0.1389293670654297, 0.1443939208984375, 0.1498584747314453, 0.15532302856445312, 0.16078758239746094, 0.16625213623046875, 0.17171669006347656, 0.17718124389648438, 0.1826457977294922, 0.1881103515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 7.0, 17.0, 22.0, 27.0, 23.0, 39.0, 46.0, 77.0, 106.0, 173.0, 269.0, 553.0, 1237.0, 605.0, 308.0, 172.0, 96.0, 81.0, 54.0, 39.0, 22.0, 13.0, 12.0, 10.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0699462890625, -0.0680837631225586, -0.06622123718261719, -0.06435871124267578, -0.062496185302734375, -0.06063365936279297, -0.05877113342285156, -0.056908607482910156, -0.05504608154296875, -0.053183555603027344, -0.05132102966308594, -0.04945850372314453, -0.047595977783203125, -0.04573345184326172, -0.04387092590332031, -0.042008399963378906, -0.0401458740234375, -0.038283348083496094, -0.03642082214355469, -0.03455829620361328, -0.032695770263671875, -0.03083324432373047, -0.028970718383789062, -0.027108192443847656, -0.02524566650390625, -0.023383140563964844, -0.021520614624023438, -0.01965808868408203, -0.017795562744140625, -0.01593303680419922, -0.014070510864257812, -0.012207984924316406, -0.010345458984375, -0.008482933044433594, -0.0066204071044921875, -0.004757881164550781, -0.002895355224609375, -0.0010328292846679688, 0.0008296966552734375, 0.0026922225952148438, 0.00455474853515625, 0.006417274475097656, 0.008279800415039062, 0.010142326354980469, 0.012004852294921875, 0.013867378234863281, 0.015729904174804688, 0.017592430114746094, 0.0194549560546875, 0.021317481994628906, 0.023180007934570312, 0.02504253387451172, 0.026905059814453125, 0.02876758575439453, 0.030630111694335938, 0.032492637634277344, 0.03435516357421875, 0.036217689514160156, 0.03808021545410156, 0.03994274139404297, 0.041805267333984375, 0.04366779327392578, 0.04553031921386719, 0.047392845153808594, 0.04925537109375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 8.0, 22.0, 44.0, 79.0, 177.0, 335.0, 214.0, 83.0, 22.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4162243604660034, -1.388873815536499, -1.361523151397705, -1.3341726064682007, -1.3068219423294067, -1.2794713973999023, -1.2521207332611084, -1.224770188331604, -1.1974196434020996, -1.1700690984725952, -1.1427184343338013, -1.1153678894042969, -1.088017225265503, -1.0606666803359985, -1.0333160161972046, -1.0059654712677002, -0.9786148071289062, -0.9512642025947571, -0.9239135980606079, -0.8965629935264587, -0.8692123889923096, -0.8418618440628052, -0.814511239528656, -0.7871606349945068, -0.7598100304603577, -0.7324594259262085, -0.7051088213920593, -0.6777582168579102, -0.6504076719284058, -0.6230570077896118, -0.5957064628601074, -0.5683558583259583, -0.5410052537918091, -0.5136546492576599, -0.48630404472351074, -0.45895346999168396, -0.4316028654575348, -0.4042522609233856, -0.37690168619155884, -0.34955108165740967, -0.3222004771232605, -0.29484987258911133, -0.26749926805496216, -0.24014869332313538, -0.2127980887889862, -0.18544748425483704, -0.15809689462184906, -0.13074630498886108, -0.10339570045471191, -0.07604510337114334, -0.04869450628757477, -0.021343909204006195, 0.006006687879562378, 0.03335729241371155, 0.060707882046699524, 0.0880584716796875, 0.11540907621383667, 0.14275968074798584, 0.17011027038097382, 0.1974608600139618, 0.22481146454811096, 0.25216206908226013, 0.2795126438140869, 0.3068632483482361, 0.33421385288238525]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 12.0, 17.0, 26.0, 37.0, 53.0, 65.0, 94.0, 93.0, 97.0, 87.0, 87.0, 96.0, 69.0, 52.0, 44.0, 24.0, 17.0, 13.0, 8.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6731529235839844, -0.6549403071403503, -0.6367277503013611, -0.618515133857727, -0.6003025770187378, -0.5820899605751038, -0.5638773441314697, -0.5456647872924805, -0.5274521708488464, -0.5092395544052124, -0.49102699756622314, -0.4728143811225891, -0.45460179448127747, -0.4363892078399658, -0.4181765913963318, -0.39996400475502014, -0.3817514181137085, -0.36353883147239685, -0.3453262448310852, -0.32711362838745117, -0.3089010417461395, -0.2906884551048279, -0.27247583866119385, -0.2542632520198822, -0.23605066537857056, -0.2178380787372589, -0.19962547719478607, -0.18141287565231323, -0.1632002890110016, -0.14498770236968994, -0.1267751008272171, -0.10856249928474426, -0.09034997224807739, -0.07213737815618515, -0.05392478406429291, -0.035712189972400665, -0.017499595880508423, 0.0007129982113838196, 0.018925592303276062, 0.0371381938457489, 0.05535078048706055, 0.07356337457895279, 0.09177596867084503, 0.10998856276273727, 0.12820115685462952, 0.14641374349594116, 0.164626345038414, 0.18283894658088684, 0.2010515332221985, 0.21926411986351013, 0.23747672140598297, 0.2556893229484558, 0.27390190958976746, 0.2921144962310791, 0.31032711267471313, 0.3285396993160248, 0.3467522859573364, 0.36496487259864807, 0.3831774592399597, 0.40139007568359375, 0.4196026623249054, 0.43781524896621704, 0.4560278654098511, 0.4742404520511627, 0.49245303869247437]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 7.0, 15.0, 11.0, 24.0, 33.0, 46.0, 59.0, 79.0, 120.0, 149.0, 247.0, 331.0, 445.0, 692.0, 1112.0, 1759.0, 3012.0, 5617.0, 11806.0, 29152.0, 277329.0, 645881.0, 40313.0, 14369.0, 6726.0, 3555.0, 1962.0, 1197.0, 777.0, 508.0, 351.0, 224.0, 196.0, 120.0, 90.0, 71.0, 48.0, 35.0, 18.0, 23.0, 8.0, 11.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2139892578125, -0.2077178955078125, -0.201446533203125, -0.1951751708984375, -0.18890380859375, -0.1826324462890625, -0.176361083984375, -0.1700897216796875, -0.163818359375, -0.1575469970703125, -0.151275634765625, -0.1450042724609375, -0.13873291015625, -0.1324615478515625, -0.126190185546875, -0.1199188232421875, -0.1136474609375, -0.1073760986328125, -0.101104736328125, -0.0948333740234375, -0.08856201171875, -0.0822906494140625, -0.076019287109375, -0.0697479248046875, -0.0634765625, -0.0572052001953125, -0.050933837890625, -0.0446624755859375, -0.03839111328125, -0.0321197509765625, -0.025848388671875, -0.0195770263671875, -0.0133056640625, -0.0070343017578125, -0.000762939453125, 0.0055084228515625, 0.01177978515625, 0.0180511474609375, 0.024322509765625, 0.0305938720703125, 0.036865234375, 0.0431365966796875, 0.049407958984375, 0.0556793212890625, 0.06195068359375, 0.0682220458984375, 0.074493408203125, 0.0807647705078125, 0.0870361328125, 0.0933074951171875, 0.099578857421875, 0.1058502197265625, 0.11212158203125, 0.1183929443359375, 0.124664306640625, 0.1309356689453125, 0.13720703125, 0.1434783935546875, 0.149749755859375, 0.1560211181640625, 0.16229248046875, 0.1685638427734375, 0.174835205078125, 0.1811065673828125, 0.1873779296875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 15.0, 8.0, 9.0, 13.0, 33.0, 80.0, 204.0, 288.0, 185.0, 76.0, 12.0, 12.0, 8.0, 9.0, 10.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03900146484375, -0.03779792785644531, -0.036594390869140625, -0.03539085388183594, -0.03418731689453125, -0.03298377990722656, -0.031780242919921875, -0.030576705932617188, -0.0293731689453125, -0.028169631958007812, -0.026966094970703125, -0.025762557983398438, -0.02455902099609375, -0.023355484008789062, -0.022151947021484375, -0.020948410034179688, -0.019744873046875, -0.018541336059570312, -0.017337799072265625, -0.016134262084960938, -0.01493072509765625, -0.013727188110351562, -0.012523651123046875, -0.011320114135742188, -0.0101165771484375, -0.008913040161132812, -0.007709503173828125, -0.0065059661865234375, -0.00530242919921875, -0.0040988922119140625, -0.002895355224609375, -0.0016918182373046875, -0.00048828125, 0.0007152557373046875, 0.001918792724609375, 0.0031223297119140625, 0.00432586669921875, 0.0055294036865234375, 0.006732940673828125, 0.007936477661132812, 0.0091400146484375, 0.010343551635742188, 0.011547088623046875, 0.012750625610351562, 0.01395416259765625, 0.015157699584960938, 0.016361236572265625, 0.017564773559570312, 0.018768310546875, 0.019971847534179688, 0.021175384521484375, 0.022378921508789062, 0.02358245849609375, 0.024785995483398438, 0.025989532470703125, 0.027193069458007812, 0.0283966064453125, 0.029600143432617188, 0.030803680419921875, 0.03200721740722656, 0.03321075439453125, 0.03441429138183594, 0.035617828369140625, 0.03682136535644531, 0.03802490234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 3.0, 6.0, 12.0, 17.0, 27.0, 44.0, 66.0, 116.0, 287.0, 865.0, 3944.0, 38319.0, 881467.0, 113981.0, 7272.0, 1283.0, 426.0, 172.0, 87.0, 53.0, 42.0, 18.0, 9.0, 8.0, 10.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.483154296875, -0.4662971496582031, -0.44944000244140625, -0.4325828552246094, -0.4157257080078125, -0.3988685607910156, -0.38201141357421875, -0.3651542663574219, -0.348297119140625, -0.3314399719238281, -0.31458282470703125, -0.2977256774902344, -0.2808685302734375, -0.2640113830566406, -0.24715423583984375, -0.23029708862304688, -0.21343994140625, -0.19658279418945312, -0.17972564697265625, -0.16286849975585938, -0.1460113525390625, -0.12915420532226562, -0.11229705810546875, -0.09543991088867188, -0.078582763671875, -0.061725616455078125, -0.04486846923828125, -0.028011322021484375, -0.0111541748046875, 0.005702972412109375, 0.02256011962890625, 0.039417266845703125, 0.0562744140625, 0.07313156127929688, 0.08998870849609375, 0.10684585571289062, 0.1237030029296875, 0.14056015014648438, 0.15741729736328125, 0.17427444458007812, 0.191131591796875, 0.20798873901367188, 0.22484588623046875, 0.24170303344726562, 0.2585601806640625, 0.2754173278808594, 0.29227447509765625, 0.3091316223144531, 0.32598876953125, 0.3428459167480469, 0.35970306396484375, 0.3765602111816406, 0.3934173583984375, 0.4102745056152344, 0.42713165283203125, 0.4439888000488281, 0.460845947265625, 0.4777030944824219, 0.49456024169921875, 0.5114173889160156, 0.5282745361328125, 0.5451316833496094, 0.5619888305664062, 0.5788459777832031, 0.595703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 5.0, 13.0, 9.0, 6.0, 14.0, 15.0, 22.0, 28.0, 30.0, 27.0, 32.0, 24.0, 36.0, 36.0, 35.0, 40.0, 44.0, 48.0, 43.0, 47.0, 45.0, 45.0, 34.0, 27.0, 35.0, 41.0, 31.0, 20.0, 23.0, 21.0, 23.0, 12.0, 13.0, 19.0, 10.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.143310546875, -0.13879013061523438, -0.13426971435546875, -0.12974929809570312, -0.1252288818359375, -0.12070846557617188, -0.11618804931640625, -0.11166763305664062, -0.107147216796875, -0.10262680053710938, -0.09810638427734375, -0.09358596801757812, -0.0890655517578125, -0.08454513549804688, -0.08002471923828125, -0.07550430297851562, -0.07098388671875, -0.06646347045898438, -0.06194305419921875, -0.057422637939453125, -0.0529022216796875, -0.048381805419921875, -0.04386138916015625, -0.039340972900390625, -0.034820556640625, -0.030300140380859375, -0.02577972412109375, -0.021259307861328125, -0.0167388916015625, -0.012218475341796875, -0.00769805908203125, -0.003177642822265625, 0.0013427734375, 0.005863189697265625, 0.01038360595703125, 0.014904022216796875, 0.0194244384765625, 0.023944854736328125, 0.02846527099609375, 0.032985687255859375, 0.037506103515625, 0.042026519775390625, 0.04654693603515625, 0.051067352294921875, 0.0555877685546875, 0.060108184814453125, 0.06462860107421875, 0.06914901733398438, 0.07366943359375, 0.07818984985351562, 0.08271026611328125, 0.08723068237304688, 0.0917510986328125, 0.09627151489257812, 0.10079193115234375, 0.10531234741210938, 0.109832763671875, 0.11435317993164062, 0.11887359619140625, 0.12339401245117188, 0.1279144287109375, 0.13243484497070312, 0.13695526123046875, 0.14147567749023438, 0.14599609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 15.0, 21.0, 23.0, 17.0, 46.0, 54.0, 105.0, 185.0, 282.0, 524.0, 1138.0, 2787.0, 10020.0, 177834.0, 828231.0, 20120.0, 4044.0, 1464.0, 700.0, 361.0, 215.0, 116.0, 89.0, 41.0, 27.0, 18.0, 17.0, 10.0, 14.0, 7.0, 5.0, 4.0, 7.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4850730895996094, -0.47087860107421875, -0.4566841125488281, -0.4424896240234375, -0.4282951354980469, -0.41410064697265625, -0.3999061584472656, -0.385711669921875, -0.3715171813964844, -0.35732269287109375, -0.3431282043457031, -0.3289337158203125, -0.3147392272949219, -0.30054473876953125, -0.2863502502441406, -0.27215576171875, -0.2579612731933594, -0.24376678466796875, -0.22957229614257812, -0.2153778076171875, -0.20118331909179688, -0.18698883056640625, -0.17279434204101562, -0.158599853515625, -0.14440536499023438, -0.13021087646484375, -0.11601638793945312, -0.1018218994140625, -0.08762741088867188, -0.07343292236328125, -0.059238433837890625, -0.0450439453125, -0.030849456787109375, -0.01665496826171875, -0.002460479736328125, 0.0117340087890625, 0.025928497314453125, 0.04012298583984375, 0.054317474365234375, 0.068511962890625, 0.08270645141601562, 0.09690093994140625, 0.11109542846679688, 0.1252899169921875, 0.13948440551757812, 0.15367889404296875, 0.16787338256835938, 0.18206787109375, 0.19626235961914062, 0.21045684814453125, 0.22465133666992188, 0.2388458251953125, 0.2530403137207031, 0.26723480224609375, 0.2814292907714844, 0.295623779296875, 0.3098182678222656, 0.32401275634765625, 0.3382072448730469, 0.3524017333984375, 0.3665962219238281, 0.38079071044921875, 0.3949851989746094, 0.4091796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 6.0, 4.0, 13.0, 10.0, 10.0, 17.0, 18.0, 26.0, 32.0, 48.0, 51.0, 90.0, 112.0, 72.0, 109.0, 74.0, 69.0, 57.0, 45.0, 29.0, 22.0, 21.0, 17.0, 10.0, 7.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1517276763916016e-05, -2.0821578800678253e-05, -2.012588083744049e-05, -1.9430182874202728e-05, -1.8734484910964966e-05, -1.8038786947727203e-05, -1.734308898448944e-05, -1.664739102125168e-05, -1.5951693058013916e-05, -1.5255995094776154e-05, -1.4560297131538391e-05, -1.3864599168300629e-05, -1.3168901205062866e-05, -1.2473203241825104e-05, -1.1777505278587341e-05, -1.1081807315349579e-05, -1.0386109352111816e-05, -9.690411388874054e-06, -8.994713425636292e-06, -8.299015462398529e-06, -7.603317499160767e-06, -6.907619535923004e-06, -6.211921572685242e-06, -5.516223609447479e-06, -4.820525646209717e-06, -4.124827682971954e-06, -3.429129719734192e-06, -2.7334317564964294e-06, -2.037733793258667e-06, -1.3420358300209045e-06, -6.463378667831421e-07, 4.936009645462036e-08, 7.450580596923828e-07, 1.4407560229301453e-06, 2.1364539861679077e-06, 2.83215194940567e-06, 3.5278499126434326e-06, 4.223547875881195e-06, 4.9192458391189575e-06, 5.61494380235672e-06, 6.310641765594482e-06, 7.006339728832245e-06, 7.702037692070007e-06, 8.39773565530777e-06, 9.093433618545532e-06, 9.789131581783295e-06, 1.0484829545021057e-05, 1.118052750825882e-05, 1.1876225471496582e-05, 1.2571923434734344e-05, 1.3267621397972107e-05, 1.396331936120987e-05, 1.4659017324447632e-05, 1.5354715287685394e-05, 1.6050413250923157e-05, 1.674611121416092e-05, 1.744180917739868e-05, 1.8137507140636444e-05, 1.8833205103874207e-05, 1.952890306711197e-05, 2.022460103034973e-05, 2.0920298993587494e-05, 2.1615996956825256e-05, 2.231169492006302e-05, 2.300739288330078e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 4.0, 2.0, 8.0, 14.0, 15.0, 16.0, 18.0, 24.0, 33.0, 49.0, 39.0, 85.0, 87.0, 145.0, 225.0, 291.0, 460.0, 666.0, 1163.0, 1932.0, 3266.0, 6414.0, 13741.0, 35500.0, 120110.0, 513000.0, 250222.0, 59656.0, 20930.0, 9142.0, 4615.0, 2451.0, 1441.0, 939.0, 555.0, 394.0, 255.0, 174.0, 139.0, 89.0, 71.0, 43.0, 34.0, 27.0, 21.0, 12.0, 12.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.17529296875, -0.17038726806640625, -0.1654815673828125, -0.16057586669921875, -0.155670166015625, -0.15076446533203125, -0.1458587646484375, -0.14095306396484375, -0.13604736328125, -0.13114166259765625, -0.1262359619140625, -0.12133026123046875, -0.116424560546875, -0.11151885986328125, -0.1066131591796875, -0.10170745849609375, -0.0968017578125, -0.09189605712890625, -0.0869903564453125, -0.08208465576171875, -0.077178955078125, -0.07227325439453125, -0.0673675537109375, -0.06246185302734375, -0.05755615234375, -0.05265045166015625, -0.0477447509765625, -0.04283905029296875, -0.037933349609375, -0.03302764892578125, -0.0281219482421875, -0.02321624755859375, -0.018310546875, -0.01340484619140625, -0.0084991455078125, -0.00359344482421875, 0.001312255859375, 0.00621795654296875, 0.0111236572265625, 0.01602935791015625, 0.02093505859375, 0.02584075927734375, 0.0307464599609375, 0.03565216064453125, 0.040557861328125, 0.04546356201171875, 0.0503692626953125, 0.05527496337890625, 0.0601806640625, 0.06508636474609375, 0.0699920654296875, 0.07489776611328125, 0.079803466796875, 0.08470916748046875, 0.0896148681640625, 0.09452056884765625, 0.09942626953125, 0.10433197021484375, 0.1092376708984375, 0.11414337158203125, 0.119049072265625, 0.12395477294921875, 0.1288604736328125, 0.13376617431640625, 0.138671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 8.0, 10.0, 9.0, 8.0, 15.0, 25.0, 23.0, 25.0, 47.0, 48.0, 57.0, 79.0, 90.0, 81.0, 83.0, 69.0, 64.0, 55.0, 35.0, 38.0, 25.0, 20.0, 11.0, 18.0, 15.0, 6.0, 10.0, 3.0, 4.0, 4.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1342315673828125, -0.128570556640625, -0.1229095458984375, -0.11724853515625, -0.1115875244140625, -0.105926513671875, -0.1002655029296875, -0.0946044921875, -0.0889434814453125, -0.083282470703125, -0.0776214599609375, -0.07196044921875, -0.0662994384765625, -0.060638427734375, -0.0549774169921875, -0.04931640625, -0.0436553955078125, -0.037994384765625, -0.0323333740234375, -0.02667236328125, -0.0210113525390625, -0.015350341796875, -0.0096893310546875, -0.0040283203125, 0.0016326904296875, 0.007293701171875, 0.0129547119140625, 0.01861572265625, 0.0242767333984375, 0.029937744140625, 0.0355987548828125, 0.041259765625, 0.0469207763671875, 0.052581787109375, 0.0582427978515625, 0.06390380859375, 0.0695648193359375, 0.075225830078125, 0.0808868408203125, 0.0865478515625, 0.0922088623046875, 0.097869873046875, 0.1035308837890625, 0.10919189453125, 0.1148529052734375, 0.120513916015625, 0.1261749267578125, 0.1318359375, 0.1374969482421875, 0.143157958984375, 0.1488189697265625, 0.15447998046875, 0.1601409912109375, 0.165802001953125, 0.1714630126953125, 0.1771240234375, 0.1827850341796875, 0.188446044921875, 0.1941070556640625, 0.19976806640625, 0.2054290771484375, 0.211090087890625, 0.2167510986328125, 0.222412109375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 11.0, 25.0, 37.0, 86.0, 296.0, 399.0, 91.0, 26.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4275641441345215, -3.30173921585083, -3.1759145259857178, -3.0500898361206055, -2.924264907836914, -2.7984399795532227, -2.6726152896881104, -2.546790599822998, -2.4209656715393066, -2.2951407432556152, -2.169316053390503, -2.0434913635253906, -1.9176664352416992, -1.7918416261672974, -1.6660168170928955, -1.5401920080184937, -1.4143671989440918, -1.28854238986969, -1.162717580795288, -1.0368927717208862, -0.9110679626464844, -0.7852431535720825, -0.6594183444976807, -0.5335935354232788, -0.40776872634887695, -0.2819439172744751, -0.15611910820007324, -0.030294299125671387, 0.09553050994873047, 0.22135531902313232, 0.3471801280975342, 0.47300493717193604, 0.5988302230834961, 0.724655032157898, 0.8504798412322998, 0.9763046503067017, 1.1021294593811035, 1.2279542684555054, 1.3537790775299072, 1.479603886604309, 1.605428695678711, 1.7312535047531128, 1.8570783138275146, 1.9829031229019165, 2.1087279319763184, 2.2345528602600098, 2.360377550125122, 2.4862022399902344, 2.612027168273926, 2.737852096557617, 2.8636767864227295, 2.989501476287842, 3.115326404571533, 3.2411513328552246, 3.366976022720337, 3.492800712585449, 3.6186256408691406, 3.744450569152832, 3.8702752590179443, 3.9960999488830566, 4.121924877166748, 4.2477498054504395, 4.373574256896973, 4.499399185180664, 4.6252241134643555]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 7.0, 7.0, 14.0, 15.0, 39.0, 56.0, 81.0, 120.0, 139.0, 139.0, 119.0, 73.0, 48.0, 36.0, 18.0, 17.0, 11.0, 12.0, 5.0, 2.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4463467597961426, -2.3524675369262695, -2.2585883140563965, -2.1647090911865234, -2.0708298683166504, -1.9769506454467773, -1.8830714225769043, -1.7891921997070312, -1.6953129768371582, -1.6014337539672852, -1.507554531097412, -1.413675308227539, -1.319796085357666, -1.225916862487793, -1.13203763961792, -1.0381584167480469, -0.9442793130874634, -0.8504000902175903, -0.7565208673477173, -0.6626416444778442, -0.5687624216079712, -0.47488322854042053, -0.3810040354728699, -0.2871248126029968, -0.19324558973312378, -0.09936637431383133, -0.005487158894538879, 0.08839204907417297, 0.18227127194404602, 0.27615049481391907, 0.3700296878814697, 0.4639089107513428, 0.5577881336212158, 0.6516673564910889, 0.7455465793609619, 0.839425802230835, 0.933305025100708, 1.027184247970581, 1.121063470840454, 1.2149426937103271, 1.3088219165802002, 1.4027011394500732, 1.4965803623199463, 1.5904595851898193, 1.6843388080596924, 1.7782180309295654, 1.8720972537994385, 1.9659764766693115, 2.0598554611206055, 2.1537346839904785, 2.2476139068603516, 2.3414931297302246, 2.4353723526000977, 2.5292515754699707, 2.6231307983398438, 2.717010021209717, 2.81088924407959, 2.904768466949463, 2.998647689819336, 3.092526912689209, 3.186406135559082, 3.280285358428955, 3.374164581298828, 3.468043804168701, 3.561923027038574]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 5.0, 13.0, 9.0, 7.0, 16.0, 14.0, 25.0, 36.0, 57.0, 176.0, 989.0, 19669.0, 4145720.0, 25608.0, 1476.0, 233.0, 81.0, 33.0, 20.0, 20.0, 14.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.173828125, -2.107025146484375, -2.04022216796875, -1.973419189453125, -1.9066162109375, -1.839813232421875, -1.77301025390625, -1.706207275390625, -1.639404296875, -1.572601318359375, -1.50579833984375, -1.438995361328125, -1.3721923828125, -1.305389404296875, -1.23858642578125, -1.171783447265625, -1.10498046875, -1.038177490234375, -0.97137451171875, -0.904571533203125, -0.8377685546875, -0.770965576171875, -0.70416259765625, -0.637359619140625, -0.570556640625, -0.503753662109375, -0.43695068359375, -0.370147705078125, -0.3033447265625, -0.236541748046875, -0.16973876953125, -0.102935791015625, -0.0361328125, 0.030670166015625, 0.09747314453125, 0.164276123046875, 0.2310791015625, 0.297882080078125, 0.36468505859375, 0.431488037109375, 0.498291015625, 0.565093994140625, 0.63189697265625, 0.698699951171875, 0.7655029296875, 0.832305908203125, 0.89910888671875, 0.965911865234375, 1.03271484375, 1.099517822265625, 1.16632080078125, 1.233123779296875, 1.2999267578125, 1.366729736328125, 1.43353271484375, 1.500335693359375, 1.567138671875, 1.633941650390625, 1.70074462890625, 1.767547607421875, 1.8343505859375, 1.901153564453125, 1.96795654296875, 2.034759521484375, 2.1015625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 8.0, 12.0, 15.0, 21.0, 28.0, 60.0, 85.0, 132.0, 140.0, 160.0, 122.0, 72.0, 35.0, 25.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 6.0, 2.0, 5.0, 2.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228729248046875, -0.02195572853088379, -0.021038532257080078, -0.020121335983276367, -0.019204139709472656, -0.018286943435668945, -0.017369747161865234, -0.016452550888061523, -0.015535354614257812, -0.014618158340454102, -0.01370096206665039, -0.01278376579284668, -0.011866569519042969, -0.010949373245239258, -0.010032176971435547, -0.009114980697631836, -0.008197784423828125, -0.007280588150024414, -0.006363391876220703, -0.005446195602416992, -0.004528999328613281, -0.0036118030548095703, -0.0026946067810058594, -0.0017774105072021484, -0.0008602142333984375, 5.698204040527344e-05, 0.0009741783142089844, 0.0018913745880126953, 0.0028085708618164062, 0.003725767135620117, 0.004642963409423828, 0.005560159683227539, 0.00647735595703125, 0.007394552230834961, 0.008311748504638672, 0.009228944778442383, 0.010146141052246094, 0.011063337326049805, 0.011980533599853516, 0.012897729873657227, 0.013814926147460938, 0.014732122421264648, 0.01564931869506836, 0.01656651496887207, 0.01748371124267578, 0.018400907516479492, 0.019318103790283203, 0.020235300064086914, 0.021152496337890625, 0.022069692611694336, 0.022986888885498047, 0.023904085159301758, 0.02482128143310547, 0.02573847770690918, 0.02665567398071289, 0.0275728702545166, 0.028490066528320312, 0.029407262802124023, 0.030324459075927734, 0.031241655349731445, 0.032158851623535156, 0.03307604789733887, 0.03399324417114258, 0.03491044044494629, 0.03582763671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 6.0, 30.0, 61.0, 246.0, 919.0, 6290.0, 277269.0, 3891578.0, 15369.0, 1649.0, 464.0, 175.0, 93.0, 48.0, 39.0, 22.0, 14.0, 6.0, 5.0, 7.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.316650390625, -0.2855033874511719, -0.25435638427734375, -0.22320938110351562, -0.1920623779296875, -0.16091537475585938, -0.12976837158203125, -0.09862136840820312, -0.067474365234375, -0.036327362060546875, -0.00518035888671875, 0.025966644287109375, 0.0571136474609375, 0.08826065063476562, 0.11940765380859375, 0.15055465698242188, 0.18170166015625, 0.21284866333007812, 0.24399566650390625, 0.2751426696777344, 0.3062896728515625, 0.3374366760253906, 0.36858367919921875, 0.3997306823730469, 0.430877685546875, 0.4620246887207031, 0.49317169189453125, 0.5243186950683594, 0.5554656982421875, 0.5866127014160156, 0.6177597045898438, 0.6489067077636719, 0.6800537109375, 0.7112007141113281, 0.7423477172851562, 0.7734947204589844, 0.8046417236328125, 0.8357887268066406, 0.8669357299804688, 0.8980827331542969, 0.929229736328125, 0.9603767395019531, 0.9915237426757812, 1.0226707458496094, 1.0538177490234375, 1.0849647521972656, 1.1161117553710938, 1.1472587585449219, 1.17840576171875, 1.2095527648925781, 1.2406997680664062, 1.2718467712402344, 1.3029937744140625, 1.3341407775878906, 1.3652877807617188, 1.3964347839355469, 1.427581787109375, 1.4587287902832031, 1.4898757934570312, 1.5210227966308594, 1.5521697998046875, 1.5833168029785156, 1.6144638061523438, 1.6456108093261719, 1.6767578125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 10.0, 3.0, 3.0, 9.0, 17.0, 14.0, 13.0, 15.0, 26.0, 48.0, 75.0, 173.0, 437.0, 1499.0, 953.0, 344.0, 152.0, 76.0, 61.0, 35.0, 22.0, 17.0, 16.0, 8.0, 4.0, 5.0, 7.0, 8.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04608154296875, -0.04467201232910156, -0.043262481689453125, -0.04185295104980469, -0.04044342041015625, -0.03903388977050781, -0.037624359130859375, -0.03621482849121094, -0.0348052978515625, -0.03339576721191406, -0.031986236572265625, -0.030576705932617188, -0.02916717529296875, -0.027757644653320312, -0.026348114013671875, -0.024938583374023438, -0.023529052734375, -0.022119522094726562, -0.020709991455078125, -0.019300460815429688, -0.01789093017578125, -0.016481399536132812, -0.015071868896484375, -0.013662338256835938, -0.0122528076171875, -0.010843276977539062, -0.009433746337890625, -0.008024215698242188, -0.00661468505859375, -0.0052051544189453125, -0.003795623779296875, -0.0023860931396484375, -0.0009765625, 0.0004329681396484375, 0.001842498779296875, 0.0032520294189453125, 0.00466156005859375, 0.0060710906982421875, 0.007480621337890625, 0.008890151977539062, 0.0102996826171875, 0.011709213256835938, 0.013118743896484375, 0.014528274536132812, 0.01593780517578125, 0.017347335815429688, 0.018756866455078125, 0.020166397094726562, 0.021575927734375, 0.022985458374023438, 0.024394989013671875, 0.025804519653320312, 0.02721405029296875, 0.028623580932617188, 0.030033111572265625, 0.03144264221191406, 0.0328521728515625, 0.03426170349121094, 0.035671234130859375, 0.03708076477050781, 0.03849029541015625, 0.03989982604980469, 0.041309356689453125, 0.04271888732910156, 0.04412841796875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 454.0, 497.0, 43.0, 12.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39107492566108704, -0.2905176877975464, -0.18996047973632812, -0.08940324187278748, 0.011153966188430786, 0.11171117424964905, 0.21226844191551208, 0.31282564997673035, 0.4133828580379486, 0.5139400959014893, 0.6144973039627075, 0.7150545120239258, 0.815611720085144, 0.9161689281463623, 1.0167262554168701, 1.1172834634780884, 1.2178406715393066, 1.318397879600525, 1.4189550876617432, 1.519512414932251, 1.6200695037841797, 1.7206268310546875, 1.8211840391159058, 1.921741247177124, 2.0222983360290527, 2.1228556632995605, 2.2234127521514893, 2.323970079421997, 2.424527168273926, 2.5250844955444336, 2.6256418228149414, 2.72619891166687, 2.826756000518799, 2.9273133277893066, 3.0278704166412354, 3.128427743911743, 3.228984832763672, 3.3295421600341797, 3.4300994873046875, 3.530656576156616, 3.631213665008545, 3.7317709922790527, 3.8323280811309814, 3.9328854084014893, 4.033442497253418, 4.133999824523926, 4.234557151794434, 4.335114479064941, 4.435671806335449, 4.536229133605957, 4.636786460876465, 4.7373433113098145, 4.837900638580322, 4.93845796585083, 5.039015293121338, 5.1395721435546875, 5.240129470825195, 5.340686798095703, 5.441244125366211, 5.5418009757995605, 5.642358303070068, 5.742915630340576, 5.843472957611084, 5.944029808044434, 6.044587135314941]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 15.0, 17.0, 18.0, 18.0, 31.0, 29.0, 44.0, 46.0, 53.0, 71.0, 57.0, 81.0, 85.0, 53.0, 57.0, 63.0, 52.0, 33.0, 32.0, 21.0, 25.0, 15.0, 12.0, 11.0, 10.0, 10.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3589369058609009, -0.3487369418144226, -0.33853697776794434, -0.3283369839191437, -0.3181370198726654, -0.30793705582618713, -0.29773709177970886, -0.2875371277332306, -0.27733713388442993, -0.26713716983795166, -0.2569372057914734, -0.24673722684383392, -0.23653724789619446, -0.2263372838497162, -0.21613731980323792, -0.20593735575675964, -0.19573739171028137, -0.1855374276638031, -0.17533744871616364, -0.16513748466968536, -0.1549375057220459, -0.14473754167556763, -0.13453757762908936, -0.12433760613203049, -0.11413763463497162, -0.10393766313791275, -0.09373769164085388, -0.08353772759437561, -0.07333775609731674, -0.06313778460025787, -0.052937816828489304, -0.042737849056720734, -0.032537877559661865, -0.022337907925248146, -0.012137938290834427, -0.0019379686564207077, 0.008262000977993011, 0.01846197247505188, 0.02866194024682045, 0.03886190801858902, 0.04906187951564789, 0.05926185101270676, 0.06946182250976562, 0.0796617865562439, 0.08986175805330276, 0.10006172955036163, 0.1102616935968399, 0.12046166509389877, 0.13066163659095764, 0.1408616006374359, 0.15106157958507538, 0.16126154363155365, 0.17146152257919312, 0.1816614866256714, 0.19186145067214966, 0.20206141471862793, 0.2122613936662674, 0.22246135771274567, 0.23266133666038513, 0.2428613007068634, 0.2530612647533417, 0.26326125860214233, 0.2734612226486206, 0.2836611866950989, 0.29386115074157715]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 19.0, 19.0, 25.0, 57.0, 60.0, 107.0, 163.0, 240.0, 375.0, 593.0, 959.0, 1631.0, 2619.0, 4768.0, 9097.0, 20058.0, 54205.0, 205515.0, 508677.0, 158629.0, 44866.0, 17134.0, 8070.0, 4320.0, 2432.0, 1450.0, 852.0, 543.0, 363.0, 248.0, 161.0, 93.0, 61.0, 42.0, 24.0, 19.0, 13.0, 10.0, 7.0, 14.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1304931640625, -0.12605667114257812, -0.12162017822265625, -0.11718368530273438, -0.1127471923828125, -0.10831069946289062, -0.10387420654296875, -0.09943771362304688, -0.095001220703125, -0.09056472778320312, -0.08612823486328125, -0.08169174194335938, -0.0772552490234375, -0.07281875610351562, -0.06838226318359375, -0.06394577026367188, -0.05950927734375, -0.055072784423828125, -0.05063629150390625, -0.046199798583984375, -0.0417633056640625, -0.037326812744140625, -0.03289031982421875, -0.028453826904296875, -0.024017333984375, -0.019580841064453125, -0.01514434814453125, -0.010707855224609375, -0.0062713623046875, -0.001834869384765625, 0.00260162353515625, 0.007038116455078125, 0.011474609375, 0.015911102294921875, 0.02034759521484375, 0.024784088134765625, 0.0292205810546875, 0.033657073974609375, 0.03809356689453125, 0.042530059814453125, 0.046966552734375, 0.051403045654296875, 0.05583953857421875, 0.060276031494140625, 0.0647125244140625, 0.06914901733398438, 0.07358551025390625, 0.07802200317382812, 0.08245849609375, 0.08689498901367188, 0.09133148193359375, 0.09576797485351562, 0.1002044677734375, 0.10464096069335938, 0.10907745361328125, 0.11351394653320312, 0.117950439453125, 0.12238693237304688, 0.12682342529296875, 0.13125991821289062, 0.1356964111328125, 0.14013290405273438, 0.14456939697265625, 0.14900588989257812, 0.1534423828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 9.0, 6.0, 8.0, 12.0, 25.0, 32.0, 45.0, 62.0, 56.0, 78.0, 81.0, 86.0, 92.0, 72.0, 63.0, 58.0, 48.0, 37.0, 22.0, 23.0, 13.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.016754150390625, -0.016226768493652344, -0.015699386596679688, -0.015172004699707031, -0.014644622802734375, -0.014117240905761719, -0.013589859008789062, -0.013062477111816406, -0.01253509521484375, -0.012007713317871094, -0.011480331420898438, -0.010952949523925781, -0.010425567626953125, -0.009898185729980469, -0.009370803833007812, -0.008843421936035156, -0.0083160400390625, -0.007788658142089844, -0.0072612762451171875, -0.006733894348144531, -0.006206512451171875, -0.005679130554199219, -0.0051517486572265625, -0.004624366760253906, -0.00409698486328125, -0.0035696029663085938, -0.0030422210693359375, -0.0025148391723632812, -0.001987457275390625, -0.0014600753784179688, -0.0009326934814453125, -0.00040531158447265625, 0.0001220703125, 0.0006494522094726562, 0.0011768341064453125, 0.0017042160034179688, 0.002231597900390625, 0.0027589797973632812, 0.0032863616943359375, 0.0038137435913085938, 0.00434112548828125, 0.004868507385253906, 0.0053958892822265625, 0.005923271179199219, 0.006450653076171875, 0.006978034973144531, 0.0075054168701171875, 0.008032798767089844, 0.0085601806640625, 0.009087562561035156, 0.009614944458007812, 0.010142326354980469, 0.010669708251953125, 0.011197090148925781, 0.011724472045898438, 0.012251853942871094, 0.01277923583984375, 0.013306617736816406, 0.013833999633789062, 0.014361381530761719, 0.014888763427734375, 0.015416145324707031, 0.015943527221679688, 0.016470909118652344, 0.016998291015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 6.0, 2.0, 1.0, 7.0, 9.0, 13.0, 29.0, 126.0, 1434.0, 48227.0, 951374.0, 45702.0, 1374.0, 133.0, 30.0, 13.0, 8.0, 5.0, 7.0, 6.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.67041015625, -0.65203857421875, -0.6336669921875, -0.61529541015625, -0.596923828125, -0.57855224609375, -0.5601806640625, -0.54180908203125, -0.5234375, -0.50506591796875, -0.4866943359375, -0.46832275390625, -0.449951171875, -0.43157958984375, -0.4132080078125, -0.39483642578125, -0.37646484375, -0.35809326171875, -0.3397216796875, -0.32135009765625, -0.302978515625, -0.28460693359375, -0.2662353515625, -0.24786376953125, -0.2294921875, -0.21112060546875, -0.1927490234375, -0.17437744140625, -0.156005859375, -0.13763427734375, -0.1192626953125, -0.10089111328125, -0.08251953125, -0.06414794921875, -0.0457763671875, -0.02740478515625, -0.009033203125, 0.00933837890625, 0.0277099609375, 0.04608154296875, 0.064453125, 0.08282470703125, 0.1011962890625, 0.11956787109375, 0.137939453125, 0.15631103515625, 0.1746826171875, 0.19305419921875, 0.21142578125, 0.22979736328125, 0.2481689453125, 0.26654052734375, 0.284912109375, 0.30328369140625, 0.3216552734375, 0.34002685546875, 0.3583984375, 0.37677001953125, 0.3951416015625, 0.41351318359375, 0.431884765625, 0.45025634765625, 0.4686279296875, 0.48699951171875, 0.50537109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 9.0, 5.0, 6.0, 17.0, 15.0, 16.0, 17.0, 22.0, 15.0, 24.0, 30.0, 25.0, 28.0, 28.0, 33.0, 35.0, 36.0, 40.0, 47.0, 39.0, 48.0, 49.0, 44.0, 44.0, 43.0, 27.0, 38.0, 28.0, 27.0, 20.0, 19.0, 15.0, 17.0, 11.0, 15.0, 14.0, 5.0, 6.0, 6.0, 11.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07659912109375, -0.07422637939453125, -0.0718536376953125, -0.06948089599609375, -0.067108154296875, -0.06473541259765625, -0.0623626708984375, -0.05998992919921875, -0.0576171875, -0.05524444580078125, -0.0528717041015625, -0.05049896240234375, -0.048126220703125, -0.04575347900390625, -0.0433807373046875, -0.04100799560546875, -0.03863525390625, -0.03626251220703125, -0.0338897705078125, -0.03151702880859375, -0.029144287109375, -0.02677154541015625, -0.0243988037109375, -0.02202606201171875, -0.0196533203125, -0.01728057861328125, -0.0149078369140625, -0.01253509521484375, -0.010162353515625, -0.00778961181640625, -0.0054168701171875, -0.00304412841796875, -0.00067138671875, 0.00170135498046875, 0.0040740966796875, 0.00644683837890625, 0.008819580078125, 0.01119232177734375, 0.0135650634765625, 0.01593780517578125, 0.018310546875, 0.02068328857421875, 0.0230560302734375, 0.02542877197265625, 0.027801513671875, 0.03017425537109375, 0.0325469970703125, 0.03491973876953125, 0.03729248046875, 0.03966522216796875, 0.0420379638671875, 0.04441070556640625, 0.046783447265625, 0.04915618896484375, 0.0515289306640625, 0.05390167236328125, 0.0562744140625, 0.05864715576171875, 0.0610198974609375, 0.06339263916015625, 0.065765380859375, 0.06813812255859375, 0.0705108642578125, 0.07288360595703125, 0.07525634765625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 11.0, 26.0, 129.0, 1130.0, 1043186.0, 3757.0, 227.0, 58.0, 12.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.233642578125, -4.10400390625, -3.974365234375, -3.8447265625, -3.715087890625, -3.58544921875, -3.455810546875, -3.326171875, -3.196533203125, -3.06689453125, -2.937255859375, -2.8076171875, -2.677978515625, -2.54833984375, -2.418701171875, -2.2890625, -2.159423828125, -2.02978515625, -1.900146484375, -1.7705078125, -1.640869140625, -1.51123046875, -1.381591796875, -1.251953125, -1.122314453125, -0.99267578125, -0.863037109375, -0.7333984375, -0.603759765625, -0.47412109375, -0.344482421875, -0.21484375, -0.085205078125, 0.04443359375, 0.174072265625, 0.3037109375, 0.433349609375, 0.56298828125, 0.692626953125, 0.822265625, 0.951904296875, 1.08154296875, 1.211181640625, 1.3408203125, 1.470458984375, 1.60009765625, 1.729736328125, 1.859375, 1.989013671875, 2.11865234375, 2.248291015625, 2.3779296875, 2.507568359375, 2.63720703125, 2.766845703125, 2.896484375, 3.026123046875, 3.15576171875, 3.285400390625, 3.4150390625, 3.544677734375, 3.67431640625, 3.803955078125, 3.93359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 7.0, 6.0, 16.0, 15.0, 26.0, 31.0, 48.0, 114.0, 178.0, 206.0, 143.0, 67.0, 48.0, 25.0, 14.0, 21.0, 7.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46574592590332e-05, -5.194917321205139e-05, -4.924088716506958e-05, -4.653260111808777e-05, -4.382431507110596e-05, -4.1116029024124146e-05, -3.8407742977142334e-05, -3.569945693016052e-05, -3.299117088317871e-05, -3.02828848361969e-05, -2.7574598789215088e-05, -2.4866312742233276e-05, -2.2158026695251465e-05, -1.9449740648269653e-05, -1.6741454601287842e-05, -1.403316855430603e-05, -1.1324882507324219e-05, -8.616596460342407e-06, -5.908310413360596e-06, -3.200024366378784e-06, -4.917383193969727e-07, 2.216547727584839e-06, 4.92483377456665e-06, 7.633119821548462e-06, 1.0341405868530273e-05, 1.3049691915512085e-05, 1.5757977962493896e-05, 1.8466264009475708e-05, 2.117455005645752e-05, 2.388283610343933e-05, 2.6591122150421143e-05, 2.9299408197402954e-05, 3.2007694244384766e-05, 3.471598029136658e-05, 3.742426633834839e-05, 4.01325523853302e-05, 4.284083843231201e-05, 4.554912447929382e-05, 4.8257410526275635e-05, 5.0965696573257446e-05, 5.367398262023926e-05, 5.638226866722107e-05, 5.909055471420288e-05, 6.179884076118469e-05, 6.45071268081665e-05, 6.721541285514832e-05, 6.992369890213013e-05, 7.263198494911194e-05, 7.534027099609375e-05, 7.804855704307556e-05, 8.075684309005737e-05, 8.346512913703918e-05, 8.6173415184021e-05, 8.888170123100281e-05, 9.158998727798462e-05, 9.429827332496643e-05, 9.700655937194824e-05, 9.971484541893005e-05, 0.00010242313146591187, 0.00010513141751289368, 0.00010783970355987549, 0.0001105479896068573, 0.00011325627565383911, 0.00011596456170082092, 0.00011867284774780273]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 1.0, 12.0, 12.0, 25.0, 23.0, 40.0, 57.0, 84.0, 135.0, 284.0, 678.0, 1912.0, 7049.0, 122242.0, 889388.0, 20838.0, 3669.0, 1115.0, 427.0, 207.0, 106.0, 69.0, 48.0, 29.0, 27.0, 13.0, 11.0, 11.0, 15.0, 4.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.432861328125, -0.4163856506347656, -0.39990997314453125, -0.3834342956542969, -0.3669586181640625, -0.3504829406738281, -0.33400726318359375, -0.3175315856933594, -0.301055908203125, -0.2845802307128906, -0.26810455322265625, -0.2516288757324219, -0.2351531982421875, -0.21867752075195312, -0.20220184326171875, -0.18572616577148438, -0.16925048828125, -0.15277481079101562, -0.13629913330078125, -0.11982345581054688, -0.1033477783203125, -0.08687210083007812, -0.07039642333984375, -0.053920745849609375, -0.037445068359375, -0.020969390869140625, -0.00449371337890625, 0.011981964111328125, 0.0284576416015625, 0.044933319091796875, 0.06140899658203125, 0.07788467407226562, 0.0943603515625, 0.11083602905273438, 0.12731170654296875, 0.14378738403320312, 0.1602630615234375, 0.17673873901367188, 0.19321441650390625, 0.20969009399414062, 0.226165771484375, 0.24264144897460938, 0.25911712646484375, 0.2755928039550781, 0.2920684814453125, 0.3085441589355469, 0.32501983642578125, 0.3414955139160156, 0.35797119140625, 0.3744468688964844, 0.39092254638671875, 0.4073982238769531, 0.4238739013671875, 0.4403495788574219, 0.45682525634765625, 0.4733009338378906, 0.489776611328125, 0.5062522888183594, 0.5227279663085938, 0.5392036437988281, 0.5556793212890625, 0.5721549987792969, 0.5886306762695312, 0.6051063537597656, 0.62158203125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 15.0, 42.0, 85.0, 146.0, 198.0, 181.0, 144.0, 86.0, 43.0, 22.0, 11.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14306640625, -0.136627197265625, -0.13018798828125, -0.123748779296875, -0.1173095703125, -0.110870361328125, -0.10443115234375, -0.097991943359375, -0.091552734375, -0.085113525390625, -0.07867431640625, -0.072235107421875, -0.0657958984375, -0.059356689453125, -0.05291748046875, -0.046478271484375, -0.0400390625, -0.033599853515625, -0.02716064453125, -0.020721435546875, -0.0142822265625, -0.007843017578125, -0.00140380859375, 0.005035400390625, 0.011474609375, 0.017913818359375, 0.02435302734375, 0.030792236328125, 0.0372314453125, 0.043670654296875, 0.05010986328125, 0.056549072265625, 0.06298828125, 0.069427490234375, 0.07586669921875, 0.082305908203125, 0.0887451171875, 0.095184326171875, 0.10162353515625, 0.108062744140625, 0.114501953125, 0.120941162109375, 0.12738037109375, 0.133819580078125, 0.1402587890625, 0.146697998046875, 0.15313720703125, 0.159576416015625, 0.166015625, 0.172454833984375, 0.17889404296875, 0.185333251953125, 0.1917724609375, 0.198211669921875, 0.20465087890625, 0.211090087890625, 0.217529296875, 0.223968505859375, 0.23040771484375, 0.236846923828125, 0.2432861328125, 0.249725341796875, 0.25616455078125, 0.262603759765625, 0.26904296875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 15.0, 24.0, 75.0, 199.0, 323.0, 213.0, 76.0, 38.0, 20.0, 11.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9265696406364441, -0.8625232577323914, -0.7984769344329834, -0.7344305515289307, -0.6703841686248779, -0.60633784532547, -0.5422914624214172, -0.4782451093196869, -0.41419875621795654, -0.3501524031162262, -0.28610605001449585, -0.22205966711044312, -0.15801331400871277, -0.09396696090698242, -0.029920578002929688, 0.03412577509880066, 0.098172128200531, 0.16221848130226135, 0.2262648493051529, 0.29031121730804443, 0.3543575704097748, 0.4184039235115051, 0.48245030641555786, 0.5464966297149658, 0.6105430126190186, 0.6745893955230713, 0.7386357188224792, 0.802682101726532, 0.8667284250259399, 0.9307748079299927, 0.9948211908340454, 1.0588675737380981, 1.1229138374328613, 1.186960220336914, 1.2510066032409668, 1.3150529861450195, 1.3790992498397827, 1.4431456327438354, 1.5071920156478882, 1.571238398551941, 1.635284662246704, 1.6993310451507568, 1.7633774280548096, 1.8274238109588623, 1.8914700746536255, 1.9555164575576782, 2.0195627212524414, 2.083609104156494, 2.147655487060547, 2.2117018699645996, 2.2757482528686523, 2.339794635772705, 2.403841018676758, 2.4678874015808105, 2.5319337844848633, 2.595979928970337, 2.6600265502929688, 2.7240729331970215, 2.788119316101074, 2.852165699005127, 2.9162120819091797, 2.9802584648132324, 3.044304847717285, 3.108350992202759, 3.1723973751068115]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 4.0, 9.0, 11.0, 13.0, 20.0, 29.0, 24.0, 42.0, 55.0, 62.0, 67.0, 79.0, 79.0, 72.0, 69.0, 82.0, 66.0, 43.0, 41.0, 32.0, 20.0, 15.0, 18.0, 6.0, 3.0, 12.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9880886673927307, -0.959455668926239, -0.9308226704597473, -0.9021896123886108, -0.8735566139221191, -0.8449236154556274, -0.8162906169891357, -0.787657618522644, -0.7590246200561523, -0.7303916215896606, -0.701758623123169, -0.6731256246566772, -0.6444925665855408, -0.6158595681190491, -0.5872265696525574, -0.5585935711860657, -0.5299605131149292, -0.5013275146484375, -0.4726944863796234, -0.4440614879131317, -0.4154284596443176, -0.3867954611778259, -0.35816246271133423, -0.32952946424484253, -0.30089643597602844, -0.27226343750953674, -0.24363040924072266, -0.21499741077423096, -0.18636439740657806, -0.15773138403892517, -0.12909838557243347, -0.10046537220478058, -0.07183235883712769, -0.04319934919476509, -0.014566339552402496, 0.0140666663646698, 0.04269967973232269, 0.07133269309997559, 0.09996569156646729, 0.12859870493412018, 0.15723171830177307, 0.18586473166942596, 0.21449774503707886, 0.24313074350357056, 0.27176374197006226, 0.30039677023887634, 0.32902976870536804, 0.35766279697418213, 0.38629579544067383, 0.4149287939071655, 0.4435618221759796, 0.4721948206424713, 0.5008278489112854, 0.5294608473777771, 0.5580938458442688, 0.5867268443107605, 0.615359902381897, 0.6439929008483887, 0.6726258993148804, 0.7012588977813721, 0.7298919558525085, 0.7585249543190002, 0.7871579527854919, 0.8157909512519836, 0.8444239497184753]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 4.0, 10.0, 8.0, 10.0, 6.0, 4.0, 7.0, 23.0, 20.0, 26.0, 45.0, 92.0, 219.0, 1120.0, 14313.0, 4141087.0, 34933.0, 1842.0, 284.0, 88.0, 29.0, 26.0, 18.0, 10.0, 14.0, 8.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.0390625, -1.9862518310546875, -1.933441162109375, -1.8806304931640625, -1.82781982421875, -1.7750091552734375, -1.722198486328125, -1.6693878173828125, -1.6165771484375, -1.5637664794921875, -1.510955810546875, -1.4581451416015625, -1.40533447265625, -1.3525238037109375, -1.299713134765625, -1.2469024658203125, -1.194091796875, -1.1412811279296875, -1.088470458984375, -1.0356597900390625, -0.98284912109375, -0.9300384521484375, -0.877227783203125, -0.8244171142578125, -0.7716064453125, -0.7187957763671875, -0.665985107421875, -0.6131744384765625, -0.56036376953125, -0.5075531005859375, -0.454742431640625, -0.4019317626953125, -0.34912109375, -0.2963104248046875, -0.243499755859375, -0.1906890869140625, -0.13787841796875, -0.0850677490234375, -0.032257080078125, 0.0205535888671875, 0.0733642578125, 0.1261749267578125, 0.178985595703125, 0.2317962646484375, 0.28460693359375, 0.3374176025390625, 0.390228271484375, 0.4430389404296875, 0.495849609375, 0.5486602783203125, 0.601470947265625, 0.6542816162109375, 0.70709228515625, 0.7599029541015625, 0.812713623046875, 0.8655242919921875, 0.9183349609375, 0.9711456298828125, 1.023956298828125, 1.0767669677734375, 1.12957763671875, 1.1823883056640625, 1.235198974609375, 1.2880096435546875, 1.3408203125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 6.0, 6.0, 1.0, 2.0, 5.0, 9.0, 16.0, 15.0, 26.0, 22.0, 26.0, 33.0, 43.0, 49.0, 58.0, 69.0, 78.0, 78.0, 79.0, 69.0, 61.0, 50.0, 46.0, 42.0, 31.0, 14.0, 14.0, 14.0, 3.0, 7.0, 8.0, 7.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0], "bins": [-0.0159454345703125, -0.015467166900634766, -0.014988899230957031, -0.014510631561279297, -0.014032363891601562, -0.013554096221923828, -0.013075828552246094, -0.01259756088256836, -0.012119293212890625, -0.01164102554321289, -0.011162757873535156, -0.010684490203857422, -0.010206222534179688, -0.009727954864501953, -0.009249687194824219, -0.008771419525146484, -0.00829315185546875, -0.007814884185791016, -0.007336616516113281, -0.006858348846435547, -0.0063800811767578125, -0.005901813507080078, -0.005423545837402344, -0.004945278167724609, -0.004467010498046875, -0.003988742828369141, -0.0035104751586914062, -0.003032207489013672, -0.0025539398193359375, -0.002075672149658203, -0.0015974044799804688, -0.0011191368103027344, -0.000640869140625, -0.00016260147094726562, 0.00031566619873046875, 0.0007939338684082031, 0.0012722015380859375, 0.0017504692077636719, 0.0022287368774414062, 0.0027070045471191406, 0.003185272216796875, 0.0036635398864746094, 0.004141807556152344, 0.004620075225830078, 0.0050983428955078125, 0.005576610565185547, 0.006054878234863281, 0.006533145904541016, 0.00701141357421875, 0.007489681243896484, 0.007967948913574219, 0.008446216583251953, 0.008924484252929688, 0.009402751922607422, 0.009881019592285156, 0.01035928726196289, 0.010837554931640625, 0.01131582260131836, 0.011794090270996094, 0.012272357940673828, 0.012750625610351562, 0.013228893280029297, 0.013707160949707031, 0.014185428619384766, 0.0146636962890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 16.0, 16.0, 41.0, 74.0, 246.0, 6416.0, 4172546.0, 14466.0, 288.0, 92.0, 36.0, 21.0, 12.0, 4.0, 8.0, 2.0, 1.0, 1.0], "bins": [-3.43359375, -3.3682785034179688, -3.3029632568359375, -3.2376480102539062, -3.172332763671875, -3.1070175170898438, -3.0417022705078125, -2.9763870239257812, -2.91107177734375, -2.8457565307617188, -2.7804412841796875, -2.7151260375976562, -2.649810791015625, -2.5844955444335938, -2.5191802978515625, -2.4538650512695312, -2.3885498046875, -2.3232345581054688, -2.2579193115234375, -2.1926040649414062, -2.127288818359375, -2.0619735717773438, -1.9966583251953125, -1.9313430786132812, -1.86602783203125, -1.8007125854492188, -1.7353973388671875, -1.6700820922851562, -1.604766845703125, -1.5394515991210938, -1.4741363525390625, -1.4088211059570312, -1.343505859375, -1.2781906127929688, -1.2128753662109375, -1.1475601196289062, -1.082244873046875, -1.0169296264648438, -0.9516143798828125, -0.8862991333007812, -0.82098388671875, -0.7556686401367188, -0.6903533935546875, -0.6250381469726562, -0.559722900390625, -0.49440765380859375, -0.4290924072265625, -0.36377716064453125, -0.2984619140625, -0.23314666748046875, -0.1678314208984375, -0.10251617431640625, -0.037200927734375, 0.02811431884765625, 0.0934295654296875, 0.15874481201171875, 0.22406005859375, 0.28937530517578125, 0.3546905517578125, 0.42000579833984375, 0.485321044921875, 0.5506362915039062, 0.6159515380859375, 0.6812667846679688, 0.74658203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 6.0, 7.0, 9.0, 11.0, 26.0, 15.0, 20.0, 42.0, 41.0, 61.0, 88.0, 137.0, 213.0, 375.0, 1110.0, 946.0, 358.0, 194.0, 111.0, 76.0, 51.0, 35.0, 36.0, 15.0, 18.0, 12.0, 7.0, 9.0, 5.0, 9.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.034000396728515625, -0.03278350830078125, -0.031566619873046875, -0.0303497314453125, -0.029132843017578125, -0.02791595458984375, -0.026699066162109375, -0.025482177734375, -0.024265289306640625, -0.02304840087890625, -0.021831512451171875, -0.0206146240234375, -0.019397735595703125, -0.01818084716796875, -0.016963958740234375, -0.0157470703125, -0.014530181884765625, -0.01331329345703125, -0.012096405029296875, -0.0108795166015625, -0.009662628173828125, -0.00844573974609375, -0.007228851318359375, -0.006011962890625, -0.004795074462890625, -0.00357818603515625, -0.002361297607421875, -0.0011444091796875, 7.2479248046875e-05, 0.00128936767578125, 0.002506256103515625, 0.00372314453125, 0.004940032958984375, 0.00615692138671875, 0.007373809814453125, 0.0085906982421875, 0.009807586669921875, 0.01102447509765625, 0.012241363525390625, 0.013458251953125, 0.014675140380859375, 0.01589202880859375, 0.017108917236328125, 0.0183258056640625, 0.019542694091796875, 0.02075958251953125, 0.021976470947265625, 0.023193359375, 0.024410247802734375, 0.02562713623046875, 0.026844024658203125, 0.0280609130859375, 0.029277801513671875, 0.03049468994140625, 0.031711578369140625, 0.032928466796875, 0.034145355224609375, 0.03536224365234375, 0.036579132080078125, 0.0377960205078125, 0.039012908935546875, 0.04022979736328125, 0.041446685791015625, 0.04266357421875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 82.0, 917.0, 14.0, 3.0, 3.0], "bins": [-8.331463813781738, -8.193377494812012, -8.055292129516602, -7.917205810546875, -7.779119968414307, -7.641034126281738, -7.50294828414917, -7.364862442016602, -7.226776123046875, -7.088690280914307, -6.950604438781738, -6.812518119812012, -6.674432277679443, -6.536346435546875, -6.398260593414307, -6.260174751281738, -6.122088432312012, -5.984002590179443, -5.845916748046875, -5.707830429077148, -5.56974458694458, -5.431658744812012, -5.293572902679443, -5.155487060546875, -5.017401218414307, -4.879315376281738, -4.74122953414917, -4.603143215179443, -4.465057373046875, -4.326971530914307, -4.188885688781738, -4.050799369812012, -3.9127135276794434, -3.774627685546875, -3.6365416049957275, -3.498455762863159, -3.3603696823120117, -3.2222838401794434, -3.084197998046875, -2.9461119174957275, -2.80802583694458, -2.6699399948120117, -2.5318539142608643, -2.393768072128296, -2.2556819915771484, -2.11759614944458, -1.9795101881027222, -1.8414242267608643, -1.7033382654190063, -1.5652523040771484, -1.4271663427352905, -1.2890803813934326, -1.1509945392608643, -1.0129084587097168, -0.8748226165771484, -0.7367366552352905, -0.5986506938934326, -0.4605647325515747, -0.3224788010120392, -0.18439286947250366, -0.04630690813064575, 0.09177905321121216, 0.2298649549484253, 0.3679509162902832, 0.5060368776321411]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 0.0, 9.0, 14.0, 26.0, 39.0, 44.0, 78.0, 85.0, 90.0, 101.0, 104.0, 108.0, 76.0, 71.0, 47.0, 27.0, 20.0, 20.0, 13.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.48254889249801636, -0.4720497727394104, -0.46155062317848206, -0.4510515034198761, -0.44055235385894775, -0.4300532341003418, -0.41955408453941345, -0.4090549647808075, -0.39855581521987915, -0.3880566954612732, -0.37755754590034485, -0.3670584261417389, -0.35655927658081055, -0.3460601568222046, -0.33556100726127625, -0.3250618875026703, -0.31456273794174194, -0.304063618183136, -0.29356446862220764, -0.2830653488636017, -0.27256619930267334, -0.2620670795440674, -0.25156792998313904, -0.24106881022453308, -0.23056969046592712, -0.22007055580615997, -0.20957142114639282, -0.19907228648662567, -0.18857315182685852, -0.17807401716709137, -0.16757488250732422, -0.15707576274871826, -0.14657661318778992, -0.13607747852802277, -0.12557834386825562, -0.11507920920848846, -0.10458007454872131, -0.09408093988895416, -0.08358181267976761, -0.07308267802000046, -0.0625835433602333, -0.052084408700466156, -0.041585274040699005, -0.031086143106222153, -0.020587008446455002, -0.010087873786687851, 0.00041125714778900146, 0.010910391807556152, 0.021409526467323303, 0.031908661127090454, 0.042407795786857605, 0.05290692672133446, 0.0634060651063919, 0.07390519976615906, 0.08440432697534561, 0.09490346163511276, 0.10540259629487991, 0.11590173095464706, 0.12640085816383362, 0.13689999282360077, 0.14739912748336792, 0.15789826214313507, 0.16839739680290222, 0.17889653146266937, 0.18939566612243652]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 6.0, 4.0, 7.0, 14.0, 11.0, 16.0, 10.0, 17.0, 22.0, 21.0, 26.0, 36.0, 29.0, 25.0, 33.0, 53.0, 42.0, 320.0, 524931.0, 522216.0, 293.0, 58.0, 47.0, 40.0, 31.0, 31.0, 43.0, 29.0, 26.0, 25.0, 16.0, 16.0, 9.0, 4.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.4755859375, -1.4334259033203125, -1.391265869140625, -1.3491058349609375, -1.30694580078125, -1.2647857666015625, -1.222625732421875, -1.1804656982421875, -1.1383056640625, -1.0961456298828125, -1.053985595703125, -1.0118255615234375, -0.96966552734375, -0.9275054931640625, -0.885345458984375, -0.8431854248046875, -0.801025390625, -0.7588653564453125, -0.716705322265625, -0.6745452880859375, -0.63238525390625, -0.5902252197265625, -0.548065185546875, -0.5059051513671875, -0.4637451171875, -0.4215850830078125, -0.379425048828125, -0.3372650146484375, -0.29510498046875, -0.2529449462890625, -0.210784912109375, -0.1686248779296875, -0.12646484375, -0.0843048095703125, -0.042144775390625, 1.52587890625e-05, 0.04217529296875, 0.0843353271484375, 0.126495361328125, 0.1686553955078125, 0.2108154296875, 0.2529754638671875, 0.295135498046875, 0.3372955322265625, 0.37945556640625, 0.4216156005859375, 0.463775634765625, 0.5059356689453125, 0.548095703125, 0.5902557373046875, 0.632415771484375, 0.6745758056640625, 0.71673583984375, 0.7588958740234375, 0.801055908203125, 0.8432159423828125, 0.8853759765625, 0.9275360107421875, 0.969696044921875, 1.0118560791015625, 1.05401611328125, 1.0961761474609375, 1.138336181640625, 1.1804962158203125, 1.22265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 22.0, 54.0, 69.0, 105.0, 174.0, 181.0, 166.0, 107.0, 80.0, 29.0, 11.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.060167551040649414, -0.05884218215942383, -0.05751681327819824, -0.056191444396972656, -0.05486607551574707, -0.053540706634521484, -0.0522153377532959, -0.05088996887207031, -0.04956459999084473, -0.04823923110961914, -0.046913862228393555, -0.04558849334716797, -0.04426312446594238, -0.0429377555847168, -0.04161238670349121, -0.040287017822265625, -0.03896164894104004, -0.03763628005981445, -0.03631091117858887, -0.03498554229736328, -0.033660173416137695, -0.03233480453491211, -0.031009435653686523, -0.029684066772460938, -0.02835869789123535, -0.027033329010009766, -0.02570796012878418, -0.024382591247558594, -0.023057222366333008, -0.021731853485107422, -0.020406484603881836, -0.01908111572265625, -0.017755746841430664, -0.016430377960205078, -0.015105009078979492, -0.013779640197753906, -0.01245427131652832, -0.011128902435302734, -0.009803533554077148, -0.008478164672851562, -0.0071527957916259766, -0.005827426910400391, -0.004502058029174805, -0.0031766891479492188, -0.0018513202667236328, -0.0005259513854980469, 0.0007994174957275391, 0.002124786376953125, 0.003450155258178711, 0.004775524139404297, 0.006100893020629883, 0.007426261901855469, 0.008751630783081055, 0.01007699966430664, 0.011402368545532227, 0.012727737426757812, 0.014053106307983398, 0.015378475189208984, 0.01670384407043457, 0.018029212951660156, 0.019354581832885742, 0.020679950714111328, 0.022005319595336914, 0.0233306884765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 7.0, 11.0, 13.0, 15.0, 27.0, 28.0, 43.0, 73.0, 83.0, 140.0, 235.0, 373.0, 729.0, 1561.0, 3777.0, 11252.0, 45385.0, 261930.0, 553102.0, 131210.0, 26099.0, 7189.0, 2658.0, 1110.0, 583.0, 303.0, 190.0, 118.0, 80.0, 60.0, 38.0, 28.0, 21.0, 17.0, 12.0, 6.0, 6.0, 7.0, 3.0, 5.0, 1.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.322021484375, -0.3113975524902344, -0.30077362060546875, -0.2901496887207031, -0.2795257568359375, -0.2689018249511719, -0.25827789306640625, -0.24765396118164062, -0.237030029296875, -0.22640609741210938, -0.21578216552734375, -0.20515823364257812, -0.1945343017578125, -0.18391036987304688, -0.17328643798828125, -0.16266250610351562, -0.15203857421875, -0.14141464233398438, -0.13079071044921875, -0.12016677856445312, -0.1095428466796875, -0.09891891479492188, -0.08829498291015625, -0.07767105102539062, -0.067047119140625, -0.056423187255859375, -0.04579925537109375, -0.035175323486328125, -0.0245513916015625, -0.013927459716796875, -0.00330352783203125, 0.007320404052734375, 0.0179443359375, 0.028568267822265625, 0.03919219970703125, 0.049816131591796875, 0.0604400634765625, 0.07106399536132812, 0.08168792724609375, 0.09231185913085938, 0.102935791015625, 0.11355972290039062, 0.12418365478515625, 0.13480758666992188, 0.1454315185546875, 0.15605545043945312, 0.16667938232421875, 0.17730331420898438, 0.18792724609375, 0.19855117797851562, 0.20917510986328125, 0.21979904174804688, 0.2304229736328125, 0.24104690551757812, 0.25167083740234375, 0.2622947692871094, 0.272918701171875, 0.2835426330566406, 0.29416656494140625, 0.3047904968261719, 0.3154144287109375, 0.3260383605957031, 0.33666229248046875, 0.3472862243652344, 0.35791015625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 7.0, 8.0, 12.0, 16.0, 23.0, 16.0, 36.0, 29.0, 29.0, 46.0, 44.0, 48.0, 52.0, 46.0, 39.0, 60.0, 39.0, 43.0, 41.0, 46.0, 33.0, 46.0, 31.0, 32.0, 19.0, 29.0, 29.0, 17.0, 18.0, 8.0, 7.0, 7.0, 2.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0997314453125, -0.09676265716552734, -0.09379386901855469, -0.09082508087158203, -0.08785629272460938, -0.08488750457763672, -0.08191871643066406, -0.0789499282836914, -0.07598114013671875, -0.0730123519897461, -0.07004356384277344, -0.06707477569580078, -0.06410598754882812, -0.06113719940185547, -0.05816841125488281, -0.055199623107910156, -0.0522308349609375, -0.049262046813964844, -0.04629325866699219, -0.04332447052001953, -0.040355682373046875, -0.03738689422607422, -0.03441810607910156, -0.031449317932128906, -0.02848052978515625, -0.025511741638183594, -0.022542953491210938, -0.01957416534423828, -0.016605377197265625, -0.013636589050292969, -0.010667800903320312, -0.007699012756347656, -0.004730224609375, -0.0017614364624023438, 0.0012073516845703125, 0.004176139831542969, 0.007144927978515625, 0.010113716125488281, 0.013082504272460938, 0.016051292419433594, 0.01902008056640625, 0.021988868713378906, 0.024957656860351562, 0.02792644500732422, 0.030895233154296875, 0.03386402130126953, 0.03683280944824219, 0.039801597595214844, 0.0427703857421875, 0.045739173889160156, 0.04870796203613281, 0.05167675018310547, 0.054645538330078125, 0.05761432647705078, 0.06058311462402344, 0.0635519027709961, 0.06652069091796875, 0.0694894790649414, 0.07245826721191406, 0.07542705535888672, 0.07839584350585938, 0.08136463165283203, 0.08433341979980469, 0.08730220794677734, 0.09027099609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 17.0, 24.0, 42.0, 73.0, 116.0, 197.0, 366.0, 772.0, 1905.0, 6375.0, 39463.0, 755856.0, 222416.0, 15137.0, 3339.0, 1192.0, 544.0, 281.0, 154.0, 83.0, 42.0, 35.0, 20.0, 22.0, 10.0, 11.0, 11.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6158676147460938, -0.5964813232421875, -0.5770950317382812, -0.557708740234375, -0.5383224487304688, -0.5189361572265625, -0.49954986572265625, -0.48016357421875, -0.46077728271484375, -0.4413909912109375, -0.42200469970703125, -0.402618408203125, -0.38323211669921875, -0.3638458251953125, -0.34445953369140625, -0.3250732421875, -0.30568695068359375, -0.2863006591796875, -0.26691436767578125, -0.247528076171875, -0.22814178466796875, -0.2087554931640625, -0.18936920166015625, -0.16998291015625, -0.15059661865234375, -0.1312103271484375, -0.11182403564453125, -0.092437744140625, -0.07305145263671875, -0.0536651611328125, -0.03427886962890625, -0.014892578125, 0.00449371337890625, 0.0238800048828125, 0.04326629638671875, 0.062652587890625, 0.08203887939453125, 0.1014251708984375, 0.12081146240234375, 0.14019775390625, 0.15958404541015625, 0.1789703369140625, 0.19835662841796875, 0.217742919921875, 0.23712921142578125, 0.2565155029296875, 0.27590179443359375, 0.2952880859375, 0.31467437744140625, 0.3340606689453125, 0.35344696044921875, 0.372833251953125, 0.39221954345703125, 0.4116058349609375, 0.43099212646484375, 0.45037841796875, 0.46976470947265625, 0.4891510009765625, 0.5085372924804688, 0.527923583984375, 0.5473098754882812, 0.5666961669921875, 0.5860824584960938, 0.60546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 16.0, 11.0, 24.0, 47.0, 62.0, 92.0, 147.0, 142.0, 143.0, 101.0, 54.0, 47.0, 29.0, 17.0, 12.0, 14.0, 6.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.729364395141602e-05, -6.534717977046967e-05, -6.340071558952332e-05, -6.145425140857697e-05, -5.9507787227630615e-05, -5.7561323046684265e-05, -5.5614858865737915e-05, -5.3668394684791565e-05, -5.1721930503845215e-05, -4.9775466322898865e-05, -4.7829002141952515e-05, -4.5882537961006165e-05, -4.3936073780059814e-05, -4.1989609599113464e-05, -4.0043145418167114e-05, -3.8096681237220764e-05, -3.6150217056274414e-05, -3.4203752875328064e-05, -3.2257288694381714e-05, -3.0310824513435364e-05, -2.8364360332489014e-05, -2.6417896151542664e-05, -2.4471431970596313e-05, -2.2524967789649963e-05, -2.0578503608703613e-05, -1.8632039427757263e-05, -1.6685575246810913e-05, -1.4739111065864563e-05, -1.2792646884918213e-05, -1.0846182703971863e-05, -8.899718523025513e-06, -6.953254342079163e-06, -5.0067901611328125e-06, -3.0603259801864624e-06, -1.1138617992401123e-06, 8.326023817062378e-07, 2.779066562652588e-06, 4.725530743598938e-06, 6.671994924545288e-06, 8.618459105491638e-06, 1.0564923286437988e-05, 1.2511387467384338e-05, 1.4457851648330688e-05, 1.640431582927704e-05, 1.835078001022339e-05, 2.029724419116974e-05, 2.224370837211609e-05, 2.419017255306244e-05, 2.613663673400879e-05, 2.808310091495514e-05, 3.002956509590149e-05, 3.197602927684784e-05, 3.392249345779419e-05, 3.586895763874054e-05, 3.781542181968689e-05, 3.976188600063324e-05, 4.170835018157959e-05, 4.365481436252594e-05, 4.560127854347229e-05, 4.754774272441864e-05, 4.949420690536499e-05, 5.144067108631134e-05, 5.338713526725769e-05, 5.533359944820404e-05, 5.728006362915039e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 14.0, 19.0, 30.0, 55.0, 74.0, 126.0, 237.0, 505.0, 1290.0, 4370.0, 22390.0, 767667.0, 233863.0, 13037.0, 3052.0, 929.0, 367.0, 202.0, 104.0, 71.0, 31.0, 41.0, 21.0, 12.0, 12.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8730621337890625, -0.842803955078125, -0.8125457763671875, -0.78228759765625, -0.7520294189453125, -0.721771240234375, -0.6915130615234375, -0.6612548828125, -0.6309967041015625, -0.600738525390625, -0.5704803466796875, -0.54022216796875, -0.5099639892578125, -0.479705810546875, -0.4494476318359375, -0.419189453125, -0.3889312744140625, -0.358673095703125, -0.3284149169921875, -0.29815673828125, -0.2678985595703125, -0.237640380859375, -0.2073822021484375, -0.1771240234375, -0.1468658447265625, -0.116607666015625, -0.0863494873046875, -0.05609130859375, -0.0258331298828125, 0.004425048828125, 0.0346832275390625, 0.06494140625, 0.0951995849609375, 0.125457763671875, 0.1557159423828125, 0.18597412109375, 0.2162322998046875, 0.246490478515625, 0.2767486572265625, 0.3070068359375, 0.3372650146484375, 0.367523193359375, 0.3977813720703125, 0.42803955078125, 0.4582977294921875, 0.488555908203125, 0.5188140869140625, 0.549072265625, 0.5793304443359375, 0.609588623046875, 0.6398468017578125, 0.67010498046875, 0.7003631591796875, 0.730621337890625, 0.7608795166015625, 0.7911376953125, 0.8213958740234375, 0.851654052734375, 0.8819122314453125, 0.91217041015625, 0.9424285888671875, 0.972686767578125, 1.0029449462890625, 1.033203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 9.0, 12.0, 20.0, 43.0, 89.0, 183.0, 226.0, 185.0, 105.0, 46.0, 19.0, 14.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.529296875, -0.5168685913085938, -0.5044403076171875, -0.49201202392578125, -0.479583740234375, -0.46715545654296875, -0.4547271728515625, -0.44229888916015625, -0.42987060546875, -0.41744232177734375, -0.4050140380859375, -0.39258575439453125, -0.380157470703125, -0.36772918701171875, -0.3553009033203125, -0.34287261962890625, -0.3304443359375, -0.31801605224609375, -0.3055877685546875, -0.29315948486328125, -0.280731201171875, -0.26830291748046875, -0.2558746337890625, -0.24344635009765625, -0.23101806640625, -0.21858978271484375, -0.2061614990234375, -0.19373321533203125, -0.181304931640625, -0.16887664794921875, -0.1564483642578125, -0.14402008056640625, -0.131591796875, -0.11916351318359375, -0.1067352294921875, -0.09430694580078125, -0.081878662109375, -0.06945037841796875, -0.0570220947265625, -0.04459381103515625, -0.03216552734375, -0.01973724365234375, -0.0073089599609375, 0.00511932373046875, 0.017547607421875, 0.02997589111328125, 0.0424041748046875, 0.05483245849609375, 0.0672607421875, 0.07968902587890625, 0.0921173095703125, 0.10454559326171875, 0.116973876953125, 0.12940216064453125, 0.1418304443359375, 0.15425872802734375, 0.16668701171875, 0.17911529541015625, 0.1915435791015625, 0.20397186279296875, 0.216400146484375, 0.22882843017578125, 0.2412567138671875, 0.25368499755859375, 0.26611328125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 31.0, 423.0, 492.0, 48.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.483553886413574, -4.139206409454346, -3.794858932495117, -3.4505116939544678, -3.1061642169952393, -2.7618167400360107, -2.4174695014953613, -2.073122024536133, -1.7287745475769043, -1.3844270706176758, -1.0400797128677368, -0.6957323551177979, -0.35138487815856934, -0.00703740119934082, 0.3373098373413086, 0.6816573143005371, 1.0260047912597656, 1.3703522682189941, 1.714699625968933, 2.059046983718872, 2.4033944606781006, 2.747741937637329, 3.0920891761779785, 3.436436653137207, 3.7807841300964355, 4.125131607055664, 4.469479084014893, 4.813826560974121, 5.158173561096191, 5.502521514892578, 5.846868515014648, 6.191215991973877, 6.535564422607422, 6.87991189956665, 7.224259376525879, 7.568606376647949, 7.912954330444336, 8.257301330566406, 8.601648330688477, 8.945996284484863, 9.29034423828125, 9.63469123840332, 9.979039192199707, 10.323386192321777, 10.667734146118164, 11.012081146240234, 11.356428146362305, 11.700776100158691, 12.045123100280762, 12.389470100402832, 12.733818054199219, 13.078165054321289, 13.422513008117676, 13.766860008239746, 14.111207962036133, 14.455554962158203, 14.799901962280273, 15.144248962402344, 15.48859691619873, 15.8329439163208, 16.177291870117188, 16.521638870239258, 16.865985870361328, 17.21033477783203, 17.5546817779541]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 20.0, 32.0, 43.0, 67.0, 87.0, 113.0, 128.0, 98.0, 126.0, 109.0, 57.0, 41.0, 35.0, 16.0, 11.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1933109760284424, -1.135461688041687, -1.077612280845642, -1.0197629928588867, -0.9619137048721313, -0.9040643572807312, -0.846215009689331, -0.7883657217025757, -0.7305164337158203, -0.6726670861244202, -0.6148177981376648, -0.5569684505462646, -0.4991191625595093, -0.44126981496810913, -0.38342049717903137, -0.3255711793899536, -0.26772183179855347, -0.2098725140094757, -0.15202319622039795, -0.094173863530159, -0.03632454574108124, 0.021524786949157715, 0.07937410473823547, 0.13722342252731323, 0.195072740316391, 0.25292205810546875, 0.3107713758945465, 0.36862069368362427, 0.4264700412750244, 0.4843193590641022, 0.5421686768531799, 0.6000180244445801, 0.6578673124313354, 0.7157166600227356, 0.773565948009491, 0.8314152956008911, 0.8892645835876465, 0.9471139311790466, 1.0049632787704468, 1.0628125667572021, 1.1206618547439575, 1.178511142730713, 1.2363605499267578, 1.2942098379135132, 1.3520591259002686, 1.4099085330963135, 1.4677578210830688, 1.5256071090698242, 1.5834565162658691, 1.6413058042526245, 1.6991552114486694, 1.7570044994354248, 1.8148537874221802, 1.8727030754089355, 1.9305524826049805, 1.9884017705917358, 2.046251058578491, 2.104100465774536, 2.161949634552002, 2.219799041748047, 2.277648448944092, 2.3354976177215576, 2.3933470249176025, 2.4511961936950684, 2.5090456008911133]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 14.0, 8.0, 11.0, 16.0, 23.0, 21.0, 41.0, 39.0, 62.0, 73.0, 152.0, 314.0, 1346.0, 2509924.0, 1679724.0, 1730.0, 343.0, 135.0, 75.0, 66.0, 38.0, 31.0, 26.0, 20.0, 12.0, 12.0, 5.0, 2.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.5559539794921875, -3.471282958984375, -3.3866119384765625, -3.30194091796875, -3.2172698974609375, -3.132598876953125, -3.0479278564453125, -2.9632568359375, -2.8785858154296875, -2.793914794921875, -2.7092437744140625, -2.62457275390625, -2.5399017333984375, -2.455230712890625, -2.3705596923828125, -2.285888671875, -2.2012176513671875, -2.116546630859375, -2.0318756103515625, -1.94720458984375, -1.8625335693359375, -1.777862548828125, -1.6931915283203125, -1.6085205078125, -1.5238494873046875, -1.439178466796875, -1.3545074462890625, -1.26983642578125, -1.1851654052734375, -1.100494384765625, -1.0158233642578125, -0.93115234375, -0.8464813232421875, -0.761810302734375, -0.6771392822265625, -0.59246826171875, -0.5077972412109375, -0.423126220703125, -0.3384552001953125, -0.2537841796875, -0.1691131591796875, -0.084442138671875, 0.0002288818359375, 0.08489990234375, 0.1695709228515625, 0.254241943359375, 0.3389129638671875, 0.423583984375, 0.5082550048828125, 0.592926025390625, 0.6775970458984375, 0.76226806640625, 0.8469390869140625, 0.931610107421875, 1.0162811279296875, 1.1009521484375, 1.1856231689453125, 1.270294189453125, 1.3549652099609375, 1.43963623046875, 1.5243072509765625, 1.608978271484375, 1.6936492919921875, 1.7783203125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 15.0, 14.0, 28.0, 31.0, 57.0, 52.0, 63.0, 79.0, 86.0, 106.0, 88.0, 66.0, 82.0, 72.0, 43.0, 32.0, 25.0, 16.0, 9.0, 3.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0404052734375, -0.039382219314575195, -0.03835916519165039, -0.037336111068725586, -0.03631305694580078, -0.03529000282287598, -0.03426694869995117, -0.03324389457702637, -0.03222084045410156, -0.031197786331176758, -0.030174732208251953, -0.02915167808532715, -0.028128623962402344, -0.02710556983947754, -0.026082515716552734, -0.02505946159362793, -0.024036407470703125, -0.02301335334777832, -0.021990299224853516, -0.02096724510192871, -0.019944190979003906, -0.0189211368560791, -0.017898082733154297, -0.016875028610229492, -0.015851974487304688, -0.014828920364379883, -0.013805866241455078, -0.012782812118530273, -0.011759757995605469, -0.010736703872680664, -0.00971364974975586, -0.008690595626831055, -0.00766754150390625, -0.006644487380981445, -0.005621433258056641, -0.004598379135131836, -0.0035753250122070312, -0.0025522708892822266, -0.0015292167663574219, -0.0005061626434326172, 0.0005168914794921875, 0.0015399456024169922, 0.002562999725341797, 0.0035860538482666016, 0.004609107971191406, 0.005632162094116211, 0.006655216217041016, 0.00767827033996582, 0.008701324462890625, 0.00972437858581543, 0.010747432708740234, 0.011770486831665039, 0.012793540954589844, 0.013816595077514648, 0.014839649200439453, 0.015862703323364258, 0.016885757446289062, 0.017908811569213867, 0.018931865692138672, 0.019954919815063477, 0.02097797393798828, 0.022001028060913086, 0.02302408218383789, 0.024047136306762695, 0.0250701904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 5.0, 9.0, 15.0, 9.0, 14.0, 31.0, 29.0, 58.0, 69.0, 106.0, 110.0, 112.0, 188.0, 1013.0, 4175694.0, 15661.0, 426.0, 152.0, 135.0, 139.0, 78.0, 78.0, 46.0, 45.0, 22.0, 19.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-8.078125, -7.83880615234375, -7.5994873046875, -7.36016845703125, -7.120849609375, -6.88153076171875, -6.6422119140625, -6.40289306640625, -6.16357421875, -5.92425537109375, -5.6849365234375, -5.44561767578125, -5.206298828125, -4.96697998046875, -4.7276611328125, -4.48834228515625, -4.2490234375, -4.00970458984375, -3.7703857421875, -3.53106689453125, -3.291748046875, -3.05242919921875, -2.8131103515625, -2.57379150390625, -2.33447265625, -2.09515380859375, -1.8558349609375, -1.61651611328125, -1.377197265625, -1.13787841796875, -0.8985595703125, -0.65924072265625, -0.419921875, -0.18060302734375, 0.0587158203125, 0.29803466796875, 0.537353515625, 0.77667236328125, 1.0159912109375, 1.25531005859375, 1.49462890625, 1.73394775390625, 1.9732666015625, 2.21258544921875, 2.451904296875, 2.69122314453125, 2.9305419921875, 3.16986083984375, 3.4091796875, 3.64849853515625, 3.8878173828125, 4.12713623046875, 4.366455078125, 4.60577392578125, 4.8450927734375, 5.08441162109375, 5.32373046875, 5.56304931640625, 5.8023681640625, 6.04168701171875, 6.281005859375, 6.52032470703125, 6.7596435546875, 6.99896240234375, 7.23828125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 4.0, 15.0, 31.0, 61.0, 114.0, 369.0, 2141.0, 964.0, 213.0, 92.0, 36.0, 18.0, 11.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17652320861816406, -0.16994094848632812, -0.1633586883544922, -0.15677642822265625, -0.1501941680908203, -0.14361190795898438, -0.13702964782714844, -0.1304473876953125, -0.12386512756347656, -0.11728286743164062, -0.11070060729980469, -0.10411834716796875, -0.09753608703613281, -0.09095382690429688, -0.08437156677246094, -0.077789306640625, -0.07120704650878906, -0.06462478637695312, -0.05804252624511719, -0.05146026611328125, -0.04487800598144531, -0.038295745849609375, -0.03171348571777344, -0.0251312255859375, -0.018548965454101562, -0.011966705322265625, -0.0053844451904296875, 0.00119781494140625, 0.0077800750732421875, 0.014362335205078125, 0.020944595336914062, 0.02752685546875, 0.03410911560058594, 0.040691375732421875, 0.04727363586425781, 0.05385589599609375, 0.06043815612792969, 0.06702041625976562, 0.07360267639160156, 0.0801849365234375, 0.08676719665527344, 0.09334945678710938, 0.09993171691894531, 0.10651397705078125, 0.11309623718261719, 0.11967849731445312, 0.12626075744628906, 0.132843017578125, 0.13942527770996094, 0.14600753784179688, 0.1525897979736328, 0.15917205810546875, 0.1657543182373047, 0.17233657836914062, 0.17891883850097656, 0.1855010986328125, 0.19208335876464844, 0.19866561889648438, 0.2052478790283203, 0.21183013916015625, 0.2184123992919922, 0.22499465942382812, 0.23157691955566406, 0.2381591796875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 7.0, 1.0, 10.0, 11.0, 32.0, 88.0, 241.0, 430.0, 111.0, 46.0, 16.0, 7.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1266584396362305, -4.938282012939453, -4.749905586242676, -4.561529159545898, -4.373152732849121, -4.184776306152344, -3.9963996410369873, -3.80802321434021, -3.6196467876434326, -3.4312703609466553, -3.242893934249878, -3.0545172691345215, -2.866140842437744, -2.677764415740967, -2.4893879890441895, -2.301011562347412, -2.1126351356506348, -1.9242587089538574, -1.73588228225708, -1.5475057363510132, -1.3591293096542358, -1.1707528829574585, -0.9823763370513916, -0.7939999103546143, -0.6056234836578369, -0.4172470271587372, -0.22887057065963745, -0.04049408435821533, 0.147882342338562, 0.33625876903533936, 0.5246353149414062, 0.7130117416381836, 0.9013881683349609, 1.0897645950317383, 1.2781410217285156, 1.4665175676345825, 1.6548939943313599, 1.8432704210281372, 2.031646966934204, 2.2200233936309814, 2.408399820327759, 2.596776247024536, 2.7851526737213135, 2.97352933883667, 3.1619057655334473, 3.3502821922302246, 3.538658618927002, 3.7270350456237793, 3.9154114723205566, 4.103787899017334, 4.292164325714111, 4.480540752410889, 4.668917179107666, 4.857293605804443, 5.045670509338379, 5.234046936035156, 5.422423362731934, 5.610799789428711, 5.799176216125488, 5.987552642822266, 6.175929069519043, 6.36430549621582, 6.552681922912598, 6.741058349609375, 6.929434776306152]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 9.0, 6.0, 9.0, 8.0, 27.0, 31.0, 35.0, 67.0, 67.0, 108.0, 74.0, 103.0, 74.0, 91.0, 72.0, 62.0, 44.0, 47.0, 26.0, 23.0, 12.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6516462564468384, -0.6281753182411194, -0.6047043800354004, -0.5812334418296814, -0.5577625036239624, -0.5342915654182434, -0.5108206272125244, -0.48734965920448303, -0.46387872099876404, -0.44040778279304504, -0.41693684458732605, -0.39346587657928467, -0.3699949383735657, -0.3465240001678467, -0.3230530619621277, -0.2995821237564087, -0.2761111855506897, -0.2526402473449707, -0.2291693091392517, -0.20569835603237152, -0.18222741782665253, -0.15875647962093353, -0.13528552651405334, -0.11181458830833435, -0.08834365010261536, -0.06487271189689636, -0.04140176624059677, -0.01793082058429718, 0.005540117621421814, 0.029011055827140808, 0.052482008934020996, 0.07595294713973999, 0.09942394495010376, 0.12289488315582275, 0.14636582136154175, 0.16983677446842194, 0.19330771267414093, 0.21677865087985992, 0.2402496039867401, 0.2637205421924591, 0.2871914803981781, 0.3106624186038971, 0.3341333568096161, 0.35760432481765747, 0.38107526302337646, 0.40454620122909546, 0.42801713943481445, 0.45148807764053345, 0.47495901584625244, 0.49842995405197144, 0.5219008922576904, 0.5453718304634094, 0.5688427686691284, 0.5923137068748474, 0.6157846450805664, 0.6392556428909302, 0.6627265214920044, 0.6861974596977234, 0.7096683979034424, 0.7331393361091614, 0.7566102743148804, 0.7800812125205994, 0.8035521507263184, 0.8270231485366821, 0.8504940867424011]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 8.0, 12.0, 21.0, 20.0, 28.0, 50.0, 72.0, 93.0, 169.0, 349.0, 723.0, 1944.0, 7747.0, 68450.0, 862624.0, 93101.0, 9262.0, 2100.0, 818.0, 356.0, 205.0, 109.0, 84.0, 60.0, 36.0, 20.0, 14.0, 25.0, 10.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.37109375, -2.290863037109375, -2.21063232421875, -2.130401611328125, -2.0501708984375, -1.969940185546875, -1.88970947265625, -1.809478759765625, -1.729248046875, -1.649017333984375, -1.56878662109375, -1.488555908203125, -1.4083251953125, -1.328094482421875, -1.24786376953125, -1.167633056640625, -1.08740234375, -1.007171630859375, -0.92694091796875, -0.846710205078125, -0.7664794921875, -0.686248779296875, -0.60601806640625, -0.525787353515625, -0.445556640625, -0.365325927734375, -0.28509521484375, -0.204864501953125, -0.1246337890625, -0.044403076171875, 0.03582763671875, 0.116058349609375, 0.1962890625, 0.276519775390625, 0.35675048828125, 0.436981201171875, 0.5172119140625, 0.597442626953125, 0.67767333984375, 0.757904052734375, 0.838134765625, 0.918365478515625, 0.99859619140625, 1.078826904296875, 1.1590576171875, 1.239288330078125, 1.31951904296875, 1.399749755859375, 1.47998046875, 1.560211181640625, 1.64044189453125, 1.720672607421875, 1.8009033203125, 1.881134033203125, 1.96136474609375, 2.041595458984375, 2.121826171875, 2.202056884765625, 2.28228759765625, 2.362518310546875, 2.4427490234375, 2.522979736328125, 2.60321044921875, 2.683441162109375, 2.763671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 4.0, 13.0, 12.0, 18.0, 20.0, 35.0, 46.0, 50.0, 67.0, 65.0, 95.0, 85.0, 79.0, 66.0, 79.0, 69.0, 51.0, 35.0, 27.0, 35.0, 10.0, 15.0, 11.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0496826171875, -0.048462629318237305, -0.04724264144897461, -0.046022653579711914, -0.04480266571044922, -0.04358267784118652, -0.04236268997192383, -0.04114270210266113, -0.03992271423339844, -0.03870272636413574, -0.03748273849487305, -0.03626275062561035, -0.035042762756347656, -0.03382277488708496, -0.032602787017822266, -0.03138279914855957, -0.030162811279296875, -0.02894282341003418, -0.027722835540771484, -0.02650284767150879, -0.025282859802246094, -0.0240628719329834, -0.022842884063720703, -0.021622896194458008, -0.020402908325195312, -0.019182920455932617, -0.017962932586669922, -0.016742944717407227, -0.015522956848144531, -0.014302968978881836, -0.01308298110961914, -0.011862993240356445, -0.01064300537109375, -0.009423017501831055, -0.00820302963256836, -0.006983041763305664, -0.005763053894042969, -0.0045430660247802734, -0.003323078155517578, -0.002103090286254883, -0.0008831024169921875, 0.0003368854522705078, 0.0015568733215332031, 0.0027768611907958984, 0.003996849060058594, 0.005216836929321289, 0.006436824798583984, 0.00765681266784668, 0.008876800537109375, 0.01009678840637207, 0.011316776275634766, 0.012536764144897461, 0.013756752014160156, 0.014976739883422852, 0.016196727752685547, 0.017416715621948242, 0.018636703491210938, 0.019856691360473633, 0.021076679229736328, 0.022296667098999023, 0.02351665496826172, 0.024736642837524414, 0.02595663070678711, 0.027176618576049805, 0.0283966064453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 19.0, 13.0, 21.0, 26.0, 33.0, 56.0, 103.0, 131.0, 225.0, 353.0, 696.0, 1355.0, 3382.0, 11059.0, 47556.0, 423201.0, 488064.0, 53521.0, 11940.0, 3666.0, 1443.0, 662.0, 375.0, 240.0, 137.0, 85.0, 64.0, 38.0, 24.0, 26.0, 7.0, 14.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.869140625, -0.838134765625, -0.80712890625, -0.776123046875, -0.7451171875, -0.714111328125, -0.68310546875, -0.652099609375, -0.62109375, -0.590087890625, -0.55908203125, -0.528076171875, -0.4970703125, -0.466064453125, -0.43505859375, -0.404052734375, -0.373046875, -0.342041015625, -0.31103515625, -0.280029296875, -0.2490234375, -0.218017578125, -0.18701171875, -0.156005859375, -0.125, -0.093994140625, -0.06298828125, -0.031982421875, -0.0009765625, 0.030029296875, 0.06103515625, 0.092041015625, 0.123046875, 0.154052734375, 0.18505859375, 0.216064453125, 0.2470703125, 0.278076171875, 0.30908203125, 0.340087890625, 0.37109375, 0.402099609375, 0.43310546875, 0.464111328125, 0.4951171875, 0.526123046875, 0.55712890625, 0.588134765625, 0.619140625, 0.650146484375, 0.68115234375, 0.712158203125, 0.7431640625, 0.774169921875, 0.80517578125, 0.836181640625, 0.8671875, 0.898193359375, 0.92919921875, 0.960205078125, 0.9912109375, 1.022216796875, 1.05322265625, 1.084228515625, 1.115234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 9.0, 14.0, 8.0, 13.0, 16.0, 25.0, 20.0, 26.0, 18.0, 29.0, 36.0, 24.0, 38.0, 39.0, 32.0, 38.0, 50.0, 44.0, 45.0, 45.0, 51.0, 42.0, 36.0, 32.0, 41.0, 25.0, 16.0, 28.0, 22.0, 14.0, 18.0, 21.0, 16.0, 7.0, 7.0, 10.0, 8.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.1612548828125, -0.1566791534423828, -0.15210342407226562, -0.14752769470214844, -0.14295196533203125, -0.13837623596191406, -0.13380050659179688, -0.1292247772216797, -0.1246490478515625, -0.12007331848144531, -0.11549758911132812, -0.11092185974121094, -0.10634613037109375, -0.10177040100097656, -0.09719467163085938, -0.09261894226074219, -0.088043212890625, -0.08346748352050781, -0.07889175415039062, -0.07431602478027344, -0.06974029541015625, -0.06516456604003906, -0.060588836669921875, -0.05601310729980469, -0.0514373779296875, -0.04686164855957031, -0.042285919189453125, -0.03771018981933594, -0.03313446044921875, -0.028558731079101562, -0.023983001708984375, -0.019407272338867188, -0.01483154296875, -0.010255813598632812, -0.005680084228515625, -0.0011043548583984375, 0.00347137451171875, 0.008047103881835938, 0.012622833251953125, 0.017198562622070312, 0.0217742919921875, 0.026350021362304688, 0.030925750732421875, 0.03550148010253906, 0.04007720947265625, 0.04465293884277344, 0.049228668212890625, 0.05380439758300781, 0.058380126953125, 0.06295585632324219, 0.06753158569335938, 0.07210731506347656, 0.07668304443359375, 0.08125877380371094, 0.08583450317382812, 0.09041023254394531, 0.0949859619140625, 0.09956169128417969, 0.10413742065429688, 0.10871315002441406, 0.11328887939453125, 0.11786460876464844, 0.12244033813476562, 0.1270160675048828, 0.131591796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 5.0, 13.0, 19.0, 26.0, 38.0, 57.0, 91.0, 207.0, 354.0, 758.0, 2105.0, 9938.0, 183246.0, 822921.0, 22922.0, 3619.0, 1149.0, 450.0, 246.0, 141.0, 79.0, 43.0, 35.0, 18.0, 17.0, 14.0, 12.0, 8.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1868896484375, -1.146240234375, -1.1055908203125, -1.06494140625, -1.0242919921875, -0.983642578125, -0.9429931640625, -0.90234375, -0.8616943359375, -0.821044921875, -0.7803955078125, -0.73974609375, -0.6990966796875, -0.658447265625, -0.6177978515625, -0.5771484375, -0.5364990234375, -0.495849609375, -0.4552001953125, -0.41455078125, -0.3739013671875, -0.333251953125, -0.2926025390625, -0.251953125, -0.2113037109375, -0.170654296875, -0.1300048828125, -0.08935546875, -0.0487060546875, -0.008056640625, 0.0325927734375, 0.0732421875, 0.1138916015625, 0.154541015625, 0.1951904296875, 0.23583984375, 0.2764892578125, 0.317138671875, 0.3577880859375, 0.3984375, 0.4390869140625, 0.479736328125, 0.5203857421875, 0.56103515625, 0.6016845703125, 0.642333984375, 0.6829833984375, 0.7236328125, 0.7642822265625, 0.804931640625, 0.8455810546875, 0.88623046875, 0.9268798828125, 0.967529296875, 1.0081787109375, 1.048828125, 1.0894775390625, 1.130126953125, 1.1707763671875, 1.21142578125, 1.2520751953125, 1.292724609375, 1.3333740234375, 1.3740234375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 13.0, 23.0, 29.0, 66.0, 120.0, 218.0, 225.0, 139.0, 79.0, 40.0, 24.0, 14.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001766681671142578, -0.000171637162566185, -0.00016660615801811218, -0.00016157515347003937, -0.00015654414892196655, -0.00015151314437389374, -0.00014648213982582092, -0.0001414511352777481, -0.0001364201307296753, -0.00013138912618160248, -0.00012635812163352966, -0.00012132711708545685, -0.00011629611253738403, -0.00011126510798931122, -0.0001062341034412384, -0.00010120309889316559, -9.617209434509277e-05, -9.114108979701996e-05, -8.611008524894714e-05, -8.107908070087433e-05, -7.604807615280151e-05, -7.10170716047287e-05, -6.598606705665588e-05, -6.095506250858307e-05, -5.5924057960510254e-05, -5.089305341243744e-05, -4.5862048864364624e-05, -4.083104431629181e-05, -3.5800039768218994e-05, -3.076903522014618e-05, -2.5738030672073364e-05, -2.070702612400055e-05, -1.5676021575927734e-05, -1.064501702785492e-05, -5.6140124797821045e-06, -5.830079317092896e-07, 4.447996616363525e-06, 9.47900116443634e-06, 1.4510005712509155e-05, 1.954101026058197e-05, 2.4572014808654785e-05, 2.96030193567276e-05, 3.4634023904800415e-05, 3.966502845287323e-05, 4.4696033000946045e-05, 4.972703754901886e-05, 5.4758042097091675e-05, 5.978904664516449e-05, 6.48200511932373e-05, 6.985105574131012e-05, 7.488206028938293e-05, 7.991306483745575e-05, 8.494406938552856e-05, 8.997507393360138e-05, 9.50060784816742e-05, 0.00010003708302974701, 0.00010506808757781982, 0.00011009909212589264, 0.00011513009667396545, 0.00012016110122203827, 0.00012519210577011108, 0.0001302231103181839, 0.00013525411486625671, 0.00014028511941432953, 0.00014531612396240234]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 5.0, 12.0, 14.0, 16.0, 24.0, 20.0, 40.0, 54.0, 77.0, 115.0, 179.0, 371.0, 717.0, 1518.0, 3562.0, 11073.0, 55042.0, 680097.0, 258017.0, 25941.0, 6642.0, 2518.0, 1117.0, 548.0, 290.0, 187.0, 99.0, 52.0, 59.0, 33.0, 23.0, 13.0, 11.0, 13.0, 11.0, 5.0, 2.0, 10.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.7548828125, -0.7318649291992188, -0.7088470458984375, -0.6858291625976562, -0.662811279296875, -0.6397933959960938, -0.6167755126953125, -0.5937576293945312, -0.57073974609375, -0.5477218627929688, -0.5247039794921875, -0.5016860961914062, -0.478668212890625, -0.45565032958984375, -0.4326324462890625, -0.40961456298828125, -0.3865966796875, -0.36357879638671875, -0.3405609130859375, -0.31754302978515625, -0.294525146484375, -0.27150726318359375, -0.2484893798828125, -0.22547149658203125, -0.20245361328125, -0.17943572998046875, -0.1564178466796875, -0.13339996337890625, -0.110382080078125, -0.08736419677734375, -0.0643463134765625, -0.04132843017578125, -0.018310546875, 0.00470733642578125, 0.0277252197265625, 0.05074310302734375, 0.073760986328125, 0.09677886962890625, 0.1197967529296875, 0.14281463623046875, 0.16583251953125, 0.18885040283203125, 0.2118682861328125, 0.23488616943359375, 0.257904052734375, 0.28092193603515625, 0.3039398193359375, 0.32695770263671875, 0.3499755859375, 0.37299346923828125, 0.3960113525390625, 0.41902923583984375, 0.442047119140625, 0.46506500244140625, 0.4880828857421875, 0.5111007690429688, 0.53411865234375, 0.5571365356445312, 0.5801544189453125, 0.6031723022460938, 0.626190185546875, 0.6492080688476562, 0.6722259521484375, 0.6952438354492188, 0.71826171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 8.0, 11.0, 18.0, 21.0, 36.0, 57.0, 52.0, 79.0, 110.0, 115.0, 125.0, 98.0, 57.0, 59.0, 38.0, 28.0, 12.0, 16.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.361083984375, -0.3506660461425781, -0.34024810791015625, -0.3298301696777344, -0.3194122314453125, -0.3089942932128906, -0.29857635498046875, -0.2881584167480469, -0.277740478515625, -0.2673225402832031, -0.25690460205078125, -0.24648666381835938, -0.2360687255859375, -0.22565078735351562, -0.21523284912109375, -0.20481491088867188, -0.19439697265625, -0.18397903442382812, -0.17356109619140625, -0.16314315795898438, -0.1527252197265625, -0.14230728149414062, -0.13188934326171875, -0.12147140502929688, -0.111053466796875, -0.10063552856445312, -0.09021759033203125, -0.07979965209960938, -0.0693817138671875, -0.058963775634765625, -0.04854583740234375, -0.038127899169921875, -0.0277099609375, -0.017292022705078125, -0.00687408447265625, 0.003543853759765625, 0.0139617919921875, 0.024379730224609375, 0.03479766845703125, 0.045215606689453125, 0.055633544921875, 0.06605148315429688, 0.07646942138671875, 0.08688735961914062, 0.0973052978515625, 0.10772323608398438, 0.11814117431640625, 0.12855911254882812, 0.13897705078125, 0.14939498901367188, 0.15981292724609375, 0.17023086547851562, 0.1806488037109375, 0.19106674194335938, 0.20148468017578125, 0.21190261840820312, 0.222320556640625, 0.23273849487304688, 0.24315643310546875, 0.2535743713378906, 0.2639923095703125, 0.2744102478027344, 0.28482818603515625, 0.2952461242675781, 0.3056640625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 10.0, 25.0, 51.0, 136.0, 201.0, 257.0, 165.0, 85.0, 35.0, 10.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.294405460357666, -6.098361968994141, -5.902318477630615, -5.706274509429932, -5.510231018066406, -5.314187526702881, -5.1181440353393555, -4.922100067138672, -4.7260565757751465, -4.530013084411621, -4.333969593048096, -4.137925624847412, -3.9418821334838867, -3.7458386421203613, -3.549795150756836, -3.3537514209747314, -3.157707929611206, -2.9616644382476807, -2.765620708465576, -2.569577217102051, -2.3735334873199463, -2.177489995956421, -1.981446385383606, -1.785402774810791, -1.589359164237976, -1.3933155536651611, -1.1972719430923462, -1.0012283325195312, -0.8051847815513611, -0.6091411709785461, -0.413097620010376, -0.21705400943756104, -0.021010398864746094, 0.17503319680690765, 0.3710767924785614, 0.567120373249054, 0.7631639838218689, 0.9592075943946838, 1.155251145362854, 1.351294755935669, 1.5473383665084839, 1.7433819770812988, 1.9394255876541138, 2.1354691982269287, 2.331512689590454, 2.5275564193725586, 2.723599910736084, 2.9196434020996094, 3.115687131881714, 3.3117306232452393, 3.5077743530273438, 3.703817844390869, 3.8998615741729736, 4.095905303955078, 4.2919487953186035, 4.487992286682129, 4.684035778045654, 4.88007926940918, 5.076122760772705, 5.272166728973389, 5.468210220336914, 5.6642537117004395, 5.860297203063965, 6.056341171264648, 6.252384662628174]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 5.0, 5.0, 11.0, 19.0, 14.0, 26.0, 34.0, 38.0, 40.0, 46.0, 44.0, 44.0, 61.0, 51.0, 70.0, 48.0, 66.0, 61.0, 48.0, 47.0, 38.0, 40.0, 28.0, 29.0, 11.0, 18.0, 10.0, 9.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0267624855041504, -1.972910761833191, -1.919059157371521, -1.8652074337005615, -1.811355710029602, -1.7575039863586426, -1.7036523818969727, -1.6498006582260132, -1.5959489345550537, -1.5420972108840942, -1.4882456064224243, -1.4343938827514648, -1.3805421590805054, -1.326690435409546, -1.272838830947876, -1.2189871072769165, -1.165135383605957, -1.1112836599349976, -1.0574320554733276, -1.0035803318023682, -0.9497286081314087, -0.895876944065094, -0.8420252799987793, -0.7881735563278198, -0.7343219518661499, -0.6804702877998352, -0.6266185641288757, -0.572766900062561, -0.5189151763916016, -0.46506351232528687, -0.4112118184566498, -0.3573601245880127, -0.3035084009170532, -0.24965670704841614, -0.19580501317977905, -0.14195333421230316, -0.08810164034366608, -0.034249961376190186, 0.0196017324924469, 0.07345342636108398, 0.12730512022972107, 0.18115681409835815, 0.23500850796699524, 0.2888602018356323, 0.342711865901947, 0.3965635597705841, 0.4504152536392212, 0.5042669773101807, 0.5581186413764954, 0.6119703054428101, 0.6658220291137695, 0.7196736931800842, 0.7735254168510437, 0.8273770809173584, 0.8812288045883179, 0.9350804686546326, 0.9889321327209473, 1.0427838563919067, 1.0966354608535767, 1.1504871845245361, 1.2043389081954956, 1.258190631866455, 1.312042236328125, 1.3658939599990845, 1.419745683670044]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 6.0, 3.0, 5.0, 7.0, 6.0, 13.0, 9.0, 14.0, 16.0, 15.0, 24.0, 29.0, 49.0, 58.0, 116.0, 193.0, 288.0, 604.0, 1438.0, 5103.0, 26938.0, 477181.0, 3623094.0, 47116.0, 8260.0, 2104.0, 723.0, 357.0, 195.0, 112.0, 60.0, 43.0, 22.0, 18.0, 13.0, 9.0, 11.0, 10.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.981292724609375, -1.91766357421875, -1.854034423828125, -1.7904052734375, -1.726776123046875, -1.66314697265625, -1.599517822265625, -1.535888671875, -1.472259521484375, -1.40863037109375, -1.345001220703125, -1.2813720703125, -1.217742919921875, -1.15411376953125, -1.090484619140625, -1.02685546875, -0.963226318359375, -0.89959716796875, -0.835968017578125, -0.7723388671875, -0.708709716796875, -0.64508056640625, -0.581451416015625, -0.517822265625, -0.454193115234375, -0.39056396484375, -0.326934814453125, -0.2633056640625, -0.199676513671875, -0.13604736328125, -0.072418212890625, -0.0087890625, 0.054840087890625, 0.11846923828125, 0.182098388671875, 0.2457275390625, 0.309356689453125, 0.37298583984375, 0.436614990234375, 0.500244140625, 0.563873291015625, 0.62750244140625, 0.691131591796875, 0.7547607421875, 0.818389892578125, 0.88201904296875, 0.945648193359375, 1.00927734375, 1.072906494140625, 1.13653564453125, 1.200164794921875, 1.2637939453125, 1.327423095703125, 1.39105224609375, 1.454681396484375, 1.518310546875, 1.581939697265625, 1.64556884765625, 1.709197998046875, 1.7728271484375, 1.836456298828125, 1.90008544921875, 1.963714599609375, 2.02734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 9.0, 15.0, 19.0, 21.0, 27.0, 30.0, 37.0, 40.0, 43.0, 62.0, 68.0, 67.0, 90.0, 70.0, 61.0, 60.0, 44.0, 53.0, 37.0, 31.0, 27.0, 20.0, 19.0, 9.0, 9.0, 2.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.057281494140625, -0.05589771270751953, -0.05451393127441406, -0.053130149841308594, -0.051746368408203125, -0.050362586975097656, -0.04897880554199219, -0.04759502410888672, -0.04621124267578125, -0.04482746124267578, -0.04344367980957031, -0.042059898376464844, -0.040676116943359375, -0.039292335510253906, -0.03790855407714844, -0.03652477264404297, -0.0351409912109375, -0.03375720977783203, -0.03237342834472656, -0.030989646911621094, -0.029605865478515625, -0.028222084045410156, -0.026838302612304688, -0.02545452117919922, -0.02407073974609375, -0.02268695831298828, -0.021303176879882812, -0.019919395446777344, -0.018535614013671875, -0.017151832580566406, -0.015768051147460938, -0.014384269714355469, -0.01300048828125, -0.011616706848144531, -0.010232925415039062, -0.008849143981933594, -0.007465362548828125, -0.006081581115722656, -0.0046977996826171875, -0.0033140182495117188, -0.00193023681640625, -0.0005464553833007812, 0.0008373260498046875, 0.0022211074829101562, 0.003604888916015625, 0.004988670349121094, 0.0063724517822265625, 0.007756233215332031, 0.0091400146484375, 0.010523796081542969, 0.011907577514648438, 0.013291358947753906, 0.014675140380859375, 0.016058921813964844, 0.017442703247070312, 0.01882648468017578, 0.02021026611328125, 0.02159404754638672, 0.022977828979492188, 0.024361610412597656, 0.025745391845703125, 0.027129173278808594, 0.028512954711914062, 0.02989673614501953, 0.031280517578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 8.0, 17.0, 15.0, 40.0, 58.0, 125.0, 252.0, 641.0, 2270.0, 159447.0, 4025877.0, 4166.0, 790.0, 262.0, 119.0, 69.0, 54.0, 29.0, 18.0, 9.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3446044921875, -6.126708984375, -5.9088134765625, -5.69091796875, -5.4730224609375, -5.255126953125, -5.0372314453125, -4.8193359375, -4.6014404296875, -4.383544921875, -4.1656494140625, -3.94775390625, -3.7298583984375, -3.511962890625, -3.2940673828125, -3.076171875, -2.8582763671875, -2.640380859375, -2.4224853515625, -2.20458984375, -1.9866943359375, -1.768798828125, -1.5509033203125, -1.3330078125, -1.1151123046875, -0.897216796875, -0.6793212890625, -0.46142578125, -0.2435302734375, -0.025634765625, 0.1922607421875, 0.41015625, 0.6280517578125, 0.845947265625, 1.0638427734375, 1.28173828125, 1.4996337890625, 1.717529296875, 1.9354248046875, 2.1533203125, 2.3712158203125, 2.589111328125, 2.8070068359375, 3.02490234375, 3.2427978515625, 3.460693359375, 3.6785888671875, 3.896484375, 4.1143798828125, 4.332275390625, 4.5501708984375, 4.76806640625, 4.9859619140625, 5.203857421875, 5.4217529296875, 5.6396484375, 5.8575439453125, 6.075439453125, 6.2933349609375, 6.51123046875, 6.7291259765625, 6.947021484375, 7.1649169921875, 7.3828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 13.0, 29.0, 46.0, 104.0, 395.0, 2576.0, 603.0, 168.0, 59.0, 30.0, 14.0, 12.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.64501953125, -0.6302337646484375, -0.615447998046875, -0.6006622314453125, -0.58587646484375, -0.5710906982421875, -0.556304931640625, -0.5415191650390625, -0.5267333984375, -0.5119476318359375, -0.497161865234375, -0.4823760986328125, -0.46759033203125, -0.4528045654296875, -0.438018798828125, -0.4232330322265625, -0.408447265625, -0.3936614990234375, -0.378875732421875, -0.3640899658203125, -0.34930419921875, -0.3345184326171875, -0.319732666015625, -0.3049468994140625, -0.2901611328125, -0.2753753662109375, -0.260589599609375, -0.2458038330078125, -0.23101806640625, -0.2162322998046875, -0.201446533203125, -0.1866607666015625, -0.171875, -0.1570892333984375, -0.142303466796875, -0.1275177001953125, -0.11273193359375, -0.0979461669921875, -0.083160400390625, -0.0683746337890625, -0.0535888671875, -0.0388031005859375, -0.024017333984375, -0.0092315673828125, 0.00555419921875, 0.0203399658203125, 0.035125732421875, 0.0499114990234375, 0.064697265625, 0.0794830322265625, 0.094268798828125, 0.1090545654296875, 0.12384033203125, 0.1386260986328125, 0.153411865234375, 0.1681976318359375, 0.1829833984375, 0.1977691650390625, 0.212554931640625, 0.2273406982421875, 0.24212646484375, 0.2569122314453125, 0.271697998046875, 0.2864837646484375, 0.30126953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 10.0, 21.0, 29.0, 51.0, 91.0, 175.0, 233.0, 172.0, 95.0, 44.0, 20.0, 20.0, 8.0, 6.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8442435264587402, -2.7480037212371826, -2.651763916015625, -2.5555241107940674, -2.4592843055725098, -2.363044500350952, -2.2668046951293945, -2.170564889907837, -2.0743250846862793, -1.9780852794647217, -1.881845474243164, -1.7856056690216064, -1.6893658638000488, -1.5931260585784912, -1.4968862533569336, -1.400646448135376, -1.3044066429138184, -1.2081668376922607, -1.1119270324707031, -1.0156872272491455, -0.9194474220275879, -0.8232076168060303, -0.7269678115844727, -0.630728006362915, -0.5344882011413574, -0.4382483959197998, -0.3420085906982422, -0.24576878547668457, -0.14952898025512695, -0.053289175033569336, 0.04295063018798828, 0.1391904354095459, 0.23543024063110352, 0.33167004585266113, 0.42790985107421875, 0.5241496562957764, 0.620389461517334, 0.7166292667388916, 0.8128690719604492, 0.9091088771820068, 1.0053486824035645, 1.101588487625122, 1.1978282928466797, 1.2940680980682373, 1.390307903289795, 1.4865477085113525, 1.5827875137329102, 1.6790273189544678, 1.7752671241760254, 1.871506929397583, 1.9677467346191406, 2.0639865398406982, 2.160226345062256, 2.2564661502838135, 2.352705955505371, 2.4489457607269287, 2.5451855659484863, 2.641425371170044, 2.7376651763916016, 2.833904981613159, 2.930144786834717, 3.0263845920562744, 3.122624397277832, 3.2188642024993896, 3.3151040077209473]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 9.0, 11.0, 15.0, 13.0, 34.0, 33.0, 51.0, 58.0, 67.0, 101.0, 93.0, 98.0, 72.0, 79.0, 68.0, 44.0, 48.0, 34.0, 26.0, 18.0, 9.0, 6.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.323563575744629, -1.2810187339782715, -1.2384737730026245, -1.1959288120269775, -1.1533839702606201, -1.1108391284942627, -1.0682941675186157, -1.0257492065429688, -0.9832043647766113, -0.9406594634056091, -0.8981145620346069, -0.8555696606636047, -0.8130247592926025, -0.7704798579216003, -0.7279349565505981, -0.685390055179596, -0.6428451538085938, -0.6003002524375916, -0.5577553510665894, -0.5152104496955872, -0.47266554832458496, -0.43012064695358276, -0.38757574558258057, -0.34503084421157837, -0.30248594284057617, -0.259941041469574, -0.21739614009857178, -0.17485123872756958, -0.13230633735656738, -0.08976143598556519, -0.04721653461456299, -0.004671633243560791, 0.037873148918151855, 0.08041805028915405, 0.12296295166015625, 0.16550785303115845, 0.20805275440216064, 0.25059765577316284, 0.29314255714416504, 0.33568745851516724, 0.37823235988616943, 0.42077726125717163, 0.46332216262817383, 0.505867063999176, 0.5484119653701782, 0.5909568667411804, 0.6335017681121826, 0.6760466694831848, 0.718591570854187, 0.7611364722251892, 0.8036813735961914, 0.8462262749671936, 0.8887711763381958, 0.931316077709198, 0.9738609790802002, 1.0164058208465576, 1.0589507818222046, 1.1014957427978516, 1.144040584564209, 1.1865854263305664, 1.2291303873062134, 1.2716753482818604, 1.3142201900482178, 1.3567650318145752, 1.3993099927902222]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 6.0, 13.0, 11.0, 21.0, 23.0, 38.0, 38.0, 60.0, 93.0, 108.0, 160.0, 238.0, 344.0, 741.0, 1722.0, 5014.0, 21411.0, 139342.0, 723542.0, 127380.0, 19826.0, 4858.0, 1661.0, 735.0, 423.0, 255.0, 154.0, 110.0, 63.0, 48.0, 30.0, 22.0, 21.0, 12.0, 5.0, 7.0, 2.0, 2.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.859375, -1.798370361328125, -1.73736572265625, -1.676361083984375, -1.6153564453125, -1.554351806640625, -1.49334716796875, -1.432342529296875, -1.371337890625, -1.310333251953125, -1.24932861328125, -1.188323974609375, -1.1273193359375, -1.066314697265625, -1.00531005859375, -0.944305419921875, -0.88330078125, -0.822296142578125, -0.76129150390625, -0.700286865234375, -0.6392822265625, -0.578277587890625, -0.51727294921875, -0.456268310546875, -0.395263671875, -0.334259033203125, -0.27325439453125, -0.212249755859375, -0.1512451171875, -0.090240478515625, -0.02923583984375, 0.031768798828125, 0.0927734375, 0.153778076171875, 0.21478271484375, 0.275787353515625, 0.3367919921875, 0.397796630859375, 0.45880126953125, 0.519805908203125, 0.580810546875, 0.641815185546875, 0.70281982421875, 0.763824462890625, 0.8248291015625, 0.885833740234375, 0.94683837890625, 1.007843017578125, 1.06884765625, 1.129852294921875, 1.19085693359375, 1.251861572265625, 1.3128662109375, 1.373870849609375, 1.43487548828125, 1.495880126953125, 1.556884765625, 1.617889404296875, 1.67889404296875, 1.739898681640625, 1.8009033203125, 1.861907958984375, 1.92291259765625, 1.983917236328125, 2.044921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 15.0, 7.0, 10.0, 17.0, 18.0, 28.0, 26.0, 36.0, 60.0, 60.0, 73.0, 85.0, 89.0, 80.0, 80.0, 72.0, 55.0, 47.0, 45.0, 24.0, 19.0, 13.0, 14.0, 5.0, 10.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07904052734375, -0.0765371322631836, -0.07403373718261719, -0.07153034210205078, -0.06902694702148438, -0.06652355194091797, -0.06402015686035156, -0.061516761779785156, -0.05901336669921875, -0.056509971618652344, -0.05400657653808594, -0.05150318145751953, -0.048999786376953125, -0.04649639129638672, -0.04399299621582031, -0.041489601135253906, -0.0389862060546875, -0.036482810974121094, -0.03397941589355469, -0.03147602081298828, -0.028972625732421875, -0.02646923065185547, -0.023965835571289062, -0.021462440490722656, -0.01895904541015625, -0.016455650329589844, -0.013952255249023438, -0.011448860168457031, -0.008945465087890625, -0.006442070007324219, -0.0039386749267578125, -0.0014352798461914062, 0.001068115234375, 0.0035715103149414062, 0.0060749053955078125, 0.008578300476074219, 0.011081695556640625, 0.013585090637207031, 0.016088485717773438, 0.018591880798339844, 0.02109527587890625, 0.023598670959472656, 0.026102066040039062, 0.02860546112060547, 0.031108856201171875, 0.03361225128173828, 0.03611564636230469, 0.038619041442871094, 0.0411224365234375, 0.043625831604003906, 0.04612922668457031, 0.04863262176513672, 0.051136016845703125, 0.05363941192626953, 0.05614280700683594, 0.058646202087402344, 0.06114959716796875, 0.06365299224853516, 0.06615638732910156, 0.06865978240966797, 0.07116317749023438, 0.07366657257080078, 0.07616996765136719, 0.0786733627319336, 0.0811767578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 9.0, 10.0, 8.0, 16.0, 24.0, 30.0, 51.0, 54.0, 72.0, 111.0, 148.0, 266.0, 401.0, 645.0, 1199.0, 2417.0, 5273.0, 13206.0, 42803.0, 198217.0, 556766.0, 167223.0, 37734.0, 11907.0, 4816.0, 2206.0, 1135.0, 641.0, 360.0, 218.0, 165.0, 111.0, 72.0, 53.0, 42.0, 31.0, 25.0, 17.0, 16.0, 9.0, 8.0, 8.0, 4.0, 6.0, 6.0, 4.0, 6.0, 2.0, 1.0], "bins": [-1.0361328125, -1.0069046020507812, -0.9776763916015625, -0.9484481811523438, -0.919219970703125, -0.8899917602539062, -0.8607635498046875, -0.8315353393554688, -0.80230712890625, -0.7730789184570312, -0.7438507080078125, -0.7146224975585938, -0.685394287109375, -0.6561660766601562, -0.6269378662109375, -0.5977096557617188, -0.5684814453125, -0.5392532348632812, -0.5100250244140625, -0.48079681396484375, -0.451568603515625, -0.42234039306640625, -0.3931121826171875, -0.36388397216796875, -0.33465576171875, -0.30542755126953125, -0.2761993408203125, -0.24697113037109375, -0.217742919921875, -0.18851470947265625, -0.1592864990234375, -0.13005828857421875, -0.100830078125, -0.07160186767578125, -0.0423736572265625, -0.01314544677734375, 0.016082763671875, 0.04531097412109375, 0.0745391845703125, 0.10376739501953125, 0.13299560546875, 0.16222381591796875, 0.1914520263671875, 0.22068023681640625, 0.249908447265625, 0.27913665771484375, 0.3083648681640625, 0.33759307861328125, 0.3668212890625, 0.39604949951171875, 0.4252777099609375, 0.45450592041015625, 0.483734130859375, 0.5129623413085938, 0.5421905517578125, 0.5714187622070312, 0.60064697265625, 0.6298751831054688, 0.6591033935546875, 0.6883316040039062, 0.717559814453125, 0.7467880249023438, 0.7760162353515625, 0.8052444458007812, 0.83447265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 4.0, 9.0, 6.0, 13.0, 13.0, 24.0, 22.0, 31.0, 28.0, 39.0, 37.0, 51.0, 59.0, 66.0, 46.0, 59.0, 61.0, 62.0, 61.0, 49.0, 37.0, 33.0, 36.0, 28.0, 22.0, 22.0, 9.0, 12.0, 18.0, 9.0, 4.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27001953125, -0.25943756103515625, -0.2488555908203125, -0.23827362060546875, -0.227691650390625, -0.21710968017578125, -0.2065277099609375, -0.19594573974609375, -0.18536376953125, -0.17478179931640625, -0.1641998291015625, -0.15361785888671875, -0.143035888671875, -0.13245391845703125, -0.1218719482421875, -0.11128997802734375, -0.1007080078125, -0.09012603759765625, -0.0795440673828125, -0.06896209716796875, -0.058380126953125, -0.04779815673828125, -0.0372161865234375, -0.02663421630859375, -0.01605224609375, -0.00547027587890625, 0.0051116943359375, 0.01569366455078125, 0.026275634765625, 0.03685760498046875, 0.0474395751953125, 0.05802154541015625, 0.068603515625, 0.07918548583984375, 0.0897674560546875, 0.10034942626953125, 0.110931396484375, 0.12151336669921875, 0.1320953369140625, 0.14267730712890625, 0.15325927734375, 0.16384124755859375, 0.1744232177734375, 0.18500518798828125, 0.195587158203125, 0.20616912841796875, 0.2167510986328125, 0.22733306884765625, 0.2379150390625, 0.24849700927734375, 0.2590789794921875, 0.26966094970703125, 0.280242919921875, 0.29082489013671875, 0.3014068603515625, 0.31198883056640625, 0.32257080078125, 0.33315277099609375, 0.3437347412109375, 0.35431671142578125, 0.364898681640625, 0.37548065185546875, 0.3860626220703125, 0.39664459228515625, 0.4072265625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 0.0, 5.0, 4.0, 5.0, 6.0, 7.0, 12.0, 9.0, 10.0, 13.0, 19.0, 27.0, 35.0, 44.0, 75.0, 133.0, 269.0, 511.0, 1061.0, 2334.0, 5621.0, 21086.0, 343644.0, 630201.0, 31059.0, 7006.0, 2754.0, 1246.0, 600.0, 289.0, 165.0, 87.0, 48.0, 33.0, 28.0, 23.0, 14.0, 17.0, 8.0, 12.0, 10.0, 2.0, 5.0, 7.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8917617797851562, -0.8621368408203125, -0.8325119018554688, -0.802886962890625, -0.7732620239257812, -0.7436370849609375, -0.7140121459960938, -0.68438720703125, -0.6547622680664062, -0.6251373291015625, -0.5955123901367188, -0.565887451171875, -0.5362625122070312, -0.5066375732421875, -0.47701263427734375, -0.4473876953125, -0.41776275634765625, -0.3881378173828125, -0.35851287841796875, -0.328887939453125, -0.29926300048828125, -0.2696380615234375, -0.24001312255859375, -0.21038818359375, -0.18076324462890625, -0.1511383056640625, -0.12151336669921875, -0.091888427734375, -0.06226348876953125, -0.0326385498046875, -0.00301361083984375, 0.026611328125, 0.05623626708984375, 0.0858612060546875, 0.11548614501953125, 0.145111083984375, 0.17473602294921875, 0.2043609619140625, 0.23398590087890625, 0.26361083984375, 0.29323577880859375, 0.3228607177734375, 0.35248565673828125, 0.382110595703125, 0.41173553466796875, 0.4413604736328125, 0.47098541259765625, 0.5006103515625, 0.5302352905273438, 0.5598602294921875, 0.5894851684570312, 0.619110107421875, 0.6487350463867188, 0.6783599853515625, 0.7079849243164062, 0.73760986328125, 0.7672348022460938, 0.7968597412109375, 0.8264846801757812, 0.856109619140625, 0.8857345581054688, 0.9153594970703125, 0.9449844360351562, 0.974609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 12.0, 11.0, 16.0, 16.0, 26.0, 42.0, 52.0, 83.0, 114.0, 145.0, 134.0, 93.0, 67.0, 61.0, 26.0, 26.0, 17.0, 15.0, 8.0, 5.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.620189666748047e-05, -9.298045188188553e-05, -8.975900709629059e-05, -8.653756231069565e-05, -8.331611752510071e-05, -8.009467273950577e-05, -7.687322795391083e-05, -7.365178316831589e-05, -7.043033838272095e-05, -6.720889359712601e-05, -6.398744881153107e-05, -6.076600402593613e-05, -5.7544559240341187e-05, -5.4323114454746246e-05, -5.1101669669151306e-05, -4.7880224883556366e-05, -4.4658780097961426e-05, -4.1437335312366486e-05, -3.8215890526771545e-05, -3.4994445741176605e-05, -3.1773000955581665e-05, -2.8551556169986725e-05, -2.5330111384391785e-05, -2.2108666598796844e-05, -1.8887221813201904e-05, -1.5665777027606964e-05, -1.2444332242012024e-05, -9.222887456417084e-06, -6.0014426708221436e-06, -2.7799978852272034e-06, 4.414469003677368e-07, 3.662891685962677e-06, 6.884336471557617e-06, 1.0105781257152557e-05, 1.3327226042747498e-05, 1.6548670828342438e-05, 1.9770115613937378e-05, 2.2991560399532318e-05, 2.6213005185127258e-05, 2.94344499707222e-05, 3.265589475631714e-05, 3.587733954191208e-05, 3.909878432750702e-05, 4.232022911310196e-05, 4.55416738986969e-05, 4.876311868429184e-05, 5.198456346988678e-05, 5.520600825548172e-05, 5.842745304107666e-05, 6.16488978266716e-05, 6.487034261226654e-05, 6.809178739786148e-05, 7.131323218345642e-05, 7.453467696905136e-05, 7.77561217546463e-05, 8.097756654024124e-05, 8.419901132583618e-05, 8.742045611143112e-05, 9.064190089702606e-05, 9.3863345682621e-05, 9.708479046821594e-05, 0.00010030623525381088, 0.00010352768003940582, 0.00010674912482500076, 0.0001099705696105957]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 3.0, 7.0, 6.0, 10.0, 16.0, 13.0, 23.0, 38.0, 52.0, 87.0, 145.0, 238.0, 462.0, 879.0, 1784.0, 3996.0, 12051.0, 84723.0, 858443.0, 67261.0, 10858.0, 3898.0, 1733.0, 758.0, 419.0, 225.0, 152.0, 74.0, 55.0, 40.0, 16.0, 16.0, 17.0, 8.0, 12.0, 6.0, 1.0, 11.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.9677734375, -0.9388504028320312, -0.9099273681640625, -0.8810043334960938, -0.852081298828125, -0.8231582641601562, -0.7942352294921875, -0.7653121948242188, -0.73638916015625, -0.7074661254882812, -0.6785430908203125, -0.6496200561523438, -0.620697021484375, -0.5917739868164062, -0.5628509521484375, -0.5339279174804688, -0.5050048828125, -0.47608184814453125, -0.4471588134765625, -0.41823577880859375, -0.389312744140625, -0.36038970947265625, -0.3314666748046875, -0.30254364013671875, -0.27362060546875, -0.24469757080078125, -0.2157745361328125, -0.18685150146484375, -0.157928466796875, -0.12900543212890625, -0.1000823974609375, -0.07115936279296875, -0.042236328125, -0.01331329345703125, 0.0156097412109375, 0.04453277587890625, 0.073455810546875, 0.10237884521484375, 0.1313018798828125, 0.16022491455078125, 0.18914794921875, 0.21807098388671875, 0.2469940185546875, 0.27591705322265625, 0.304840087890625, 0.33376312255859375, 0.3626861572265625, 0.39160919189453125, 0.4205322265625, 0.44945526123046875, 0.4783782958984375, 0.5073013305664062, 0.536224365234375, 0.5651473999023438, 0.5940704345703125, 0.6229934692382812, 0.65191650390625, 0.6808395385742188, 0.7097625732421875, 0.7386856079101562, 0.767608642578125, 0.7965316772460938, 0.8254547119140625, 0.8543777465820312, 0.88330078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 1.0, 5.0, 3.0, 12.0, 16.0, 30.0, 46.0, 89.0, 134.0, 163.0, 180.0, 128.0, 85.0, 33.0, 20.0, 18.0, 6.0, 6.0, 3.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5918960571289062, -0.5744171142578125, -0.5569381713867188, -0.539459228515625, -0.5219802856445312, -0.5045013427734375, -0.48702239990234375, -0.46954345703125, -0.45206451416015625, -0.4345855712890625, -0.41710662841796875, -0.399627685546875, -0.38214874267578125, -0.3646697998046875, -0.34719085693359375, -0.3297119140625, -0.31223297119140625, -0.2947540283203125, -0.27727508544921875, -0.259796142578125, -0.24231719970703125, -0.2248382568359375, -0.20735931396484375, -0.18988037109375, -0.17240142822265625, -0.1549224853515625, -0.13744354248046875, -0.119964599609375, -0.10248565673828125, -0.0850067138671875, -0.06752777099609375, -0.050048828125, -0.03256988525390625, -0.0150909423828125, 0.00238800048828125, 0.019866943359375, 0.03734588623046875, 0.0548248291015625, 0.07230377197265625, 0.08978271484375, 0.10726165771484375, 0.1247406005859375, 0.14221954345703125, 0.159698486328125, 0.17717742919921875, 0.1946563720703125, 0.21213531494140625, 0.2296142578125, 0.24709320068359375, 0.2645721435546875, 0.28205108642578125, 0.299530029296875, 0.31700897216796875, 0.3344879150390625, 0.35196685791015625, 0.36944580078125, 0.38692474365234375, 0.4044036865234375, 0.42188262939453125, 0.439361572265625, 0.45684051513671875, 0.4743194580078125, 0.49179840087890625, 0.50927734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 8.0, 20.0, 57.0, 132.0, 281.0, 283.0, 135.0, 47.0, 15.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.259020805358887, -4.906360149383545, -4.553699493408203, -4.201038360595703, -3.8483779430389404, -3.4957172870635986, -3.1430563926696777, -2.790395736694336, -2.437735080718994, -2.0850744247436523, -1.732413649559021, -1.3797528743743896, -1.0270922183990479, -0.674431562423706, -0.32177066802978516, 0.03088998794555664, 0.38355064392089844, 0.736211359500885, 1.0888720750808716, 1.441532850265503, 1.7941935062408447, 2.1468541622161865, 2.4995150566101074, 2.852175712585449, 3.204836368560791, 3.557497024536133, 3.9101576805114746, 4.262818336486816, 4.615479469299316, 4.9681396484375, 5.32080078125, 5.673461437225342, 6.026123046875, 6.378783702850342, 6.731444358825684, 7.084105491638184, 7.436765670776367, 7.789426803588867, 8.142087936401367, 8.49474811553955, 8.847408294677734, 9.200069427490234, 9.552729606628418, 9.905390739440918, 10.258050918579102, 10.610712051391602, 10.963373184204102, 11.316033363342285, 11.668694496154785, 12.021355628967285, 12.374015808105469, 12.726676940917969, 13.079337120056152, 13.431998252868652, 13.784658432006836, 14.137319564819336, 14.489980697631836, 14.842641830444336, 15.19530200958252, 15.54796314239502, 15.900623321533203, 16.253284454345703, 16.605945587158203, 16.958606719970703, 17.31126594543457]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 10.0, 4.0, 7.0, 8.0, 11.0, 16.0, 15.0, 17.0, 20.0, 25.0, 34.0, 35.0, 45.0, 55.0, 37.0, 47.0, 53.0, 48.0, 53.0, 39.0, 39.0, 43.0, 42.0, 32.0, 43.0, 30.0, 33.0, 27.0, 23.0, 25.0, 14.0, 13.0, 11.0, 11.0, 13.0, 9.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9902983903884888, -1.9242666959762573, -1.8582348823547363, -1.7922031879425049, -1.7261714935302734, -1.6601396799087524, -1.594107985496521, -1.528076171875, -1.4620444774627686, -1.396012783050537, -1.3299809694290161, -1.2639492750167847, -1.1979174613952637, -1.1318857669830322, -1.0658540725708008, -0.9998223185539246, -0.9337905645370483, -0.8677588105201721, -0.8017270565032959, -0.7356953620910645, -0.6696636080741882, -0.603631854057312, -0.5376001596450806, -0.47156840562820435, -0.4055366516113281, -0.3395048975944519, -0.27347317337989807, -0.20744143426418304, -0.14140969514846802, -0.0753779411315918, -0.009346216917037964, 0.05668550729751587, 0.12271714210510254, 0.18874888122081757, 0.2547806203365326, 0.3208123445510864, 0.38684409856796265, 0.45287585258483887, 0.5189075469970703, 0.5849393010139465, 0.6509710550308228, 0.717002809047699, 0.7830345630645752, 0.8490662574768066, 0.9150980114936829, 0.9811297655105591, 1.0471614599227905, 1.1131932735443115, 1.179224967956543, 1.2452566623687744, 1.3112884759902954, 1.3773201704025269, 1.4433519840240479, 1.5093836784362793, 1.5754153728485107, 1.6414470672607422, 1.7074788808822632, 1.7735105752944946, 1.8395423889160156, 1.905574083328247, 1.9716057777404785, 2.037637710571289, 2.1036694049835205, 2.169701099395752, 2.2357327938079834]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 19.0, 22.0, 27.0, 32.0, 47.0, 77.0, 101.0, 188.0, 352.0, 687.0, 1592.0, 4478.0, 16597.0, 145355.0, 3937263.0, 69617.0, 11785.0, 3504.0, 1202.0, 515.0, 290.0, 156.0, 101.0, 63.0, 44.0, 36.0, 25.0, 24.0, 7.0, 9.0, 8.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.27734375, -2.2129669189453125, -2.148590087890625, -2.0842132568359375, -2.01983642578125, -1.9554595947265625, -1.891082763671875, -1.8267059326171875, -1.7623291015625, -1.6979522705078125, -1.633575439453125, -1.5691986083984375, -1.50482177734375, -1.4404449462890625, -1.376068115234375, -1.3116912841796875, -1.247314453125, -1.1829376220703125, -1.118560791015625, -1.0541839599609375, -0.98980712890625, -0.9254302978515625, -0.861053466796875, -0.7966766357421875, -0.7322998046875, -0.6679229736328125, -0.603546142578125, -0.5391693115234375, -0.47479248046875, -0.4104156494140625, -0.346038818359375, -0.2816619873046875, -0.21728515625, -0.1529083251953125, -0.088531494140625, -0.0241546630859375, 0.04022216796875, 0.1045989990234375, 0.168975830078125, 0.2333526611328125, 0.2977294921875, 0.3621063232421875, 0.426483154296875, 0.4908599853515625, 0.55523681640625, 0.6196136474609375, 0.683990478515625, 0.7483673095703125, 0.812744140625, 0.8771209716796875, 0.941497802734375, 1.0058746337890625, 1.07025146484375, 1.1346282958984375, 1.199005126953125, 1.2633819580078125, 1.3277587890625, 1.3921356201171875, 1.456512451171875, 1.5208892822265625, 1.58526611328125, 1.6496429443359375, 1.714019775390625, 1.7783966064453125, 1.8427734375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 12.0, 12.0, 9.0, 18.0, 21.0, 34.0, 30.0, 47.0, 50.0, 56.0, 70.0, 76.0, 74.0, 68.0, 64.0, 78.0, 49.0, 49.0, 46.0, 26.0, 28.0, 24.0, 15.0, 8.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07724857330322266, -0.07472419738769531, -0.07219982147216797, -0.06967544555664062, -0.06715106964111328, -0.06462669372558594, -0.062102317810058594, -0.05957794189453125, -0.057053565979003906, -0.05452919006347656, -0.05200481414794922, -0.049480438232421875, -0.04695606231689453, -0.04443168640136719, -0.041907310485839844, -0.0393829345703125, -0.036858558654785156, -0.03433418273925781, -0.03180980682373047, -0.029285430908203125, -0.02676105499267578, -0.024236679077148438, -0.021712303161621094, -0.01918792724609375, -0.016663551330566406, -0.014139175415039062, -0.011614799499511719, -0.009090423583984375, -0.006566047668457031, -0.0040416717529296875, -0.0015172958374023438, 0.001007080078125, 0.0035314559936523438, 0.0060558319091796875, 0.008580207824707031, 0.011104583740234375, 0.013628959655761719, 0.016153335571289062, 0.018677711486816406, 0.02120208740234375, 0.023726463317871094, 0.026250839233398438, 0.02877521514892578, 0.031299591064453125, 0.03382396697998047, 0.03634834289550781, 0.038872718811035156, 0.0413970947265625, 0.043921470642089844, 0.04644584655761719, 0.04897022247314453, 0.051494598388671875, 0.05401897430419922, 0.05654335021972656, 0.059067726135253906, 0.06159210205078125, 0.0641164779663086, 0.06664085388183594, 0.06916522979736328, 0.07168960571289062, 0.07421398162841797, 0.07673835754394531, 0.07926273345947266, 0.081787109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 13.0, 18.0, 37.0, 64.0, 83.0, 146.0, 225.0, 506.0, 1123.0, 4778.0, 43184.0, 4038933.0, 94837.0, 7418.0, 1609.0, 535.0, 301.0, 156.0, 133.0, 69.0, 31.0, 29.0, 20.0, 10.0, 3.0, 8.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.76953125, -1.683685302734375, -1.59783935546875, -1.511993408203125, -1.4261474609375, -1.340301513671875, -1.25445556640625, -1.168609619140625, -1.082763671875, -0.996917724609375, -0.91107177734375, -0.825225830078125, -0.7393798828125, -0.653533935546875, -0.56768798828125, -0.481842041015625, -0.39599609375, -0.310150146484375, -0.22430419921875, -0.138458251953125, -0.0526123046875, 0.033233642578125, 0.11907958984375, 0.204925537109375, 0.290771484375, 0.376617431640625, 0.46246337890625, 0.548309326171875, 0.6341552734375, 0.720001220703125, 0.80584716796875, 0.891693115234375, 0.9775390625, 1.063385009765625, 1.14923095703125, 1.235076904296875, 1.3209228515625, 1.406768798828125, 1.49261474609375, 1.578460693359375, 1.664306640625, 1.750152587890625, 1.83599853515625, 1.921844482421875, 2.0076904296875, 2.093536376953125, 2.17938232421875, 2.265228271484375, 2.35107421875, 2.436920166015625, 2.52276611328125, 2.608612060546875, 2.6944580078125, 2.780303955078125, 2.86614990234375, 2.951995849609375, 3.037841796875, 3.123687744140625, 3.20953369140625, 3.295379638671875, 3.3812255859375, 3.467071533203125, 3.55291748046875, 3.638763427734375, 3.724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 9.0, 15.0, 15.0, 55.0, 128.0, 357.0, 2417.0, 764.0, 155.0, 76.0, 33.0, 16.0, 12.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.265869140625, -0.24998092651367188, -0.23409271240234375, -0.21820449829101562, -0.2023162841796875, -0.18642807006835938, -0.17053985595703125, -0.15465164184570312, -0.138763427734375, -0.12287521362304688, -0.10698699951171875, -0.09109878540039062, -0.0752105712890625, -0.059322357177734375, -0.04343414306640625, -0.027545928955078125, -0.01165771484375, 0.004230499267578125, 0.02011871337890625, 0.036006927490234375, 0.0518951416015625, 0.06778335571289062, 0.08367156982421875, 0.09955978393554688, 0.115447998046875, 0.13133621215820312, 0.14722442626953125, 0.16311264038085938, 0.1790008544921875, 0.19488906860351562, 0.21077728271484375, 0.22666549682617188, 0.2425537109375, 0.2584419250488281, 0.27433013916015625, 0.2902183532714844, 0.3061065673828125, 0.3219947814941406, 0.33788299560546875, 0.3537712097167969, 0.369659423828125, 0.3855476379394531, 0.40143585205078125, 0.4173240661621094, 0.4332122802734375, 0.4491004943847656, 0.46498870849609375, 0.4808769226074219, 0.49676513671875, 0.5126533508300781, 0.5285415649414062, 0.5444297790527344, 0.5603179931640625, 0.5762062072753906, 0.5920944213867188, 0.6079826354980469, 0.623870849609375, 0.6397590637207031, 0.6556472778320312, 0.6715354919433594, 0.6874237060546875, 0.7033119201660156, 0.7192001342773438, 0.7350883483886719, 0.7509765625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 22.0, 188.0, 610.0, 165.0, 15.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.36672592163086, -12.106424331665039, -11.846122741699219, -11.585821151733398, -11.325519561767578, -11.065218925476074, -10.804917335510254, -10.544615745544434, -10.284314155578613, -10.024012565612793, -9.763710975646973, -9.503409385681152, -9.243108749389648, -8.982807159423828, -8.722505569458008, -8.462203979492188, -8.201902389526367, -7.941600799560547, -7.681299209594727, -7.4209980964660645, -7.160696506500244, -6.900394916534424, -6.640093803405762, -6.379792213439941, -6.119490623474121, -5.859189033508301, -5.5988874435424805, -5.338586330413818, -5.078284740447998, -4.817983150482178, -4.557682037353516, -4.297380447387695, -4.037079811096191, -3.776778221130371, -3.51647686958313, -3.2561755180358887, -2.9958739280700684, -2.735572338104248, -2.475270986557007, -2.2149696350097656, -1.9546680450439453, -1.6943665742874146, -1.4340651035308838, -1.173763632774353, -0.9134621620178223, -0.6531606912612915, -0.39285922050476074, -0.13255774974822998, 0.12774372100830078, 0.38804519176483154, 0.6483466625213623, 0.9086481332778931, 1.1689496040344238, 1.4292510747909546, 1.6895525455474854, 1.9498540163040161, 2.210155487060547, 2.470457077026367, 2.7307584285736084, 2.9910597801208496, 3.25136137008667, 3.5116629600524902, 3.7719643115997314, 4.032265663146973, 4.292567253112793]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 12.0, 8.0, 16.0, 23.0, 31.0, 40.0, 46.0, 59.0, 81.0, 77.0, 85.0, 91.0, 91.0, 70.0, 72.0, 64.0, 39.0, 31.0, 20.0, 20.0, 13.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0033044815063477, -1.9571845531463623, -1.911064624786377, -1.864944577217102, -1.8188246488571167, -1.7727047204971313, -1.7265846729278564, -1.680464744567871, -1.6343448162078857, -1.5882248878479004, -1.542104959487915, -1.4959849119186401, -1.4498649835586548, -1.4037450551986694, -1.3576250076293945, -1.3115050792694092, -1.2653851509094238, -1.2192652225494385, -1.1731452941894531, -1.1270252466201782, -1.0809053182601929, -1.0347853899002075, -0.9886654019355774, -0.9425454139709473, -0.8964254856109619, -0.8503055572509766, -0.8041855692863464, -0.7580655813217163, -0.711945652961731, -0.6658257246017456, -0.6197057366371155, -0.5735857486724854, -0.5274658203125, -0.48134586215019226, -0.4352259039878845, -0.3891059458255768, -0.34298598766326904, -0.2968660295009613, -0.25074607133865356, -0.20462611317634583, -0.15850615501403809, -0.11238619685173035, -0.06626623868942261, -0.020146280527114868, 0.02597367763519287, 0.07209363579750061, 0.11821359395980835, 0.1643335521221161, 0.21045351028442383, 0.25657346844673157, 0.3026934266090393, 0.34881338477134705, 0.3949333429336548, 0.4410533010959625, 0.48717325925827026, 0.5332932472229004, 0.5794131755828857, 0.6255331039428711, 0.6716530919075012, 0.7177730798721313, 0.7638930082321167, 0.810012936592102, 0.8561329245567322, 0.9022529125213623, 0.9483728408813477]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 13.0, 13.0, 25.0, 45.0, 105.0, 125.0, 258.0, 506.0, 1029.0, 2966.0, 15705.0, 222424.0, 742703.0, 53195.0, 6299.0, 1718.0, 674.0, 300.0, 173.0, 90.0, 71.0, 34.0, 19.0, 15.0, 15.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6572265625, -1.5792694091796875, -1.501312255859375, -1.4233551025390625, -1.34539794921875, -1.2674407958984375, -1.189483642578125, -1.1115264892578125, -1.0335693359375, -0.9556121826171875, -0.877655029296875, -0.7996978759765625, -0.72174072265625, -0.6437835693359375, -0.565826416015625, -0.4878692626953125, -0.409912109375, -0.3319549560546875, -0.253997802734375, -0.1760406494140625, -0.09808349609375, -0.0201263427734375, 0.057830810546875, 0.1357879638671875, 0.2137451171875, 0.2917022705078125, 0.369659423828125, 0.4476165771484375, 0.52557373046875, 0.6035308837890625, 0.681488037109375, 0.7594451904296875, 0.83740234375, 0.9153594970703125, 0.993316650390625, 1.0712738037109375, 1.14923095703125, 1.2271881103515625, 1.305145263671875, 1.3831024169921875, 1.4610595703125, 1.5390167236328125, 1.616973876953125, 1.6949310302734375, 1.77288818359375, 1.8508453369140625, 1.928802490234375, 2.0067596435546875, 2.084716796875, 2.1626739501953125, 2.240631103515625, 2.3185882568359375, 2.39654541015625, 2.4745025634765625, 2.552459716796875, 2.6304168701171875, 2.7083740234375, 2.7863311767578125, 2.864288330078125, 2.9422454833984375, 3.02020263671875, 3.0981597900390625, 3.176116943359375, 3.2540740966796875, 3.33203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 11.0, 11.0, 24.0, 33.0, 37.0, 46.0, 40.0, 52.0, 68.0, 68.0, 64.0, 59.0, 66.0, 76.0, 52.0, 60.0, 46.0, 49.0, 36.0, 17.0, 29.0, 12.0, 15.0, 7.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.11956787109375, -0.1166067123413086, -0.11364555358886719, -0.11068439483642578, -0.10772323608398438, -0.10476207733154297, -0.10180091857910156, -0.09883975982666016, -0.09587860107421875, -0.09291744232177734, -0.08995628356933594, -0.08699512481689453, -0.08403396606445312, -0.08107280731201172, -0.07811164855957031, -0.0751504898071289, -0.0721893310546875, -0.0692281723022461, -0.06626701354980469, -0.06330585479736328, -0.060344696044921875, -0.05738353729248047, -0.05442237854003906, -0.051461219787597656, -0.04850006103515625, -0.045538902282714844, -0.04257774353027344, -0.03961658477783203, -0.036655426025390625, -0.03369426727294922, -0.030733108520507812, -0.027771949768066406, -0.024810791015625, -0.021849632263183594, -0.018888473510742188, -0.01592731475830078, -0.012966156005859375, -0.010004997253417969, -0.0070438385009765625, -0.004082679748535156, -0.00112152099609375, 0.0018396377563476562, 0.0048007965087890625, 0.007761955261230469, 0.010723114013671875, 0.013684272766113281, 0.016645431518554688, 0.019606590270996094, 0.0225677490234375, 0.025528907775878906, 0.028490066528320312, 0.03145122528076172, 0.034412384033203125, 0.03737354278564453, 0.04033470153808594, 0.043295860290527344, 0.04625701904296875, 0.049218177795410156, 0.05217933654785156, 0.05514049530029297, 0.058101654052734375, 0.06106281280517578, 0.06402397155761719, 0.0669851303100586, 0.0699462890625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 10.0, 13.0, 12.0, 30.0, 32.0, 44.0, 59.0, 138.0, 271.0, 455.0, 906.0, 2155.0, 6676.0, 30094.0, 282497.0, 637434.0, 69850.0, 11819.0, 3429.0, 1220.0, 621.0, 312.0, 169.0, 114.0, 52.0, 38.0, 37.0, 17.0, 10.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8408203125, -1.788543701171875, -1.73626708984375, -1.683990478515625, -1.6317138671875, -1.579437255859375, -1.52716064453125, -1.474884033203125, -1.422607421875, -1.370330810546875, -1.31805419921875, -1.265777587890625, -1.2135009765625, -1.161224365234375, -1.10894775390625, -1.056671142578125, -1.00439453125, -0.952117919921875, -0.89984130859375, -0.847564697265625, -0.7952880859375, -0.743011474609375, -0.69073486328125, -0.638458251953125, -0.586181640625, -0.533905029296875, -0.48162841796875, -0.429351806640625, -0.3770751953125, -0.324798583984375, -0.27252197265625, -0.220245361328125, -0.16796875, -0.115692138671875, -0.06341552734375, -0.011138916015625, 0.0411376953125, 0.093414306640625, 0.14569091796875, 0.197967529296875, 0.250244140625, 0.302520751953125, 0.35479736328125, 0.407073974609375, 0.4593505859375, 0.511627197265625, 0.56390380859375, 0.616180419921875, 0.66845703125, 0.720733642578125, 0.77301025390625, 0.825286865234375, 0.8775634765625, 0.929840087890625, 0.98211669921875, 1.034393310546875, 1.086669921875, 1.138946533203125, 1.19122314453125, 1.243499755859375, 1.2957763671875, 1.348052978515625, 1.40032958984375, 1.452606201171875, 1.5048828125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 7.0, 9.0, 9.0, 7.0, 18.0, 18.0, 22.0, 20.0, 31.0, 26.0, 26.0, 20.0, 46.0, 49.0, 47.0, 45.0, 53.0, 38.0, 39.0, 43.0, 59.0, 54.0, 31.0, 51.0, 28.0, 31.0, 24.0, 23.0, 15.0, 24.0, 24.0, 11.0, 18.0, 10.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3369140625, -0.3252067565917969, -0.31349945068359375, -0.3017921447753906, -0.2900848388671875, -0.2783775329589844, -0.26667022705078125, -0.2549629211425781, -0.243255615234375, -0.23154830932617188, -0.21984100341796875, -0.20813369750976562, -0.1964263916015625, -0.18471908569335938, -0.17301177978515625, -0.16130447387695312, -0.14959716796875, -0.13788986206054688, -0.12618255615234375, -0.11447525024414062, -0.1027679443359375, -0.09106063842773438, -0.07935333251953125, -0.06764602661132812, -0.055938720703125, -0.044231414794921875, -0.03252410888671875, -0.020816802978515625, -0.0091094970703125, 0.002597808837890625, 0.01430511474609375, 0.026012420654296875, 0.0377197265625, 0.049427032470703125, 0.06113433837890625, 0.07284164428710938, 0.0845489501953125, 0.09625625610351562, 0.10796356201171875, 0.11967086791992188, 0.131378173828125, 0.14308547973632812, 0.15479278564453125, 0.16650009155273438, 0.1782073974609375, 0.18991470336914062, 0.20162200927734375, 0.21332931518554688, 0.22503662109375, 0.23674392700195312, 0.24845123291015625, 0.2601585388183594, 0.2718658447265625, 0.2835731506347656, 0.29528045654296875, 0.3069877624511719, 0.318695068359375, 0.3304023742675781, 0.34210968017578125, 0.3538169860839844, 0.3655242919921875, 0.3772315979003906, 0.38893890380859375, 0.4006462097167969, 0.412353515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 8.0, 10.0, 14.0, 20.0, 15.0, 32.0, 50.0, 82.0, 192.0, 471.0, 989.0, 2354.0, 6979.0, 48642.0, 830110.0, 141664.0, 11168.0, 3242.0, 1326.0, 566.0, 285.0, 121.0, 62.0, 38.0, 37.0, 16.0, 8.0, 14.0, 7.0, 3.0, 5.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9853515625, -0.9551849365234375, -0.925018310546875, -0.8948516845703125, -0.86468505859375, -0.8345184326171875, -0.804351806640625, -0.7741851806640625, -0.7440185546875, -0.7138519287109375, -0.683685302734375, -0.6535186767578125, -0.62335205078125, -0.5931854248046875, -0.563018798828125, -0.5328521728515625, -0.502685546875, -0.4725189208984375, -0.442352294921875, -0.4121856689453125, -0.38201904296875, -0.3518524169921875, -0.321685791015625, -0.2915191650390625, -0.2613525390625, -0.2311859130859375, -0.201019287109375, -0.1708526611328125, -0.14068603515625, -0.1105194091796875, -0.080352783203125, -0.0501861572265625, -0.02001953125, 0.0101470947265625, 0.040313720703125, 0.0704803466796875, 0.10064697265625, 0.1308135986328125, 0.160980224609375, 0.1911468505859375, 0.2213134765625, 0.2514801025390625, 0.281646728515625, 0.3118133544921875, 0.34197998046875, 0.3721466064453125, 0.402313232421875, 0.4324798583984375, 0.462646484375, 0.4928131103515625, 0.522979736328125, 0.5531463623046875, 0.58331298828125, 0.6134796142578125, 0.643646240234375, 0.6738128662109375, 0.7039794921875, 0.7341461181640625, 0.764312744140625, 0.7944793701171875, 0.82464599609375, 0.8548126220703125, 0.884979248046875, 0.9151458740234375, 0.9453125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 9.0, 11.0, 36.0, 52.0, 128.0, 198.0, 257.0, 145.0, 68.0, 37.0, 16.0, 16.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000125885009765625, -0.00011967122554779053, -0.00011345744132995605, -0.00010724365711212158, -0.00010102987289428711, -9.481608867645264e-05, -8.860230445861816e-05, -8.238852024078369e-05, -7.617473602294922e-05, -6.996095180511475e-05, -6.374716758728027e-05, -5.75333833694458e-05, -5.131959915161133e-05, -4.5105814933776855e-05, -3.889203071594238e-05, -3.267824649810791e-05, -2.6464462280273438e-05, -2.0250678062438965e-05, -1.4036893844604492e-05, -7.82310962677002e-06, -1.6093254089355469e-06, 4.604458808898926e-06, 1.0818243026733398e-05, 1.703202724456787e-05, 2.3245811462402344e-05, 2.9459595680236816e-05, 3.567337989807129e-05, 4.188716411590576e-05, 4.8100948333740234e-05, 5.431473255157471e-05, 6.052851676940918e-05, 6.674230098724365e-05, 7.295608520507812e-05, 7.91698694229126e-05, 8.538365364074707e-05, 9.159743785858154e-05, 9.781122207641602e-05, 0.00010402500629425049, 0.00011023879051208496, 0.00011645257472991943, 0.0001226663589477539, 0.00012888014316558838, 0.00013509392738342285, 0.00014130771160125732, 0.0001475214958190918, 0.00015373528003692627, 0.00015994906425476074, 0.00016616284847259521, 0.0001723766326904297, 0.00017859041690826416, 0.00018480420112609863, 0.0001910179853439331, 0.00019723176956176758, 0.00020344555377960205, 0.00020965933799743652, 0.000215873122215271, 0.00022208690643310547, 0.00022830069065093994, 0.00023451447486877441, 0.0002407282590866089, 0.00024694204330444336, 0.00025315582752227783, 0.0002593696117401123, 0.0002655833959579468, 0.00027179718017578125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 1.0, 4.0, 11.0, 10.0, 17.0, 29.0, 31.0, 44.0, 58.0, 108.0, 148.0, 296.0, 513.0, 1029.0, 2301.0, 6371.0, 34281.0, 662494.0, 313312.0, 19214.0, 4528.0, 1783.0, 829.0, 476.0, 238.0, 137.0, 93.0, 64.0, 45.0, 29.0, 14.0, 12.0, 8.0, 10.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.0302734375, -1.0037612915039062, -0.9772491455078125, -0.9507369995117188, -0.924224853515625, -0.8977127075195312, -0.8712005615234375, -0.8446884155273438, -0.81817626953125, -0.7916641235351562, -0.7651519775390625, -0.7386398315429688, -0.712127685546875, -0.6856155395507812, -0.6591033935546875, -0.6325912475585938, -0.6060791015625, -0.5795669555664062, -0.5530548095703125, -0.5265426635742188, -0.500030517578125, -0.47351837158203125, -0.4470062255859375, -0.42049407958984375, -0.39398193359375, -0.36746978759765625, -0.3409576416015625, -0.31444549560546875, -0.287933349609375, -0.26142120361328125, -0.2349090576171875, -0.20839691162109375, -0.181884765625, -0.15537261962890625, -0.1288604736328125, -0.10234832763671875, -0.075836181640625, -0.04932403564453125, -0.0228118896484375, 0.00370025634765625, 0.03021240234375, 0.05672454833984375, 0.0832366943359375, 0.10974884033203125, 0.136260986328125, 0.16277313232421875, 0.1892852783203125, 0.21579742431640625, 0.2423095703125, 0.26882171630859375, 0.2953338623046875, 0.32184600830078125, 0.348358154296875, 0.37487030029296875, 0.4013824462890625, 0.42789459228515625, 0.45440673828125, 0.48091888427734375, 0.5074310302734375, 0.5339431762695312, 0.560455322265625, 0.5869674682617188, 0.6134796142578125, 0.6399917602539062, 0.66650390625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 13.0, 25.0, 31.0, 47.0, 60.0, 103.0, 103.0, 114.0, 139.0, 105.0, 71.0, 76.0, 32.0, 20.0, 17.0, 4.0, 5.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5825843811035156, -0.5680007934570312, -0.5534172058105469, -0.5388336181640625, -0.5242500305175781, -0.5096664428710938, -0.4950828552246094, -0.480499267578125, -0.4659156799316406, -0.45133209228515625, -0.4367485046386719, -0.4221649169921875, -0.4075813293457031, -0.39299774169921875, -0.3784141540527344, -0.36383056640625, -0.3492469787597656, -0.33466339111328125, -0.3200798034667969, -0.3054962158203125, -0.2909126281738281, -0.27632904052734375, -0.2617454528808594, -0.247161865234375, -0.23257827758789062, -0.21799468994140625, -0.20341110229492188, -0.1888275146484375, -0.17424392700195312, -0.15966033935546875, -0.14507675170898438, -0.1304931640625, -0.11590957641601562, -0.10132598876953125, -0.08674240112304688, -0.0721588134765625, -0.057575225830078125, -0.04299163818359375, -0.028408050537109375, -0.013824462890625, 0.000759124755859375, 0.01534271240234375, 0.029926300048828125, 0.0445098876953125, 0.059093475341796875, 0.07367706298828125, 0.08826065063476562, 0.10284423828125, 0.11742782592773438, 0.13201141357421875, 0.14659500122070312, 0.1611785888671875, 0.17576217651367188, 0.19034576416015625, 0.20492935180664062, 0.219512939453125, 0.23409652709960938, 0.24868011474609375, 0.2632637023925781, 0.2778472900390625, 0.2924308776855469, 0.30701446533203125, 0.3215980529785156, 0.336181640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 13.0, 22.0, 39.0, 67.0, 116.0, 185.0, 232.0, 143.0, 89.0, 46.0, 14.0, 15.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.83360767364502, -11.560700416564941, -11.28779411315918, -11.014886856079102, -10.741979598999023, -10.469073295593262, -10.196166038513184, -9.923258781433105, -9.650352478027344, -9.377445220947266, -9.104538917541504, -8.831631660461426, -8.558724403381348, -8.285818099975586, -8.012910842895508, -7.740004062652588, -7.46709680557251, -7.19419002532959, -6.921282768249512, -6.648375988006592, -6.375469207763672, -6.102561950683594, -5.829655170440674, -5.556748390197754, -5.283841133117676, -5.010934352874756, -4.738027095794678, -4.465120315551758, -4.192213535308838, -3.919306516647339, -3.64639949798584, -3.37349271774292, -3.100586414337158, -2.827679395675659, -2.5547726154327393, -2.2818655967712402, -2.0089588165283203, -1.7360517978668213, -1.4631447792053223, -1.1902378797531128, -0.9173309803009033, -0.6444240808486938, -0.3715171217918396, -0.09861016273498535, 0.17429673671722412, 0.4472036361694336, 0.7201106548309326, 0.9930175542831421, 1.2659244537353516, 1.538831353187561, 1.8117382526397705, 2.0846452713012695, 2.3575520515441895, 2.6304590702056885, 2.9033660888671875, 3.1762728691101074, 3.4491798877716064, 3.7220869064331055, 3.9949936866760254, 4.267900466918945, 4.540807723999023, 4.813714504241943, 5.086621284484863, 5.359528541564941, 5.632435321807861]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 8.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 25.0, 24.0, 34.0, 31.0, 29.0, 50.0, 35.0, 54.0, 45.0, 59.0, 44.0, 54.0, 55.0, 49.0, 62.0, 50.0, 28.0, 32.0, 27.0, 38.0, 24.0, 15.0, 9.0, 11.0, 16.0, 10.0, 8.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6021432876586914, -2.5201263427734375, -2.4381091594696045, -2.3560922145843506, -2.2740750312805176, -2.1920580863952637, -2.1100409030914307, -2.0280239582061768, -1.9460068941116333, -1.8639898300170898, -1.7819727659225464, -1.699955701828003, -1.617938756942749, -1.535921573638916, -1.453904628753662, -1.3718875646591187, -1.2898705005645752, -1.2078534364700317, -1.1258363723754883, -1.0438193082809448, -0.9618023037910461, -0.8797852396965027, -0.797768235206604, -0.7157511711120605, -0.6337341070175171, -0.5517170429229736, -0.46970000863075256, -0.3876829743385315, -0.30566591024398804, -0.22364884614944458, -0.1416318118572235, -0.05961477756500244, 0.022402524948120117, 0.10441957414150238, 0.18643662333488464, 0.2684536576271057, 0.35047072172164917, 0.4324877858161926, 0.5145047903060913, 0.5965218544006348, 0.6785389184951782, 0.7605559825897217, 0.8425730466842651, 0.9245900511741638, 1.0066070556640625, 1.0886242389678955, 1.1706411838531494, 1.2526582479476929, 1.3346753120422363, 1.4166923761367798, 1.4987094402313232, 1.5807265043258667, 1.6627435684204102, 1.744760513305664, 1.8267775774002075, 1.908794641494751, 1.9908117055892944, 2.072828769683838, 2.154845714569092, 2.236862897872925, 2.3188798427581787, 2.4008970260620117, 2.4829139709472656, 2.5649309158325195, 2.6469480991363525]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 6.0, 8.0, 7.0, 17.0, 19.0, 15.0, 27.0, 26.0, 60.0, 81.0, 119.0, 178.0, 299.0, 579.0, 1105.0, 3141.0, 11729.0, 63684.0, 3061058.0, 990725.0, 47668.0, 9106.0, 2583.0, 958.0, 469.0, 230.0, 128.0, 86.0, 51.0, 29.0, 31.0, 16.0, 12.0, 10.0, 9.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9697265625, -1.9098968505859375, -1.850067138671875, -1.7902374267578125, -1.73040771484375, -1.6705780029296875, -1.610748291015625, -1.5509185791015625, -1.4910888671875, -1.4312591552734375, -1.371429443359375, -1.3115997314453125, -1.25177001953125, -1.1919403076171875, -1.132110595703125, -1.0722808837890625, -1.012451171875, -0.9526214599609375, -0.892791748046875, -0.8329620361328125, -0.77313232421875, -0.7133026123046875, -0.653472900390625, -0.5936431884765625, -0.5338134765625, -0.4739837646484375, -0.414154052734375, -0.3543243408203125, -0.29449462890625, -0.2346649169921875, -0.174835205078125, -0.1150054931640625, -0.05517578125, 0.0046539306640625, 0.064483642578125, 0.1243133544921875, 0.18414306640625, 0.2439727783203125, 0.303802490234375, 0.3636322021484375, 0.4234619140625, 0.4832916259765625, 0.543121337890625, 0.6029510498046875, 0.66278076171875, 0.7226104736328125, 0.782440185546875, 0.8422698974609375, 0.902099609375, 0.9619293212890625, 1.021759033203125, 1.0815887451171875, 1.14141845703125, 1.2012481689453125, 1.261077880859375, 1.3209075927734375, 1.3807373046875, 1.4405670166015625, 1.500396728515625, 1.5602264404296875, 1.62005615234375, 1.6798858642578125, 1.739715576171875, 1.7995452880859375, 1.859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 15.0, 12.0, 19.0, 23.0, 35.0, 33.0, 36.0, 46.0, 64.0, 54.0, 56.0, 43.0, 58.0, 58.0, 69.0, 62.0, 60.0, 59.0, 30.0, 45.0, 24.0, 19.0, 19.0, 13.0, 12.0, 11.0, 3.0, 2.0, 0.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10686588287353516, -0.10392951965332031, -0.10099315643310547, -0.09805679321289062, -0.09512042999267578, -0.09218406677246094, -0.0892477035522461, -0.08631134033203125, -0.0833749771118164, -0.08043861389160156, -0.07750225067138672, -0.07456588745117188, -0.07162952423095703, -0.06869316101074219, -0.06575679779052734, -0.0628204345703125, -0.059884071350097656, -0.05694770812988281, -0.05401134490966797, -0.051074981689453125, -0.04813861846923828, -0.04520225524902344, -0.042265892028808594, -0.03932952880859375, -0.036393165588378906, -0.03345680236816406, -0.03052043914794922, -0.027584075927734375, -0.02464771270751953, -0.021711349487304688, -0.018774986267089844, -0.015838623046875, -0.012902259826660156, -0.009965896606445312, -0.007029533386230469, -0.004093170166015625, -0.0011568069458007812, 0.0017795562744140625, 0.004715919494628906, 0.00765228271484375, 0.010588645935058594, 0.013525009155273438, 0.01646137237548828, 0.019397735595703125, 0.02233409881591797, 0.025270462036132812, 0.028206825256347656, 0.0311431884765625, 0.034079551696777344, 0.03701591491699219, 0.03995227813720703, 0.042888641357421875, 0.04582500457763672, 0.04876136779785156, 0.051697731018066406, 0.05463409423828125, 0.057570457458496094, 0.06050682067871094, 0.06344318389892578, 0.06637954711914062, 0.06931591033935547, 0.07225227355957031, 0.07518863677978516, 0.078125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 14.0, 20.0, 42.0, 45.0, 67.0, 148.0, 294.0, 798.0, 3467.0, 55880.0, 4114792.0, 15699.0, 1936.0, 535.0, 215.0, 126.0, 77.0, 48.0, 24.0, 18.0, 13.0, 5.0, 8.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.15582275390625, -4.9600830078125, -4.76434326171875, -4.568603515625, -4.37286376953125, -4.1771240234375, -3.98138427734375, -3.78564453125, -3.58990478515625, -3.3941650390625, -3.19842529296875, -3.002685546875, -2.80694580078125, -2.6112060546875, -2.41546630859375, -2.2197265625, -2.02398681640625, -1.8282470703125, -1.63250732421875, -1.436767578125, -1.24102783203125, -1.0452880859375, -0.84954833984375, -0.65380859375, -0.45806884765625, -0.2623291015625, -0.06658935546875, 0.129150390625, 0.32489013671875, 0.5206298828125, 0.71636962890625, 0.912109375, 1.10784912109375, 1.3035888671875, 1.49932861328125, 1.695068359375, 1.89080810546875, 2.0865478515625, 2.28228759765625, 2.47802734375, 2.67376708984375, 2.8695068359375, 3.06524658203125, 3.260986328125, 3.45672607421875, 3.6524658203125, 3.84820556640625, 4.0439453125, 4.23968505859375, 4.4354248046875, 4.63116455078125, 4.826904296875, 5.02264404296875, 5.2183837890625, 5.41412353515625, 5.60986328125, 5.80560302734375, 6.0013427734375, 6.19708251953125, 6.392822265625, 6.58856201171875, 6.7843017578125, 6.98004150390625, 7.17578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 12.0, 20.0, 35.0, 92.0, 247.0, 1228.0, 1968.0, 301.0, 96.0, 42.0, 20.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7277984619140625, -0.694854736328125, -0.6619110107421875, -0.62896728515625, -0.5960235595703125, -0.563079833984375, -0.5301361083984375, -0.4971923828125, -0.4642486572265625, -0.431304931640625, -0.3983612060546875, -0.36541748046875, -0.3324737548828125, -0.299530029296875, -0.2665863037109375, -0.233642578125, -0.2006988525390625, -0.167755126953125, -0.1348114013671875, -0.10186767578125, -0.0689239501953125, -0.035980224609375, -0.0030364990234375, 0.0299072265625, 0.0628509521484375, 0.095794677734375, 0.1287384033203125, 0.16168212890625, 0.1946258544921875, 0.227569580078125, 0.2605133056640625, 0.29345703125, 0.3264007568359375, 0.359344482421875, 0.3922882080078125, 0.42523193359375, 0.4581756591796875, 0.491119384765625, 0.5240631103515625, 0.5570068359375, 0.5899505615234375, 0.622894287109375, 0.6558380126953125, 0.68878173828125, 0.7217254638671875, 0.754669189453125, 0.7876129150390625, 0.820556640625, 0.8535003662109375, 0.886444091796875, 0.9193878173828125, 0.95233154296875, 0.9852752685546875, 1.018218994140625, 1.0511627197265625, 1.0841064453125, 1.1170501708984375, 1.149993896484375, 1.1829376220703125, 1.21588134765625, 1.2488250732421875, 1.281768798828125, 1.3147125244140625, 1.34765625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 16.0, 30.0, 108.0, 275.0, 333.0, 151.0, 61.0, 14.0, 11.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.704033851623535, -9.428254127502441, -9.152475357055664, -8.87669563293457, -8.600915908813477, -8.3251371383667, -8.049357414245605, -7.77357816696167, -7.497798919677734, -7.222019672393799, -6.946239948272705, -6.6704607009887695, -6.394681453704834, -6.118902206420898, -5.843122482299805, -5.567343235015869, -5.291563510894775, -5.01578426361084, -4.740004539489746, -4.4642252922058105, -4.188446044921875, -3.9126665592193604, -3.6368870735168457, -3.36110782623291, -3.0853283405303955, -2.809548854827881, -2.5337696075439453, -2.2579901218414307, -1.9822107553482056, -1.7064313888549805, -1.4306519031524658, -1.1548725366592407, -0.8790936470031738, -0.6033142805099487, -0.32753485441207886, -0.051755428314208984, 0.2240239381790161, 0.4998033046722412, 0.7755827903747559, 1.051362156867981, 1.327141523361206, 1.6029208898544312, 1.8787002563476562, 2.154479742050171, 2.4302592277526855, 2.706038475036621, 2.9818179607391357, 3.2575974464416504, 3.533376693725586, 3.8091561794281006, 4.084935665130615, 4.360714912414551, 4.636494159698486, 4.912273406982422, 5.188053131103516, 5.463832378387451, 5.739611625671387, 6.015390872955322, 6.291170597076416, 6.566949844360352, 6.842729091644287, 7.118508338928223, 7.394288063049316, 7.670067310333252, 7.945847034454346]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 9.0, 20.0, 23.0, 27.0, 54.0, 64.0, 72.0, 77.0, 81.0, 104.0, 85.0, 68.0, 54.0, 72.0, 41.0, 31.0, 27.0, 22.0, 19.0, 14.0, 7.0, 0.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5929620265960693, -2.514258623123169, -2.4355552196502686, -2.356851816177368, -2.2781484127044678, -2.1994450092315674, -2.120741605758667, -2.0420382022857666, -1.9633347988128662, -1.8846313953399658, -1.8059279918670654, -1.727224588394165, -1.6485211849212646, -1.5698177814483643, -1.4911143779754639, -1.4124109745025635, -1.333707571029663, -1.2550041675567627, -1.1763007640838623, -1.097597360610962, -1.0188939571380615, -0.9401905536651611, -0.8614871501922607, -0.7827837467193604, -0.70408034324646, -0.6253769397735596, -0.5466735363006592, -0.4679701328277588, -0.3892667293548584, -0.310563325881958, -0.23185992240905762, -0.15315651893615723, -0.07445335388183594, 0.004250049591064453, 0.08295345306396484, 0.16165685653686523, 0.24036026000976562, 0.319063663482666, 0.3977670669555664, 0.4764704704284668, 0.5551738739013672, 0.6338772773742676, 0.712580680847168, 0.7912840843200684, 0.8699874877929688, 0.9486908912658691, 1.0273942947387695, 1.10609769821167, 1.1848011016845703, 1.2635045051574707, 1.342207908630371, 1.4209113121032715, 1.4996147155761719, 1.5783181190490723, 1.6570215225219727, 1.735724925994873, 1.8144283294677734, 1.8931317329406738, 1.9718351364135742, 2.0505385398864746, 2.129241943359375, 2.2079453468322754, 2.286648750305176, 2.365352153778076, 2.4440555572509766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 10.0, 10.0, 21.0, 26.0, 39.0, 50.0, 86.0, 120.0, 169.0, 276.0, 520.0, 1048.0, 2332.0, 8187.0, 56842.0, 520817.0, 405612.0, 41617.0, 6451.0, 2091.0, 898.0, 449.0, 287.0, 189.0, 125.0, 70.0, 52.0, 44.0, 22.0, 24.0, 12.0, 12.0, 14.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.025390625, -1.9638824462890625, -1.902374267578125, -1.8408660888671875, -1.77935791015625, -1.7178497314453125, -1.656341552734375, -1.5948333740234375, -1.5333251953125, -1.4718170166015625, -1.410308837890625, -1.3488006591796875, -1.28729248046875, -1.2257843017578125, -1.164276123046875, -1.1027679443359375, -1.041259765625, -0.9797515869140625, -0.918243408203125, -0.8567352294921875, -0.79522705078125, -0.7337188720703125, -0.672210693359375, -0.6107025146484375, -0.5491943359375, -0.4876861572265625, -0.426177978515625, -0.3646697998046875, -0.30316162109375, -0.2416534423828125, -0.180145263671875, -0.1186370849609375, -0.05712890625, 0.0043792724609375, 0.065887451171875, 0.1273956298828125, 0.18890380859375, 0.2504119873046875, 0.311920166015625, 0.3734283447265625, 0.4349365234375, 0.4964447021484375, 0.557952880859375, 0.6194610595703125, 0.68096923828125, 0.7424774169921875, 0.803985595703125, 0.8654937744140625, 0.927001953125, 0.9885101318359375, 1.050018310546875, 1.1115264892578125, 1.17303466796875, 1.2345428466796875, 1.296051025390625, 1.3575592041015625, 1.4190673828125, 1.4805755615234375, 1.542083740234375, 1.6035919189453125, 1.66510009765625, 1.7266082763671875, 1.788116455078125, 1.8496246337890625, 1.9111328125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 11.0, 20.0, 32.0, 52.0, 84.0, 123.0, 131.0, 125.0, 142.0, 106.0, 81.0, 42.0, 21.0, 14.0, 16.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2802734375, -0.2723426818847656, -0.26441192626953125, -0.2564811706542969, -0.2485504150390625, -0.24061965942382812, -0.23268890380859375, -0.22475814819335938, -0.216827392578125, -0.20889663696289062, -0.20096588134765625, -0.19303512573242188, -0.1851043701171875, -0.17717361450195312, -0.16924285888671875, -0.16131210327148438, -0.15338134765625, -0.14545059204101562, -0.13751983642578125, -0.12958908081054688, -0.1216583251953125, -0.11372756958007812, -0.10579681396484375, -0.09786605834960938, -0.089935302734375, -0.08200454711914062, -0.07407379150390625, -0.06614303588867188, -0.0582122802734375, -0.050281524658203125, -0.04235076904296875, -0.034420013427734375, -0.0264892578125, -0.018558502197265625, -0.01062774658203125, -0.002696990966796875, 0.0052337646484375, 0.013164520263671875, 0.02109527587890625, 0.029026031494140625, 0.036956787109375, 0.044887542724609375, 0.05281829833984375, 0.060749053955078125, 0.0686798095703125, 0.07661056518554688, 0.08454132080078125, 0.09247207641601562, 0.10040283203125, 0.10833358764648438, 0.11626434326171875, 0.12419509887695312, 0.1321258544921875, 0.14005661010742188, 0.14798736572265625, 0.15591812133789062, 0.163848876953125, 0.17177963256835938, 0.17971038818359375, 0.18764114379882812, 0.1955718994140625, 0.20350265502929688, 0.21143341064453125, 0.21936416625976562, 0.227294921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 9.0, 10.0, 9.0, 25.0, 20.0, 34.0, 56.0, 88.0, 130.0, 183.0, 303.0, 531.0, 921.0, 1958.0, 3888.0, 8701.0, 21403.0, 56743.0, 159134.0, 351285.0, 274526.0, 104130.0, 37391.0, 14739.0, 6087.0, 2851.0, 1440.0, 767.0, 447.0, 254.0, 152.0, 101.0, 73.0, 43.0, 38.0, 18.0, 19.0, 13.0, 4.0, 7.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.509246826171875, -0.48870849609375, -0.468170166015625, -0.4476318359375, -0.427093505859375, -0.40655517578125, -0.386016845703125, -0.365478515625, -0.344940185546875, -0.32440185546875, -0.303863525390625, -0.2833251953125, -0.262786865234375, -0.24224853515625, -0.221710205078125, -0.201171875, -0.180633544921875, -0.16009521484375, -0.139556884765625, -0.1190185546875, -0.098480224609375, -0.07794189453125, -0.057403564453125, -0.036865234375, -0.016326904296875, 0.00421142578125, 0.024749755859375, 0.0452880859375, 0.065826416015625, 0.08636474609375, 0.106903076171875, 0.12744140625, 0.147979736328125, 0.16851806640625, 0.189056396484375, 0.2095947265625, 0.230133056640625, 0.25067138671875, 0.271209716796875, 0.291748046875, 0.312286376953125, 0.33282470703125, 0.353363037109375, 0.3739013671875, 0.394439697265625, 0.41497802734375, 0.435516357421875, 0.4560546875, 0.476593017578125, 0.49713134765625, 0.517669677734375, 0.5382080078125, 0.558746337890625, 0.57928466796875, 0.599822998046875, 0.620361328125, 0.640899658203125, 0.66143798828125, 0.681976318359375, 0.7025146484375, 0.723052978515625, 0.74359130859375, 0.764129638671875, 0.78466796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 9.0, 9.0, 6.0, 13.0, 18.0, 12.0, 16.0, 17.0, 28.0, 36.0, 32.0, 44.0, 31.0, 38.0, 42.0, 48.0, 53.0, 52.0, 41.0, 58.0, 47.0, 50.0, 39.0, 36.0, 26.0, 29.0, 24.0, 30.0, 25.0, 11.0, 16.0, 8.0, 12.0, 13.0, 10.0, 8.0, 2.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4697265625, -0.4561195373535156, -0.44251251220703125, -0.4289054870605469, -0.4152984619140625, -0.4016914367675781, -0.38808441162109375, -0.3744773864746094, -0.360870361328125, -0.3472633361816406, -0.33365631103515625, -0.3200492858886719, -0.3064422607421875, -0.2928352355957031, -0.27922821044921875, -0.2656211853027344, -0.25201416015625, -0.23840713500976562, -0.22480010986328125, -0.21119308471679688, -0.1975860595703125, -0.18397903442382812, -0.17037200927734375, -0.15676498413085938, -0.143157958984375, -0.12955093383789062, -0.11594390869140625, -0.10233688354492188, -0.0887298583984375, -0.07512283325195312, -0.06151580810546875, -0.047908782958984375, -0.0343017578125, -0.020694732666015625, -0.00708770751953125, 0.006519317626953125, 0.0201263427734375, 0.033733367919921875, 0.04734039306640625, 0.060947418212890625, 0.074554443359375, 0.08816146850585938, 0.10176849365234375, 0.11537551879882812, 0.1289825439453125, 0.14258956909179688, 0.15619659423828125, 0.16980361938476562, 0.18341064453125, 0.19701766967773438, 0.21062469482421875, 0.22423171997070312, 0.2378387451171875, 0.2514457702636719, 0.26505279541015625, 0.2786598205566406, 0.292266845703125, 0.3058738708496094, 0.31948089599609375, 0.3330879211425781, 0.3466949462890625, 0.3603019714355469, 0.37390899658203125, 0.3875160217285156, 0.401123046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 7.0, 17.0, 25.0, 36.0, 60.0, 97.0, 151.0, 257.0, 571.0, 1144.0, 2934.0, 9246.0, 48157.0, 613841.0, 333385.0, 27838.0, 6558.0, 2232.0, 944.0, 462.0, 216.0, 125.0, 68.0, 56.0, 34.0, 23.0, 13.0, 16.0, 8.0, 6.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.87451171875, -0.84942626953125, -0.8243408203125, -0.79925537109375, -0.774169921875, -0.74908447265625, -0.7239990234375, -0.69891357421875, -0.673828125, -0.64874267578125, -0.6236572265625, -0.59857177734375, -0.573486328125, -0.54840087890625, -0.5233154296875, -0.49822998046875, -0.47314453125, -0.44805908203125, -0.4229736328125, -0.39788818359375, -0.372802734375, -0.34771728515625, -0.3226318359375, -0.29754638671875, -0.2724609375, -0.24737548828125, -0.2222900390625, -0.19720458984375, -0.172119140625, -0.14703369140625, -0.1219482421875, -0.09686279296875, -0.07177734375, -0.04669189453125, -0.0216064453125, 0.00347900390625, 0.028564453125, 0.05364990234375, 0.0787353515625, 0.10382080078125, 0.12890625, 0.15399169921875, 0.1790771484375, 0.20416259765625, 0.229248046875, 0.25433349609375, 0.2794189453125, 0.30450439453125, 0.32958984375, 0.35467529296875, 0.3797607421875, 0.40484619140625, 0.429931640625, 0.45501708984375, 0.4801025390625, 0.50518798828125, 0.5302734375, 0.55535888671875, 0.5804443359375, 0.60552978515625, 0.630615234375, 0.65570068359375, 0.6807861328125, 0.70587158203125, 0.73095703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 4.0, 10.0, 11.0, 26.0, 31.0, 37.0, 63.0, 75.0, 85.0, 113.0, 105.0, 87.0, 89.0, 64.0, 36.0, 43.0, 28.0, 20.0, 13.0, 13.0, 9.0, 8.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081031799316406e-05, -6.774440407752991e-05, -6.467849016189575e-05, -6.16125762462616e-05, -5.854666233062744e-05, -5.5480748414993286e-05, -5.241483449935913e-05, -4.9348920583724976e-05, -4.628300666809082e-05, -4.3217092752456665e-05, -4.015117883682251e-05, -3.7085264921188354e-05, -3.40193510055542e-05, -3.0953437089920044e-05, -2.788752317428589e-05, -2.4821609258651733e-05, -2.1755695343017578e-05, -1.8689781427383423e-05, -1.5623867511749268e-05, -1.2557953596115112e-05, -9.492039680480957e-06, -6.426125764846802e-06, -3.3602118492126465e-06, -2.942979335784912e-07, 2.771615982055664e-06, 5.837529897689819e-06, 8.903443813323975e-06, 1.196935772895813e-05, 1.5035271644592285e-05, 1.810118556022644e-05, 2.1167099475860596e-05, 2.423301339149475e-05, 2.7298927307128906e-05, 3.036484122276306e-05, 3.343075513839722e-05, 3.649666905403137e-05, 3.956258296966553e-05, 4.262849688529968e-05, 4.569441080093384e-05, 4.876032471656799e-05, 5.182623863220215e-05, 5.4892152547836304e-05, 5.795806646347046e-05, 6.1023980379104614e-05, 6.408989429473877e-05, 6.715580821037292e-05, 7.022172212600708e-05, 7.328763604164124e-05, 7.635354995727539e-05, 7.941946387290955e-05, 8.24853777885437e-05, 8.555129170417786e-05, 8.861720561981201e-05, 9.168311953544617e-05, 9.474903345108032e-05, 9.781494736671448e-05, 0.00010088086128234863, 0.00010394677519798279, 0.00010701268911361694, 0.0001100786030292511, 0.00011314451694488525, 0.00011621043086051941, 0.00011927634477615356, 0.00012234225869178772, 0.00012540817260742188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 14.0, 20.0, 21.0, 56.0, 72.0, 131.0, 288.0, 603.0, 1257.0, 3144.0, 10333.0, 56121.0, 638806.0, 299222.0, 27818.0, 6501.0, 2230.0, 965.0, 434.0, 235.0, 113.0, 59.0, 41.0, 19.0, 18.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.75927734375, -0.73614501953125, -0.7130126953125, -0.68988037109375, -0.666748046875, -0.64361572265625, -0.6204833984375, -0.59735107421875, -0.57421875, -0.55108642578125, -0.5279541015625, -0.50482177734375, -0.481689453125, -0.45855712890625, -0.4354248046875, -0.41229248046875, -0.38916015625, -0.36602783203125, -0.3428955078125, -0.31976318359375, -0.296630859375, -0.27349853515625, -0.2503662109375, -0.22723388671875, -0.2041015625, -0.18096923828125, -0.1578369140625, -0.13470458984375, -0.111572265625, -0.08843994140625, -0.0653076171875, -0.04217529296875, -0.01904296875, 0.00408935546875, 0.0272216796875, 0.05035400390625, 0.073486328125, 0.09661865234375, 0.1197509765625, 0.14288330078125, 0.166015625, 0.18914794921875, 0.2122802734375, 0.23541259765625, 0.258544921875, 0.28167724609375, 0.3048095703125, 0.32794189453125, 0.35107421875, 0.37420654296875, 0.3973388671875, 0.42047119140625, 0.443603515625, 0.46673583984375, 0.4898681640625, 0.51300048828125, 0.5361328125, 0.55926513671875, 0.5823974609375, 0.60552978515625, 0.628662109375, 0.65179443359375, 0.6749267578125, 0.69805908203125, 0.72119140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 10.0, 16.0, 19.0, 21.0, 41.0, 66.0, 92.0, 93.0, 104.0, 100.0, 83.0, 94.0, 72.0, 58.0, 37.0, 15.0, 15.0, 8.0, 14.0, 3.0, 5.0, 10.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.379150390625, -0.36565399169921875, -0.3521575927734375, -0.33866119384765625, -0.325164794921875, -0.31166839599609375, -0.2981719970703125, -0.28467559814453125, -0.27117919921875, -0.25768280029296875, -0.2441864013671875, -0.23069000244140625, -0.217193603515625, -0.20369720458984375, -0.1902008056640625, -0.17670440673828125, -0.1632080078125, -0.14971160888671875, -0.1362152099609375, -0.12271881103515625, -0.109222412109375, -0.09572601318359375, -0.0822296142578125, -0.06873321533203125, -0.05523681640625, -0.04174041748046875, -0.0282440185546875, -0.01474761962890625, -0.001251220703125, 0.01224517822265625, 0.0257415771484375, 0.03923797607421875, 0.052734375, 0.06623077392578125, 0.0797271728515625, 0.09322357177734375, 0.106719970703125, 0.12021636962890625, 0.1337127685546875, 0.14720916748046875, 0.16070556640625, 0.17420196533203125, 0.1876983642578125, 0.20119476318359375, 0.214691162109375, 0.22818756103515625, 0.2416839599609375, 0.25518035888671875, 0.2686767578125, 0.28217315673828125, 0.2956695556640625, 0.30916595458984375, 0.322662353515625, 0.33615875244140625, 0.3496551513671875, 0.36315155029296875, 0.37664794921875, 0.39014434814453125, 0.4036407470703125, 0.41713714599609375, 0.430633544921875, 0.44412994384765625, 0.4576263427734375, 0.47112274169921875, 0.484619140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 27.0, 67.0, 141.0, 252.0, 246.0, 136.0, 59.0, 34.0, 18.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.599502563476562, -13.259078979492188, -12.918655395507812, -12.578231811523438, -12.237807273864746, -11.897383689880371, -11.556960105895996, -11.216536521911621, -10.87611198425293, -10.535688400268555, -10.19526481628418, -9.854841232299805, -9.514416694641113, -9.173993110656738, -8.833569526672363, -8.493145942687988, -8.152722358703613, -7.812298774719238, -7.471874713897705, -7.13145112991333, -6.791027069091797, -6.450603485107422, -6.110179901123047, -5.769756317138672, -5.429332256317139, -5.088908672332764, -4.7484846115112305, -4.4080610275268555, -4.0676374435424805, -3.7272133827209473, -3.3867897987365723, -3.046365976333618, -2.705942153930664, -2.36551833152771, -2.025094509124756, -1.6846709251403809, -1.3442471027374268, -1.0038232803344727, -0.6633996963500977, -0.32297587394714355, 0.017447948455810547, 0.3578717112541199, 0.6982954740524292, 1.0387191772460938, 1.3791429996490479, 1.719566822052002, 2.059990406036377, 2.400414228439331, 2.740838050842285, 3.0812618732452393, 3.4216856956481934, 3.7621092796325684, 4.102533340454102, 4.442956924438477, 4.783380508422852, 5.123804092407227, 5.46422815322876, 5.804651737213135, 6.145075798034668, 6.485499382019043, 6.825922966003418, 7.166347026824951, 7.506770610809326, 7.847194671630859, 8.187618255615234]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 6.0, 14.0, 12.0, 15.0, 19.0, 24.0, 24.0, 33.0, 46.0, 51.0, 45.0, 41.0, 54.0, 50.0, 72.0, 51.0, 53.0, 59.0, 63.0, 41.0, 39.0, 40.0, 32.0, 19.0, 22.0, 24.0, 11.0, 8.0, 5.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2581593990325928, -3.1566693782806396, -3.0551791191101074, -2.9536890983581543, -2.852199077606201, -2.750709056854248, -2.649218797683716, -2.5477287769317627, -2.4462385177612305, -2.3447484970092773, -2.243258237838745, -2.141768217086792, -2.040278196334839, -1.9387880563735962, -1.8372979164123535, -1.7358078956604004, -1.6343178749084473, -1.5328277349472046, -1.4313377141952515, -1.3298475742340088, -1.2283575534820557, -1.126867413520813, -1.0253772735595703, -0.9238871932029724, -0.8223971128463745, -0.7209070324897766, -0.6194169521331787, -0.517926812171936, -0.41643673181533813, -0.31494665145874023, -0.21345651149749756, -0.11196643114089966, -0.01047658920288086, 0.09101350605487823, 0.19250360131263733, 0.2939937114715576, 0.3954837918281555, 0.4969738721847534, 0.5984640121459961, 0.699954092502594, 0.8014441728591919, 0.9029342532157898, 1.0044243335723877, 1.1059144735336304, 1.207404613494873, 1.3088946342468262, 1.4103847742080688, 1.5118749141693115, 1.6133649349212646, 1.7148550748825073, 1.8163450956344604, 1.9178352355957031, 2.0193252563476562, 2.1208152770996094, 2.2223055362701416, 2.3237955570220947, 2.425285816192627, 2.52677583694458, 2.6282660961151123, 2.7297561168670654, 2.8312461376190186, 2.932736396789551, 3.034226417541504, 3.135716438293457, 3.23720645904541]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 10.0, 12.0, 21.0, 19.0, 18.0, 33.0, 39.0, 62.0, 75.0, 124.0, 167.0, 282.0, 609.0, 1645.0, 7255.0, 56019.0, 4001550.0, 111733.0, 10507.0, 2358.0, 759.0, 406.0, 230.0, 111.0, 84.0, 50.0, 27.0, 17.0, 13.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.56622314453125, -2.4898681640625, -2.41351318359375, -2.337158203125, -2.26080322265625, -2.1844482421875, -2.10809326171875, -2.03173828125, -1.95538330078125, -1.8790283203125, -1.80267333984375, -1.726318359375, -1.64996337890625, -1.5736083984375, -1.49725341796875, -1.4208984375, -1.34454345703125, -1.2681884765625, -1.19183349609375, -1.115478515625, -1.03912353515625, -0.9627685546875, -0.88641357421875, -0.81005859375, -0.73370361328125, -0.6573486328125, -0.58099365234375, -0.504638671875, -0.42828369140625, -0.3519287109375, -0.27557373046875, -0.19921875, -0.12286376953125, -0.0465087890625, 0.02984619140625, 0.106201171875, 0.18255615234375, 0.2589111328125, 0.33526611328125, 0.41162109375, 0.48797607421875, 0.5643310546875, 0.64068603515625, 0.717041015625, 0.79339599609375, 0.8697509765625, 0.94610595703125, 1.0224609375, 1.09881591796875, 1.1751708984375, 1.25152587890625, 1.327880859375, 1.40423583984375, 1.4805908203125, 1.55694580078125, 1.63330078125, 1.70965576171875, 1.7860107421875, 1.86236572265625, 1.938720703125, 2.01507568359375, 2.0914306640625, 2.16778564453125, 2.244140625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 18.0, 30.0, 43.0, 75.0, 93.0, 117.0, 130.0, 124.0, 114.0, 97.0, 56.0, 41.0, 27.0, 21.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2822265625, -0.2743644714355469, -0.26650238037109375, -0.2586402893066406, -0.2507781982421875, -0.24291610717773438, -0.23505401611328125, -0.22719192504882812, -0.219329833984375, -0.21146774291992188, -0.20360565185546875, -0.19574356079101562, -0.1878814697265625, -0.18001937866210938, -0.17215728759765625, -0.16429519653320312, -0.15643310546875, -0.14857101440429688, -0.14070892333984375, -0.13284683227539062, -0.1249847412109375, -0.11712265014648438, -0.10926055908203125, -0.10139846801757812, -0.093536376953125, -0.08567428588867188, -0.07781219482421875, -0.06995010375976562, -0.0620880126953125, -0.054225921630859375, -0.04636383056640625, -0.038501739501953125, -0.0306396484375, -0.022777557373046875, -0.01491546630859375, -0.007053375244140625, 0.0008087158203125, 0.008670806884765625, 0.01653289794921875, 0.024394989013671875, 0.032257080078125, 0.040119171142578125, 0.04798126220703125, 0.055843353271484375, 0.0637054443359375, 0.07156753540039062, 0.07942962646484375, 0.08729171752929688, 0.09515380859375, 0.10301589965820312, 0.11087799072265625, 0.11874008178710938, 0.1266021728515625, 0.13446426391601562, 0.14232635498046875, 0.15018844604492188, 0.158050537109375, 0.16591262817382812, 0.17377471923828125, 0.18163681030273438, 0.1894989013671875, 0.19736099243164062, 0.20522308349609375, 0.21308517456054688, 0.220947265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 11.0, 4.0, 8.0, 23.0, 19.0, 43.0, 84.0, 178.0, 400.0, 945.0, 2276.0, 6309.0, 21660.0, 113975.0, 3649287.0, 345636.0, 37486.0, 10096.0, 3383.0, 1333.0, 586.0, 250.0, 146.0, 62.0, 29.0, 21.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.2436676025390625, -1.203155517578125, -1.1626434326171875, -1.12213134765625, -1.0816192626953125, -1.041107177734375, -1.0005950927734375, -0.9600830078125, -0.9195709228515625, -0.879058837890625, -0.8385467529296875, -0.79803466796875, -0.7575225830078125, -0.717010498046875, -0.6764984130859375, -0.635986328125, -0.5954742431640625, -0.554962158203125, -0.5144500732421875, -0.47393798828125, -0.4334259033203125, -0.392913818359375, -0.3524017333984375, -0.3118896484375, -0.2713775634765625, -0.230865478515625, -0.1903533935546875, -0.14984130859375, -0.1093292236328125, -0.068817138671875, -0.0283050537109375, 0.01220703125, 0.0527191162109375, 0.093231201171875, 0.1337432861328125, 0.17425537109375, 0.2147674560546875, 0.255279541015625, 0.2957916259765625, 0.3363037109375, 0.3768157958984375, 0.417327880859375, 0.4578399658203125, 0.49835205078125, 0.5388641357421875, 0.579376220703125, 0.6198883056640625, 0.660400390625, 0.7009124755859375, 0.741424560546875, 0.7819366455078125, 0.82244873046875, 0.8629608154296875, 0.903472900390625, 0.9439849853515625, 0.9844970703125, 1.0250091552734375, 1.065521240234375, 1.1060333251953125, 1.14654541015625, 1.1870574951171875, 1.227569580078125, 1.2680816650390625, 1.30859375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 9.0, 9.0, 10.0, 13.0, 15.0, 27.0, 28.0, 39.0, 90.0, 125.0, 264.0, 860.0, 1724.0, 452.0, 161.0, 87.0, 52.0, 30.0, 15.0, 13.0, 17.0, 14.0, 6.0, 8.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.425537109375, -0.4134559631347656, -0.40137481689453125, -0.3892936706542969, -0.3772125244140625, -0.3651313781738281, -0.35305023193359375, -0.3409690856933594, -0.328887939453125, -0.3168067932128906, -0.30472564697265625, -0.2926445007324219, -0.2805633544921875, -0.2684822082519531, -0.25640106201171875, -0.24431991577148438, -0.23223876953125, -0.22015762329101562, -0.20807647705078125, -0.19599533081054688, -0.1839141845703125, -0.17183303833007812, -0.15975189208984375, -0.14767074584960938, -0.135589599609375, -0.12350845336914062, -0.11142730712890625, -0.09934616088867188, -0.0872650146484375, -0.07518386840820312, -0.06310272216796875, -0.051021575927734375, -0.0389404296875, -0.026859283447265625, -0.01477813720703125, -0.002696990966796875, 0.0093841552734375, 0.021465301513671875, 0.03354644775390625, 0.045627593994140625, 0.057708740234375, 0.06978988647460938, 0.08187103271484375, 0.09395217895507812, 0.1060333251953125, 0.11811447143554688, 0.13019561767578125, 0.14227676391601562, 0.15435791015625, 0.16643905639648438, 0.17852020263671875, 0.19060134887695312, 0.2026824951171875, 0.21476364135742188, 0.22684478759765625, 0.23892593383789062, 0.251007080078125, 0.2630882263183594, 0.27516937255859375, 0.2872505187988281, 0.2993316650390625, 0.3114128112792969, 0.32349395751953125, 0.3355751037597656, 0.34765625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 29.0, 81.0, 289.0, 393.0, 147.0, 49.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.312604904174805, -6.104586124420166, -5.896567344665527, -5.688548564910889, -5.48052978515625, -5.272511005401611, -5.064492225646973, -4.856472969055176, -4.648454666137695, -4.440435886383057, -4.232417106628418, -4.024398326873779, -3.8163795471191406, -3.608360767364502, -3.400341749191284, -3.1923229694366455, -2.9843039512634277, -2.776285171508789, -2.5682663917541504, -2.3602476119995117, -2.152228832244873, -1.9442099332809448, -1.7361910343170166, -1.528172254562378, -1.3201534748077393, -1.1121346950531006, -0.9041158556938171, -0.6960970163345337, -0.488078236579895, -0.28005945682525635, -0.07204055786132812, 0.13597822189331055, 0.343996524810791, 0.5520153045654297, 0.7600341439247131, 0.9680529832839966, 1.1760717630386353, 1.384090542793274, 1.5921094417572021, 1.8001282215118408, 2.0081470012664795, 2.216165781021118, 2.424184560775757, 2.6322035789489746, 2.8402223587036133, 3.048241138458252, 3.2562599182128906, 3.4642786979675293, 3.672297477722168, 3.8803162574768066, 4.088335037231445, 4.296353816986084, 4.504372596740723, 4.712391376495361, 4.92041015625, 5.128429412841797, 5.336447715759277, 5.544466495513916, 5.752485275268555, 5.960504055023193, 6.168522834777832, 6.376541614532471, 6.584560394287109, 6.792579650878906, 7.000598430633545]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 14.0, 20.0, 26.0, 16.0, 27.0, 36.0, 22.0, 55.0, 44.0, 43.0, 42.0, 43.0, 34.0, 67.0, 42.0, 55.0, 66.0, 48.0, 42.0, 35.0, 39.0, 31.0, 20.0, 16.0, 22.0, 19.0, 13.0, 10.0, 9.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.987533688545227, -0.9483421444892883, -0.9091506004333496, -0.8699590563774109, -0.8307675123214722, -0.7915759682655334, -0.7523844242095947, -0.713192880153656, -0.6740013360977173, -0.6348097920417786, -0.5956182479858398, -0.5564267039299011, -0.5172351598739624, -0.4780436158180237, -0.43885207176208496, -0.39966052770614624, -0.3604689836502075, -0.3212774395942688, -0.2820858955383301, -0.24289435148239136, -0.20370280742645264, -0.16451126337051392, -0.1253197193145752, -0.08612817525863647, -0.046936631202697754, -0.007745087146759033, 0.03144645690917969, 0.07063800096511841, 0.10982954502105713, 0.14902108907699585, 0.18821263313293457, 0.2274041771888733, 0.26659584045410156, 0.3057873845100403, 0.344978928565979, 0.3841704726219177, 0.42336201667785645, 0.46255356073379517, 0.5017451047897339, 0.5409366488456726, 0.5801281929016113, 0.61931973695755, 0.6585112810134888, 0.6977028250694275, 0.7368943691253662, 0.7760859131813049, 0.8152774572372437, 0.8544690012931824, 0.8936605453491211, 0.9328520894050598, 0.9720436334609985, 1.011235237121582, 1.050426721572876, 1.08961820602417, 1.1288098096847534, 1.168001413345337, 1.2071928977966309, 1.2463843822479248, 1.2855759859085083, 1.3247675895690918, 1.3639590740203857, 1.4031505584716797, 1.4423421621322632, 1.4815337657928467, 1.5207252502441406]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 14.0, 5.0, 13.0, 21.0, 14.0, 40.0, 30.0, 53.0, 82.0, 103.0, 184.0, 302.0, 544.0, 997.0, 2267.0, 7512.0, 37125.0, 261904.0, 602135.0, 110050.0, 17461.0, 4240.0, 1615.0, 693.0, 388.0, 242.0, 156.0, 96.0, 63.0, 54.0, 50.0, 19.0, 14.0, 16.0, 6.0, 16.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.18359375, -2.126556396484375, -2.06951904296875, -2.012481689453125, -1.9554443359375, -1.898406982421875, -1.84136962890625, -1.784332275390625, -1.727294921875, -1.670257568359375, -1.61322021484375, -1.556182861328125, -1.4991455078125, -1.442108154296875, -1.38507080078125, -1.328033447265625, -1.27099609375, -1.213958740234375, -1.15692138671875, -1.099884033203125, -1.0428466796875, -0.985809326171875, -0.92877197265625, -0.871734619140625, -0.814697265625, -0.757659912109375, -0.70062255859375, -0.643585205078125, -0.5865478515625, -0.529510498046875, -0.47247314453125, -0.415435791015625, -0.3583984375, -0.301361083984375, -0.24432373046875, -0.187286376953125, -0.1302490234375, -0.073211669921875, -0.01617431640625, 0.040863037109375, 0.097900390625, 0.154937744140625, 0.21197509765625, 0.269012451171875, 0.3260498046875, 0.383087158203125, 0.44012451171875, 0.497161865234375, 0.55419921875, 0.611236572265625, 0.66827392578125, 0.725311279296875, 0.7823486328125, 0.839385986328125, 0.89642333984375, 0.953460693359375, 1.010498046875, 1.067535400390625, 1.12457275390625, 1.181610107421875, 1.2386474609375, 1.295684814453125, 1.35272216796875, 1.409759521484375, 1.466796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 8.0, 11.0, 13.0, 37.0, 46.0, 76.0, 89.0, 130.0, 151.0, 104.0, 97.0, 66.0, 57.0, 55.0, 24.0, 24.0, 7.0, 11.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30712890625, -0.29900360107421875, -0.2908782958984375, -0.28275299072265625, -0.274627685546875, -0.26650238037109375, -0.2583770751953125, -0.25025177001953125, -0.24212646484375, -0.23400115966796875, -0.2258758544921875, -0.21775054931640625, -0.209625244140625, -0.20149993896484375, -0.1933746337890625, -0.18524932861328125, -0.1771240234375, -0.16899871826171875, -0.1608734130859375, -0.15274810791015625, -0.144622802734375, -0.13649749755859375, -0.1283721923828125, -0.12024688720703125, -0.11212158203125, -0.10399627685546875, -0.0958709716796875, -0.08774566650390625, -0.079620361328125, -0.07149505615234375, -0.0633697509765625, -0.05524444580078125, -0.047119140625, -0.03899383544921875, -0.0308685302734375, -0.02274322509765625, -0.014617919921875, -0.00649261474609375, 0.0016326904296875, 0.00975799560546875, 0.01788330078125, 0.02600860595703125, 0.0341339111328125, 0.04225921630859375, 0.050384521484375, 0.05850982666015625, 0.0666351318359375, 0.07476043701171875, 0.0828857421875, 0.09101104736328125, 0.0991363525390625, 0.10726165771484375, 0.115386962890625, 0.12351226806640625, 0.1316375732421875, 0.13976287841796875, 0.14788818359375, 0.15601348876953125, 0.1641387939453125, 0.17226409912109375, 0.180389404296875, 0.18851470947265625, 0.1966400146484375, 0.20476531982421875, 0.212890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 15.0, 20.0, 18.0, 33.0, 51.0, 61.0, 133.0, 188.0, 313.0, 521.0, 1019.0, 2104.0, 4218.0, 9900.0, 23624.0, 64968.0, 186904.0, 381415.0, 236430.0, 84451.0, 29835.0, 11961.0, 5142.0, 2404.0, 1222.0, 673.0, 353.0, 191.0, 120.0, 79.0, 48.0, 29.0, 21.0, 21.0, 10.0, 9.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.806640625, -0.7833404541015625, -0.760040283203125, -0.7367401123046875, -0.71343994140625, -0.6901397705078125, -0.666839599609375, -0.6435394287109375, -0.6202392578125, -0.5969390869140625, -0.573638916015625, -0.5503387451171875, -0.52703857421875, -0.5037384033203125, -0.480438232421875, -0.4571380615234375, -0.433837890625, -0.4105377197265625, -0.387237548828125, -0.3639373779296875, -0.34063720703125, -0.3173370361328125, -0.294036865234375, -0.2707366943359375, -0.2474365234375, -0.2241363525390625, -0.200836181640625, -0.1775360107421875, -0.15423583984375, -0.1309356689453125, -0.107635498046875, -0.0843353271484375, -0.06103515625, -0.0377349853515625, -0.014434814453125, 0.0088653564453125, 0.03216552734375, 0.0554656982421875, 0.078765869140625, 0.1020660400390625, 0.1253662109375, 0.1486663818359375, 0.171966552734375, 0.1952667236328125, 0.21856689453125, 0.2418670654296875, 0.265167236328125, 0.2884674072265625, 0.311767578125, 0.3350677490234375, 0.358367919921875, 0.3816680908203125, 0.40496826171875, 0.4282684326171875, 0.451568603515625, 0.4748687744140625, 0.4981689453125, 0.5214691162109375, 0.544769287109375, 0.5680694580078125, 0.59136962890625, 0.6146697998046875, 0.637969970703125, 0.6612701416015625, 0.6845703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 6.0, 7.0, 17.0, 13.0, 11.0, 24.0, 15.0, 19.0, 22.0, 22.0, 27.0, 29.0, 35.0, 40.0, 32.0, 44.0, 48.0, 50.0, 48.0, 41.0, 50.0, 52.0, 35.0, 40.0, 32.0, 33.0, 28.0, 19.0, 26.0, 22.0, 24.0, 16.0, 15.0, 18.0, 9.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.49658203125, -0.4825859069824219, -0.46858978271484375, -0.4545936584472656, -0.4405975341796875, -0.4266014099121094, -0.41260528564453125, -0.3986091613769531, -0.384613037109375, -0.3706169128417969, -0.35662078857421875, -0.3426246643066406, -0.3286285400390625, -0.3146324157714844, -0.30063629150390625, -0.2866401672363281, -0.27264404296875, -0.2586479187011719, -0.24465179443359375, -0.23065567016601562, -0.2166595458984375, -0.20266342163085938, -0.18866729736328125, -0.17467117309570312, -0.160675048828125, -0.14667892456054688, -0.13268280029296875, -0.11868667602539062, -0.1046905517578125, -0.09069442749023438, -0.07669830322265625, -0.06270217895507812, -0.0487060546875, -0.034709930419921875, -0.02071380615234375, -0.006717681884765625, 0.0072784423828125, 0.021274566650390625, 0.03527069091796875, 0.049266815185546875, 0.063262939453125, 0.07725906372070312, 0.09125518798828125, 0.10525131225585938, 0.1192474365234375, 0.13324356079101562, 0.14723968505859375, 0.16123580932617188, 0.17523193359375, 0.18922805786132812, 0.20322418212890625, 0.21722030639648438, 0.2312164306640625, 0.24521255493164062, 0.25920867919921875, 0.2732048034667969, 0.287200927734375, 0.3011970520019531, 0.31519317626953125, 0.3291893005371094, 0.3431854248046875, 0.3571815490722656, 0.37117767333984375, 0.3851737976074219, 0.399169921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 18.0, 22.0, 43.0, 83.0, 144.0, 276.0, 658.0, 1681.0, 6500.0, 41663.0, 430350.0, 504416.0, 51962.0, 7510.0, 1914.0, 696.0, 288.0, 141.0, 76.0, 37.0, 27.0, 13.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.48894500732421875, -0.4686126708984375, -0.44828033447265625, -0.427947998046875, -0.40761566162109375, -0.3872833251953125, -0.36695098876953125, -0.34661865234375, -0.32628631591796875, -0.3059539794921875, -0.28562164306640625, -0.265289306640625, -0.24495697021484375, -0.2246246337890625, -0.20429229736328125, -0.1839599609375, -0.16362762451171875, -0.1432952880859375, -0.12296295166015625, -0.102630615234375, -0.08229827880859375, -0.0619659423828125, -0.04163360595703125, -0.02130126953125, -0.00096893310546875, 0.0193634033203125, 0.03969573974609375, 0.060028076171875, 0.08036041259765625, 0.1006927490234375, 0.12102508544921875, 0.141357421875, 0.16168975830078125, 0.1820220947265625, 0.20235443115234375, 0.222686767578125, 0.24301910400390625, 0.2633514404296875, 0.28368377685546875, 0.30401611328125, 0.32434844970703125, 0.3446807861328125, 0.36501312255859375, 0.385345458984375, 0.40567779541015625, 0.4260101318359375, 0.44634246826171875, 0.4666748046875, 0.48700714111328125, 0.5073394775390625, 0.5276718139648438, 0.548004150390625, 0.5683364868164062, 0.5886688232421875, 0.6090011596679688, 0.62933349609375, 0.6496658325195312, 0.6699981689453125, 0.6903305053710938, 0.710662841796875, 0.7309951782226562, 0.7513275146484375, 0.7716598510742188, 0.7919921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 8.0, 19.0, 20.0, 20.0, 22.0, 29.0, 41.0, 80.0, 70.0, 105.0, 113.0, 100.0, 73.0, 62.0, 54.0, 38.0, 36.0, 25.0, 22.0, 19.0, 15.0, 4.0, 8.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.605552673339844e-05, -7.332488894462585e-05, -7.059425115585327e-05, -6.786361336708069e-05, -6.51329755783081e-05, -6.240233778953552e-05, -5.967170000076294e-05, -5.6941062211990356e-05, -5.4210424423217773e-05, -5.147978663444519e-05, -4.874914884567261e-05, -4.6018511056900024e-05, -4.328787326812744e-05, -4.055723547935486e-05, -3.7826597690582275e-05, -3.509595990180969e-05, -3.236532211303711e-05, -2.9634684324264526e-05, -2.6904046535491943e-05, -2.417340874671936e-05, -2.1442770957946777e-05, -1.8712133169174194e-05, -1.598149538040161e-05, -1.3250857591629028e-05, -1.0520219802856445e-05, -7.789582014083862e-06, -5.058944225311279e-06, -2.3283064365386963e-06, 4.023313522338867e-07, 3.1329691410064697e-06, 5.863606929779053e-06, 8.594244718551636e-06, 1.1324882507324219e-05, 1.4055520296096802e-05, 1.6786158084869385e-05, 1.9516795873641968e-05, 2.224743366241455e-05, 2.4978071451187134e-05, 2.7708709239959717e-05, 3.04393470287323e-05, 3.316998481750488e-05, 3.5900622606277466e-05, 3.863126039505005e-05, 4.136189818382263e-05, 4.4092535972595215e-05, 4.68231737613678e-05, 4.955381155014038e-05, 5.2284449338912964e-05, 5.501508712768555e-05, 5.774572491645813e-05, 6.047636270523071e-05, 6.32070004940033e-05, 6.593763828277588e-05, 6.866827607154846e-05, 7.139891386032104e-05, 7.412955164909363e-05, 7.686018943786621e-05, 7.95908272266388e-05, 8.232146501541138e-05, 8.505210280418396e-05, 8.778274059295654e-05, 9.051337838172913e-05, 9.324401617050171e-05, 9.597465395927429e-05, 9.870529174804688e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 9.0, 8.0, 16.0, 19.0, 29.0, 62.0, 93.0, 122.0, 262.0, 562.0, 1264.0, 4153.0, 17191.0, 100632.0, 510616.0, 343812.0, 54692.0, 10291.0, 2732.0, 1002.0, 418.0, 222.0, 131.0, 66.0, 48.0, 36.0, 19.0, 8.0, 14.0, 7.0, 4.0, 6.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.459716796875, -0.4443092346191406, -0.42890167236328125, -0.4134941101074219, -0.3980865478515625, -0.3826789855957031, -0.36727142333984375, -0.3518638610839844, -0.336456298828125, -0.3210487365722656, -0.30564117431640625, -0.2902336120605469, -0.2748260498046875, -0.2594184875488281, -0.24401092529296875, -0.22860336303710938, -0.21319580078125, -0.19778823852539062, -0.18238067626953125, -0.16697311401367188, -0.1515655517578125, -0.13615798950195312, -0.12075042724609375, -0.10534286499023438, -0.089935302734375, -0.07452774047851562, -0.05912017822265625, -0.043712615966796875, -0.0283050537109375, -0.012897491455078125, 0.00251007080078125, 0.017917633056640625, 0.0333251953125, 0.048732757568359375, 0.06414031982421875, 0.07954788208007812, 0.0949554443359375, 0.11036300659179688, 0.12577056884765625, 0.14117813110351562, 0.156585693359375, 0.17199325561523438, 0.18740081787109375, 0.20280838012695312, 0.2182159423828125, 0.23362350463867188, 0.24903106689453125, 0.2644386291503906, 0.27984619140625, 0.2952537536621094, 0.31066131591796875, 0.3260688781738281, 0.3414764404296875, 0.3568840026855469, 0.37229156494140625, 0.3876991271972656, 0.403106689453125, 0.4185142517089844, 0.43392181396484375, 0.4493293762207031, 0.4647369384765625, 0.4801445007324219, 0.49555206298828125, 0.5109596252441406, 0.5263671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 2.0, 13.0, 12.0, 21.0, 26.0, 33.0, 28.0, 46.0, 60.0, 46.0, 51.0, 57.0, 71.0, 66.0, 72.0, 61.0, 54.0, 41.0, 37.0, 37.0, 32.0, 23.0, 21.0, 19.0, 10.0, 13.0, 6.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.28564453125, -0.2768096923828125, -0.267974853515625, -0.2591400146484375, -0.25030517578125, -0.2414703369140625, -0.232635498046875, -0.2238006591796875, -0.2149658203125, -0.2061309814453125, -0.197296142578125, -0.1884613037109375, -0.17962646484375, -0.1707916259765625, -0.161956787109375, -0.1531219482421875, -0.144287109375, -0.1354522705078125, -0.126617431640625, -0.1177825927734375, -0.10894775390625, -0.1001129150390625, -0.091278076171875, -0.0824432373046875, -0.0736083984375, -0.0647735595703125, -0.055938720703125, -0.0471038818359375, -0.03826904296875, -0.0294342041015625, -0.020599365234375, -0.0117645263671875, -0.0029296875, 0.0059051513671875, 0.014739990234375, 0.0235748291015625, 0.03240966796875, 0.0412445068359375, 0.050079345703125, 0.0589141845703125, 0.0677490234375, 0.0765838623046875, 0.085418701171875, 0.0942535400390625, 0.10308837890625, 0.1119232177734375, 0.120758056640625, 0.1295928955078125, 0.138427734375, 0.1472625732421875, 0.156097412109375, 0.1649322509765625, 0.17376708984375, 0.1826019287109375, 0.191436767578125, 0.2002716064453125, 0.2091064453125, 0.2179412841796875, 0.226776123046875, 0.2356109619140625, 0.24444580078125, 0.2532806396484375, 0.262115478515625, 0.2709503173828125, 0.27978515625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 17.0, 25.0, 57.0, 124.0, 189.0, 227.0, 175.0, 99.0, 40.0, 25.0, 6.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.865457534790039, -4.528101444244385, -4.190745830535889, -3.8533897399902344, -3.516033887863159, -3.178678035736084, -2.8413219451904297, -2.5039660930633545, -2.1666102409362793, -1.829254388809204, -1.4918984174728394, -1.1545424461364746, -0.8171865940093994, -0.4798307418823242, -0.14247465133666992, 0.19488120079040527, 0.5322370529174805, 0.8695929646492004, 1.2069488763809204, 1.5443048477172852, 1.8816606998443604, 2.2190165519714355, 2.55637264251709, 2.893728494644165, 3.2310843467712402, 3.5684401988983154, 3.9057960510253906, 4.243152141571045, 4.580508232116699, 4.917863845825195, 5.25521993637085, 5.592576026916504, 5.929931640625, 6.267287731170654, 6.60464334487915, 6.941999435424805, 7.279355049133301, 7.616711139678955, 7.954067230224609, 8.291422843933105, 8.628778457641602, 8.966134071350098, 9.30349063873291, 9.640846252441406, 9.978201866149902, 10.315557479858398, 10.652914047241211, 10.990269660949707, 11.32762622833252, 11.664981842041016, 12.002338409423828, 12.339694023132324, 12.67704963684082, 13.014406204223633, 13.351761817932129, 13.689117431640625, 14.026473999023438, 14.363829612731934, 14.701186180114746, 15.038541793823242, 15.375897407531738, 15.713253021240234, 16.050609588623047, 16.38796615600586, 16.72532081604004]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 7.0, 7.0, 9.0, 8.0, 7.0, 10.0, 11.0, 20.0, 20.0, 22.0, 28.0, 24.0, 38.0, 29.0, 32.0, 41.0, 35.0, 37.0, 50.0, 48.0, 48.0, 49.0, 52.0, 51.0, 36.0, 40.0, 35.0, 37.0, 27.0, 31.0, 21.0, 15.0, 18.0, 13.0, 7.0, 7.0, 8.0, 6.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-3.21193528175354, -3.127472162246704, -3.043008804321289, -2.958545684814453, -2.874082565307617, -2.7896194458007812, -2.705156087875366, -2.6206929683685303, -2.5362296104431152, -2.4517664909362793, -2.3673031330108643, -2.2828400135040283, -2.1983768939971924, -2.1139135360717773, -2.0294504165649414, -1.9449872970581055, -1.8605241775512695, -1.776060938835144, -1.691597819328308, -1.6071345806121826, -1.5226714611053467, -1.4382082223892212, -1.3537449836730957, -1.2692818641662598, -1.1848186254501343, -1.1003553867340088, -1.0158922672271729, -0.9314290285110474, -0.8469658493995667, -0.7625026702880859, -0.6780394315719604, -0.5935762524604797, -0.5091128349304199, -0.4246496558189392, -0.3401864469051361, -0.255723237991333, -0.1712600588798523, -0.08679687976837158, -0.0023336410522460938, 0.08212953805923462, 0.16659271717071533, 0.25105589628219604, 0.33551910519599915, 0.41998231410980225, 0.504445493221283, 0.5889086723327637, 0.6733719110488892, 0.7578350901603699, 0.8422982692718506, 0.9267614483833313, 1.011224627494812, 1.0956878662109375, 1.1801509857177734, 1.264614224433899, 1.3490774631500244, 1.4335405826568604, 1.5180038213729858, 1.6024670600891113, 1.6869301795959473, 1.7713934183120728, 1.8558566570281982, 1.9403197765350342, 2.024783134460449, 2.109246253967285, 2.193709373474121]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 2.0, 5.0, 2.0, 6.0, 12.0, 4.0, 6.0, 12.0, 19.0, 17.0, 21.0, 36.0, 37.0, 32.0, 48.0, 65.0, 81.0, 146.0, 254.0, 474.0, 936.0, 2354.0, 6151.0, 22400.0, 218628.0, 3850551.0, 71246.0, 12887.0, 4210.0, 1655.0, 834.0, 467.0, 230.0, 158.0, 87.0, 70.0, 46.0, 32.0, 22.0, 16.0, 9.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9375, -1.87139892578125, -1.8052978515625, -1.73919677734375, -1.673095703125, -1.60699462890625, -1.5408935546875, -1.47479248046875, -1.40869140625, -1.34259033203125, -1.2764892578125, -1.21038818359375, -1.144287109375, -1.07818603515625, -1.0120849609375, -0.94598388671875, -0.8798828125, -0.81378173828125, -0.7476806640625, -0.68157958984375, -0.615478515625, -0.54937744140625, -0.4832763671875, -0.41717529296875, -0.35107421875, -0.28497314453125, -0.2188720703125, -0.15277099609375, -0.086669921875, -0.02056884765625, 0.0455322265625, 0.11163330078125, 0.177734375, 0.24383544921875, 0.3099365234375, 0.37603759765625, 0.442138671875, 0.50823974609375, 0.5743408203125, 0.64044189453125, 0.70654296875, 0.77264404296875, 0.8387451171875, 0.90484619140625, 0.970947265625, 1.03704833984375, 1.1031494140625, 1.16925048828125, 1.2353515625, 1.30145263671875, 1.3675537109375, 1.43365478515625, 1.499755859375, 1.56585693359375, 1.6319580078125, 1.69805908203125, 1.76416015625, 1.83026123046875, 1.8963623046875, 1.96246337890625, 2.028564453125, 2.09466552734375, 2.1607666015625, 2.22686767578125, 2.29296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 12.0, 29.0, 33.0, 48.0, 72.0, 72.0, 119.0, 117.0, 125.0, 84.0, 83.0, 81.0, 44.0, 28.0, 20.0, 13.0, 5.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2983074188232422, -0.2902183532714844, -0.28212928771972656, -0.27404022216796875, -0.26595115661621094, -0.2578620910644531, -0.2497730255126953, -0.2416839599609375, -0.2335948944091797, -0.22550582885742188, -0.21741676330566406, -0.20932769775390625, -0.20123863220214844, -0.19314956665039062, -0.1850605010986328, -0.176971435546875, -0.1688823699951172, -0.16079330444335938, -0.15270423889160156, -0.14461517333984375, -0.13652610778808594, -0.12843704223632812, -0.12034797668457031, -0.1122589111328125, -0.10416984558105469, -0.09608078002929688, -0.08799171447753906, -0.07990264892578125, -0.07181358337402344, -0.06372451782226562, -0.05563545227050781, -0.04754638671875, -0.03945732116699219, -0.031368255615234375, -0.023279190063476562, -0.01519012451171875, -0.0071010589599609375, 0.000988006591796875, 0.009077072143554688, 0.0171661376953125, 0.025255203247070312, 0.033344268798828125, 0.04143333435058594, 0.04952239990234375, 0.05761146545410156, 0.06570053100585938, 0.07378959655761719, 0.081878662109375, 0.08996772766113281, 0.09805679321289062, 0.10614585876464844, 0.11423492431640625, 0.12232398986816406, 0.13041305541992188, 0.1385021209716797, 0.1465911865234375, 0.1546802520751953, 0.16276931762695312, 0.17085838317871094, 0.17894744873046875, 0.18703651428222656, 0.19512557983398438, 0.2032146453857422, 0.2113037109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 8.0, 15.0, 22.0, 10.0, 25.0, 31.0, 51.0, 69.0, 114.0, 266.0, 555.0, 1365.0, 3801.0, 15211.0, 105357.0, 3735810.0, 295057.0, 27225.0, 5940.0, 1843.0, 722.0, 346.0, 181.0, 82.0, 56.0, 42.0, 24.0, 18.0, 7.0, 8.0, 6.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8935546875, -1.835601806640625, -1.77764892578125, -1.719696044921875, -1.6617431640625, -1.603790283203125, -1.54583740234375, -1.487884521484375, -1.429931640625, -1.371978759765625, -1.31402587890625, -1.256072998046875, -1.1981201171875, -1.140167236328125, -1.08221435546875, -1.024261474609375, -0.96630859375, -0.908355712890625, -0.85040283203125, -0.792449951171875, -0.7344970703125, -0.676544189453125, -0.61859130859375, -0.560638427734375, -0.502685546875, -0.444732666015625, -0.38677978515625, -0.328826904296875, -0.2708740234375, -0.212921142578125, -0.15496826171875, -0.097015380859375, -0.0390625, 0.018890380859375, 0.07684326171875, 0.134796142578125, 0.1927490234375, 0.250701904296875, 0.30865478515625, 0.366607666015625, 0.424560546875, 0.482513427734375, 0.54046630859375, 0.598419189453125, 0.6563720703125, 0.714324951171875, 0.77227783203125, 0.830230712890625, 0.88818359375, 0.946136474609375, 1.00408935546875, 1.062042236328125, 1.1199951171875, 1.177947998046875, 1.23590087890625, 1.293853759765625, 1.351806640625, 1.409759521484375, 1.46771240234375, 1.525665283203125, 1.5836181640625, 1.641571044921875, 1.69952392578125, 1.757476806640625, 1.8154296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 11.0, 11.0, 21.0, 27.0, 38.0, 51.0, 119.0, 245.0, 670.0, 1874.0, 520.0, 196.0, 110.0, 61.0, 40.0, 26.0, 20.0, 13.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5330352783203125, -0.512847900390625, -0.4926605224609375, -0.47247314453125, -0.4522857666015625, -0.432098388671875, -0.4119110107421875, -0.3917236328125, -0.3715362548828125, -0.351348876953125, -0.3311614990234375, -0.31097412109375, -0.2907867431640625, -0.270599365234375, -0.2504119873046875, -0.230224609375, -0.2100372314453125, -0.189849853515625, -0.1696624755859375, -0.14947509765625, -0.1292877197265625, -0.109100341796875, -0.0889129638671875, -0.0687255859375, -0.0485382080078125, -0.028350830078125, -0.0081634521484375, 0.01202392578125, 0.0322113037109375, 0.052398681640625, 0.0725860595703125, 0.0927734375, 0.1129608154296875, 0.133148193359375, 0.1533355712890625, 0.17352294921875, 0.1937103271484375, 0.213897705078125, 0.2340850830078125, 0.2542724609375, 0.2744598388671875, 0.294647216796875, 0.3148345947265625, 0.33502197265625, 0.3552093505859375, 0.375396728515625, 0.3955841064453125, 0.415771484375, 0.4359588623046875, 0.456146240234375, 0.4763336181640625, 0.49652099609375, 0.5167083740234375, 0.536895751953125, 0.5570831298828125, 0.5772705078125, 0.5974578857421875, 0.617645263671875, 0.6378326416015625, 0.65802001953125, 0.6782073974609375, 0.698394775390625, 0.7185821533203125, 0.73876953125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 12.0, 24.0, 130.0, 322.0, 332.0, 125.0, 47.0, 7.0, 7.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.870895385742188, -15.582854270935059, -15.29481315612793, -15.0067720413208, -14.718730926513672, -14.43069076538086, -14.142648696899414, -13.854608535766602, -13.566567420959473, -13.278526306152344, -12.990485191345215, -12.702444076538086, -12.414402961730957, -12.126361846923828, -11.838321685791016, -11.550280570983887, -11.262239456176758, -10.974198341369629, -10.6861572265625, -10.398116111755371, -10.110074996948242, -9.82203483581543, -9.533992767333984, -9.245952606201172, -8.957910537719727, -8.669869422912598, -8.381828308105469, -8.09378719329834, -7.805746555328369, -7.51770544052124, -7.229664325714111, -6.941623687744141, -6.6535820960998535, -6.365540981292725, -6.077499866485596, -5.789459228515625, -5.501418113708496, -5.213376998901367, -4.925335884094238, -4.637294769287109, -4.3492536544799805, -4.061212539672852, -3.7731716632843018, -3.485130548477173, -3.197089672088623, -2.909048557281494, -2.6210074424743652, -2.3329665660858154, -2.0449256896972656, -1.7568846940994263, -1.468843698501587, -1.180802583694458, -0.8927615880966187, -0.6047205924987793, -0.3166794776916504, -0.028638601303100586, 0.2594025135040283, 0.5474435091018677, 0.8354845643043518, 1.123525619506836, 1.4115666151046753, 1.6996076107025146, 1.9876487255096436, 2.2756896018981934, 2.5637307167053223]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 8.0, 3.0, 6.0, 4.0, 11.0, 11.0, 19.0, 16.0, 30.0, 22.0, 27.0, 27.0, 28.0, 35.0, 42.0, 26.0, 46.0, 51.0, 55.0, 53.0, 40.0, 59.0, 45.0, 39.0, 34.0, 38.0, 32.0, 20.0, 36.0, 23.0, 17.0, 20.0, 14.0, 10.0, 15.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3890295028686523, -1.3394087553024292, -1.2897881269454956, -1.2401673793792725, -1.1905467510223389, -1.1409260034561157, -1.0913052558898926, -1.041684627532959, -0.9920638799667358, -0.9424431920051575, -0.8928225040435791, -0.843201756477356, -0.7935810685157776, -0.7439603805541992, -0.6943396329879761, -0.6447189450263977, -0.5950982570648193, -0.545477569103241, -0.4958568513393402, -0.44623613357543945, -0.3966154456138611, -0.3469947576522827, -0.29737403988838196, -0.2477533221244812, -0.19813263416290283, -0.14851193130016327, -0.0988912284374237, -0.04927052557468414, 0.0003501772880554199, 0.04997088015079498, 0.09959158301353455, 0.1492123007774353, 0.19883298873901367, 0.24845369160175323, 0.2980743944644928, 0.34769511222839355, 0.3973158001899719, 0.4469364881515503, 0.49655720591545105, 0.5461779236793518, 0.5957986116409302, 0.6454192996025085, 0.6950399875640869, 0.7446607351303101, 0.7942814230918884, 0.8439021110534668, 0.8935228586196899, 0.9431435465812683, 0.9927642345428467, 1.0423849821090698, 1.0920056104660034, 1.1416263580322266, 1.1912469863891602, 1.2408677339553833, 1.2904884815216064, 1.34010910987854, 1.3897298574447632, 1.4393506050109863, 1.48897123336792, 1.538591980934143, 1.5882127285003662, 1.6378333568572998, 1.687454104423523, 1.737074851989746, 1.7866954803466797]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 5.0, 4.0, 8.0, 10.0, 12.0, 26.0, 29.0, 64.0, 91.0, 180.0, 434.0, 988.0, 3101.0, 16685.0, 199791.0, 755842.0, 60576.0, 7602.0, 1860.0, 617.0, 254.0, 144.0, 83.0, 47.0, 30.0, 24.0, 19.0, 7.0, 6.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.59918212890625, -2.5186767578125, -2.43817138671875, -2.357666015625, -2.27716064453125, -2.1966552734375, -2.11614990234375, -2.03564453125, -1.95513916015625, -1.8746337890625, -1.79412841796875, -1.713623046875, -1.63311767578125, -1.5526123046875, -1.47210693359375, -1.3916015625, -1.31109619140625, -1.2305908203125, -1.15008544921875, -1.069580078125, -0.98907470703125, -0.9085693359375, -0.82806396484375, -0.74755859375, -0.66705322265625, -0.5865478515625, -0.50604248046875, -0.425537109375, -0.34503173828125, -0.2645263671875, -0.18402099609375, -0.103515625, -0.02301025390625, 0.0574951171875, 0.13800048828125, 0.218505859375, 0.29901123046875, 0.3795166015625, 0.46002197265625, 0.54052734375, 0.62103271484375, 0.7015380859375, 0.78204345703125, 0.862548828125, 0.94305419921875, 1.0235595703125, 1.10406494140625, 1.1845703125, 1.26507568359375, 1.3455810546875, 1.42608642578125, 1.506591796875, 1.58709716796875, 1.6676025390625, 1.74810791015625, 1.82861328125, 1.90911865234375, 1.9896240234375, 2.07012939453125, 2.150634765625, 2.23114013671875, 2.3116455078125, 2.39215087890625, 2.47265625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 4.0, 4.0, 19.0, 23.0, 33.0, 50.0, 45.0, 64.0, 76.0, 83.0, 87.0, 100.0, 82.0, 83.0, 77.0, 48.0, 35.0, 27.0, 30.0, 13.0, 12.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.299560546875, -0.2916698455810547, -0.2837791442871094, -0.27588844299316406, -0.26799774169921875, -0.26010704040527344, -0.2522163391113281, -0.2443256378173828, -0.2364349365234375, -0.2285442352294922, -0.22065353393554688, -0.21276283264160156, -0.20487213134765625, -0.19698143005371094, -0.18909072875976562, -0.1812000274658203, -0.173309326171875, -0.1654186248779297, -0.15752792358398438, -0.14963722229003906, -0.14174652099609375, -0.13385581970214844, -0.12596511840820312, -0.11807441711425781, -0.1101837158203125, -0.10229301452636719, -0.09440231323242188, -0.08651161193847656, -0.07862091064453125, -0.07073020935058594, -0.06283950805664062, -0.05494880676269531, -0.04705810546875, -0.03916740417480469, -0.031276702880859375, -0.023386001586914062, -0.01549530029296875, -0.0076045989990234375, 0.000286102294921875, 0.008176803588867188, 0.0160675048828125, 0.023958206176757812, 0.031848907470703125, 0.03973960876464844, 0.04763031005859375, 0.05552101135253906, 0.06341171264648438, 0.07130241394042969, 0.079193115234375, 0.08708381652832031, 0.09497451782226562, 0.10286521911621094, 0.11075592041015625, 0.11864662170410156, 0.12653732299804688, 0.1344280242919922, 0.1423187255859375, 0.1502094268798828, 0.15810012817382812, 0.16599082946777344, 0.17388153076171875, 0.18177223205566406, 0.18966293334960938, 0.1975536346435547, 0.2054443359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 14.0, 17.0, 21.0, 34.0, 61.0, 84.0, 119.0, 182.0, 322.0, 628.0, 1235.0, 2497.0, 5326.0, 13298.0, 38029.0, 131987.0, 443875.0, 291279.0, 78405.0, 24096.0, 9118.0, 3841.0, 1871.0, 923.0, 492.0, 267.0, 167.0, 91.0, 95.0, 47.0, 25.0, 23.0, 13.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8916015625, -0.8626480102539062, -0.8336944580078125, -0.8047409057617188, -0.775787353515625, -0.7468338012695312, -0.7178802490234375, -0.6889266967773438, -0.65997314453125, -0.6310195922851562, -0.6020660400390625, -0.5731124877929688, -0.544158935546875, -0.5152053833007812, -0.4862518310546875, -0.45729827880859375, -0.4283447265625, -0.39939117431640625, -0.3704376220703125, -0.34148406982421875, -0.312530517578125, -0.28357696533203125, -0.2546234130859375, -0.22566986083984375, -0.19671630859375, -0.16776275634765625, -0.1388092041015625, -0.10985565185546875, -0.080902099609375, -0.05194854736328125, -0.0229949951171875, 0.00595855712890625, 0.034912109375, 0.06386566162109375, 0.0928192138671875, 0.12177276611328125, 0.150726318359375, 0.17967987060546875, 0.2086334228515625, 0.23758697509765625, 0.26654052734375, 0.29549407958984375, 0.3244476318359375, 0.35340118408203125, 0.382354736328125, 0.41130828857421875, 0.4402618408203125, 0.46921539306640625, 0.4981689453125, 0.5271224975585938, 0.5560760498046875, 0.5850296020507812, 0.613983154296875, 0.6429367065429688, 0.6718902587890625, 0.7008438110351562, 0.72979736328125, 0.7587509155273438, 0.7877044677734375, 0.8166580200195312, 0.845611572265625, 0.8745651245117188, 0.9035186767578125, 0.9324722290039062, 0.96142578125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 7.0, 10.0, 8.0, 18.0, 23.0, 21.0, 27.0, 28.0, 35.0, 33.0, 30.0, 46.0, 46.0, 43.0, 47.0, 42.0, 38.0, 39.0, 42.0, 47.0, 45.0, 38.0, 31.0, 32.0, 42.0, 18.0, 24.0, 22.0, 17.0, 19.0, 17.0, 4.0, 6.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.59716796875, -0.5787887573242188, -0.5604095458984375, -0.5420303344726562, -0.523651123046875, -0.5052719116210938, -0.4868927001953125, -0.46851348876953125, -0.45013427734375, -0.43175506591796875, -0.4133758544921875, -0.39499664306640625, -0.376617431640625, -0.35823822021484375, -0.3398590087890625, -0.32147979736328125, -0.3031005859375, -0.28472137451171875, -0.2663421630859375, -0.24796295166015625, -0.229583740234375, -0.21120452880859375, -0.1928253173828125, -0.17444610595703125, -0.15606689453125, -0.13768768310546875, -0.1193084716796875, -0.10092926025390625, -0.082550048828125, -0.06417083740234375, -0.0457916259765625, -0.02741241455078125, -0.009033203125, 0.00934600830078125, 0.0277252197265625, 0.04610443115234375, 0.064483642578125, 0.08286285400390625, 0.1012420654296875, 0.11962127685546875, 0.13800048828125, 0.15637969970703125, 0.1747589111328125, 0.19313812255859375, 0.211517333984375, 0.22989654541015625, 0.2482757568359375, 0.26665496826171875, 0.2850341796875, 0.30341339111328125, 0.3217926025390625, 0.34017181396484375, 0.358551025390625, 0.37693023681640625, 0.3953094482421875, 0.41368865966796875, 0.43206787109375, 0.45044708251953125, 0.4688262939453125, 0.48720550537109375, 0.505584716796875, 0.5239639282226562, 0.5423431396484375, 0.5607223510742188, 0.5791015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 6.0, 13.0, 18.0, 28.0, 61.0, 81.0, 136.0, 218.0, 432.0, 1287.0, 5239.0, 33991.0, 735043.0, 252017.0, 15387.0, 2918.0, 857.0, 319.0, 182.0, 93.0, 71.0, 51.0, 37.0, 21.0, 12.0, 8.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.966796875, -0.9332427978515625, -0.899688720703125, -0.8661346435546875, -0.83258056640625, -0.7990264892578125, -0.765472412109375, -0.7319183349609375, -0.6983642578125, -0.6648101806640625, -0.631256103515625, -0.5977020263671875, -0.56414794921875, -0.5305938720703125, -0.497039794921875, -0.4634857177734375, -0.429931640625, -0.3963775634765625, -0.362823486328125, -0.3292694091796875, -0.29571533203125, -0.2621612548828125, -0.228607177734375, -0.1950531005859375, -0.1614990234375, -0.1279449462890625, -0.094390869140625, -0.0608367919921875, -0.02728271484375, 0.0062713623046875, 0.039825439453125, 0.0733795166015625, 0.10693359375, 0.1404876708984375, 0.174041748046875, 0.2075958251953125, 0.24114990234375, 0.2747039794921875, 0.308258056640625, 0.3418121337890625, 0.3753662109375, 0.4089202880859375, 0.442474365234375, 0.4760284423828125, 0.50958251953125, 0.5431365966796875, 0.576690673828125, 0.6102447509765625, 0.643798828125, 0.6773529052734375, 0.710906982421875, 0.7444610595703125, 0.77801513671875, 0.8115692138671875, 0.845123291015625, 0.8786773681640625, 0.9122314453125, 0.9457855224609375, 0.979339599609375, 1.0128936767578125, 1.04644775390625, 1.0800018310546875, 1.113555908203125, 1.1471099853515625, 1.1806640625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 7.0, 9.0, 9.0, 8.0, 9.0, 34.0, 62.0, 78.0, 100.0, 158.0, 144.0, 127.0, 91.0, 45.0, 34.0, 29.0, 17.0, 4.0, 9.0, 10.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001342296600341797, -0.00013001449406147003, -0.00012579932808876038, -0.00012158416211605072, -0.00011736899614334106, -0.00011315383017063141, -0.00010893866419792175, -0.0001047234982252121, -0.00010050833225250244, -9.629316627979279e-05, -9.207800030708313e-05, -8.786283433437347e-05, -8.364766836166382e-05, -7.943250238895416e-05, -7.521733641624451e-05, -7.100217044353485e-05, -6.67870044708252e-05, -6.257183849811554e-05, -5.8356672525405884e-05, -5.414150655269623e-05, -4.992634057998657e-05, -4.5711174607276917e-05, -4.149600863456726e-05, -3.7280842661857605e-05, -3.306567668914795e-05, -2.8850510716438293e-05, -2.4635344743728638e-05, -2.0420178771018982e-05, -1.6205012798309326e-05, -1.198984682559967e-05, -7.774680852890015e-06, -3.559514880180359e-06, 6.556510925292969e-07, 4.870817065238953e-06, 9.085983037948608e-06, 1.3301149010658264e-05, 1.751631498336792e-05, 2.1731480956077576e-05, 2.594664692878723e-05, 3.0161812901496887e-05, 3.437697887420654e-05, 3.85921448469162e-05, 4.2807310819625854e-05, 4.702247679233551e-05, 5.1237642765045166e-05, 5.545280873775482e-05, 5.966797471046448e-05, 6.388314068317413e-05, 6.809830665588379e-05, 7.231347262859344e-05, 7.65286386013031e-05, 8.074380457401276e-05, 8.495897054672241e-05, 8.917413651943207e-05, 9.338930249214172e-05, 9.760446846485138e-05, 0.00010181963443756104, 0.00010603480041027069, 0.00011024996638298035, 0.00011446513235569, 0.00011868029832839966, 0.00012289546430110931, 0.00012711063027381897, 0.00013132579624652863, 0.00013554096221923828]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 13.0, 18.0, 32.0, 49.0, 79.0, 152.0, 258.0, 816.0, 9416.0, 906999.0, 126899.0, 2865.0, 487.0, 202.0, 93.0, 73.0, 39.0, 32.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.150390625, -2.088592529296875, -2.02679443359375, -1.964996337890625, -1.9031982421875, -1.841400146484375, -1.77960205078125, -1.717803955078125, -1.656005859375, -1.594207763671875, -1.53240966796875, -1.470611572265625, -1.4088134765625, -1.347015380859375, -1.28521728515625, -1.223419189453125, -1.16162109375, -1.099822998046875, -1.03802490234375, -0.976226806640625, -0.9144287109375, -0.852630615234375, -0.79083251953125, -0.729034423828125, -0.667236328125, -0.605438232421875, -0.54364013671875, -0.481842041015625, -0.4200439453125, -0.358245849609375, -0.29644775390625, -0.234649658203125, -0.1728515625, -0.111053466796875, -0.04925537109375, 0.012542724609375, 0.0743408203125, 0.136138916015625, 0.19793701171875, 0.259735107421875, 0.321533203125, 0.383331298828125, 0.44512939453125, 0.506927490234375, 0.5687255859375, 0.630523681640625, 0.69232177734375, 0.754119873046875, 0.81591796875, 0.877716064453125, 0.93951416015625, 1.001312255859375, 1.0631103515625, 1.124908447265625, 1.18670654296875, 1.248504638671875, 1.310302734375, 1.372100830078125, 1.43389892578125, 1.495697021484375, 1.5574951171875, 1.619293212890625, 1.68109130859375, 1.742889404296875, 1.8046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 11.0, 11.0, 22.0, 35.0, 59.0, 113.0, 164.0, 190.0, 152.0, 100.0, 56.0, 24.0, 21.0, 17.0, 7.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9990234375, -0.9722747802734375, -0.945526123046875, -0.9187774658203125, -0.89202880859375, -0.8652801513671875, -0.838531494140625, -0.8117828369140625, -0.7850341796875, -0.7582855224609375, -0.731536865234375, -0.7047882080078125, -0.67803955078125, -0.6512908935546875, -0.624542236328125, -0.5977935791015625, -0.571044921875, -0.5442962646484375, -0.517547607421875, -0.4907989501953125, -0.46405029296875, -0.4373016357421875, -0.410552978515625, -0.3838043212890625, -0.3570556640625, -0.3303070068359375, -0.303558349609375, -0.2768096923828125, -0.25006103515625, -0.2233123779296875, -0.196563720703125, -0.1698150634765625, -0.14306640625, -0.1163177490234375, -0.089569091796875, -0.0628204345703125, -0.03607177734375, -0.0093231201171875, 0.017425537109375, 0.0441741943359375, 0.0709228515625, 0.0976715087890625, 0.124420166015625, 0.1511688232421875, 0.17791748046875, 0.2046661376953125, 0.231414794921875, 0.2581634521484375, 0.284912109375, 0.3116607666015625, 0.338409423828125, 0.3651580810546875, 0.39190673828125, 0.4186553955078125, 0.445404052734375, 0.4721527099609375, 0.4989013671875, 0.5256500244140625, 0.552398681640625, 0.5791473388671875, 0.60589599609375, 0.6326446533203125, 0.659393310546875, 0.6861419677734375, 0.712890625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 22.0, 42.0, 120.0, 276.0, 315.0, 149.0, 45.0, 28.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.204580307006836, -25.635066986083984, -25.065555572509766, -24.496042251586914, -23.926528930664062, -23.357017517089844, -22.787504196166992, -22.217992782592773, -21.648479461669922, -21.07896614074707, -20.50945472717285, -19.93994140625, -19.37042999267578, -18.80091667175293, -18.231403350830078, -17.66189193725586, -17.092378616333008, -16.522865295410156, -15.953353881835938, -15.383840560913086, -14.81432819366455, -14.244815826416016, -13.675302505493164, -13.105790138244629, -12.536277770996094, -11.966765403747559, -11.397253036499023, -10.827739715576172, -10.258227348327637, -9.688714981079102, -9.11920166015625, -8.549689292907715, -7.980177879333496, -7.410665512084961, -6.841152667999268, -6.271639823913574, -5.702127456665039, -5.132615089416504, -4.5631022453308105, -3.9935896396636963, -3.424077033996582, -2.8545644283294678, -2.2850518226623535, -1.7155392169952393, -1.146026611328125, -0.5765140056610107, -0.007001399993896484, 0.5625112056732178, 1.132023811340332, 1.7015364170074463, 2.2710490226745605, 2.840561628341675, 3.410074234008789, 3.9795868396759033, 4.549099445343018, 5.118612289428711, 5.688124656677246, 6.257637023925781, 6.827149868011475, 7.396662712097168, 7.966175079345703, 8.535687446594238, 9.105199813842773, 9.674713134765625, 10.24422550201416]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 14.0, 9.0, 17.0, 14.0, 23.0, 19.0, 13.0, 25.0, 20.0, 26.0, 25.0, 40.0, 35.0, 37.0, 35.0, 46.0, 37.0, 52.0, 46.0, 37.0, 41.0, 40.0, 25.0, 30.0, 28.0, 35.0, 30.0, 26.0, 19.0, 22.0, 21.0, 17.0, 18.0, 12.0, 13.0, 9.0, 15.0, 5.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.975113868713379, -2.883923292160034, -2.7927327156066895, -2.7015419006347656, -2.610351324081421, -2.519160747528076, -2.4279701709747314, -2.3367795944213867, -2.245588779449463, -2.154398202896118, -2.0632076263427734, -1.9720169305801392, -1.8808262348175049, -1.7896356582641602, -1.6984450817108154, -1.6072543859481812, -1.5160638093948364, -1.4248732328414917, -1.3336825370788574, -1.2424919605255127, -1.1513012647628784, -1.0601106882095337, -0.9689200520515442, -0.8777294158935547, -0.7865387797355652, -0.6953481435775757, -0.6041575074195862, -0.5129668712615967, -0.42177626490592957, -0.33058562874794006, -0.23939502239227295, -0.14820438623428345, -0.057013750076293945, 0.03417687863111496, 0.12536750733852386, 0.21655812859535217, 0.3077487647533417, 0.3989394009113312, 0.4901300072669983, 0.5813206434249878, 0.6725112795829773, 0.7637019157409668, 0.8548925518989563, 0.9460831880569458, 1.0372737646102905, 1.1284644603729248, 1.2196550369262695, 1.3108456134796143, 1.4020363092422485, 1.4932268857955933, 1.5844175815582275, 1.6756081581115723, 1.7667988538742065, 1.8579894304275513, 1.9491801261901855, 2.0403707027435303, 2.131561279296875, 2.2227518558502197, 2.3139424324035645, 2.4051332473754883, 2.496323823928833, 2.5875144004821777, 2.6787049770355225, 2.769895553588867, 2.861086368560791]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 14.0, 8.0, 21.0, 11.0, 15.0, 31.0, 38.0, 55.0, 89.0, 140.0, 305.0, 710.0, 2496.0, 12883.0, 180267.0, 3948841.0, 40174.0, 5546.0, 1480.0, 595.0, 283.0, 142.0, 64.0, 30.0, 20.0, 9.0, 4.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.930877685546875, -1.84417724609375, -1.757476806640625, -1.6707763671875, -1.584075927734375, -1.49737548828125, -1.410675048828125, -1.323974609375, -1.237274169921875, -1.15057373046875, -1.063873291015625, -0.9771728515625, -0.890472412109375, -0.80377197265625, -0.717071533203125, -0.63037109375, -0.543670654296875, -0.45697021484375, -0.370269775390625, -0.2835693359375, -0.196868896484375, -0.11016845703125, -0.023468017578125, 0.063232421875, 0.149932861328125, 0.23663330078125, 0.323333740234375, 0.4100341796875, 0.496734619140625, 0.58343505859375, 0.670135498046875, 0.7568359375, 0.843536376953125, 0.93023681640625, 1.016937255859375, 1.1036376953125, 1.190338134765625, 1.27703857421875, 1.363739013671875, 1.450439453125, 1.537139892578125, 1.62384033203125, 1.710540771484375, 1.7972412109375, 1.883941650390625, 1.97064208984375, 2.057342529296875, 2.14404296875, 2.230743408203125, 2.31744384765625, 2.404144287109375, 2.4908447265625, 2.577545166015625, 2.66424560546875, 2.750946044921875, 2.837646484375, 2.924346923828125, 3.01104736328125, 3.097747802734375, 3.1844482421875, 3.271148681640625, 3.35784912109375, 3.444549560546875, 3.53125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 11.0, 8.0, 23.0, 25.0, 37.0, 54.0, 44.0, 78.0, 77.0, 77.0, 95.0, 69.0, 85.0, 71.0, 61.0, 45.0, 41.0, 30.0, 21.0, 22.0, 10.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.303955078125, -0.2960948944091797, -0.2882347106933594, -0.28037452697753906, -0.27251434326171875, -0.26465415954589844, -0.2567939758300781, -0.2489337921142578, -0.2410736083984375, -0.2332134246826172, -0.22535324096679688, -0.21749305725097656, -0.20963287353515625, -0.20177268981933594, -0.19391250610351562, -0.1860523223876953, -0.178192138671875, -0.1703319549560547, -0.16247177124023438, -0.15461158752441406, -0.14675140380859375, -0.13889122009277344, -0.13103103637695312, -0.12317085266113281, -0.1153106689453125, -0.10745048522949219, -0.09959030151367188, -0.09173011779785156, -0.08386993408203125, -0.07600975036621094, -0.06814956665039062, -0.06028938293457031, -0.05242919921875, -0.04456901550292969, -0.036708831787109375, -0.028848648071289062, -0.02098846435546875, -0.013128280639648438, -0.005268096923828125, 0.0025920867919921875, 0.0104522705078125, 0.018312454223632812, 0.026172637939453125, 0.03403282165527344, 0.04189300537109375, 0.04975318908691406, 0.057613372802734375, 0.06547355651855469, 0.073333740234375, 0.08119392395019531, 0.08905410766601562, 0.09691429138183594, 0.10477447509765625, 0.11263465881347656, 0.12049484252929688, 0.1283550262451172, 0.1362152099609375, 0.1440753936767578, 0.15193557739257812, 0.15979576110839844, 0.16765594482421875, 0.17551612854003906, 0.18337631225585938, 0.1912364959716797, 0.1990966796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 7.0, 8.0, 19.0, 22.0, 24.0, 37.0, 67.0, 136.0, 185.0, 354.0, 586.0, 1530.0, 6057.0, 66047.0, 4064033.0, 47192.0, 5155.0, 1394.0, 601.0, 301.0, 206.0, 101.0, 77.0, 37.0, 27.0, 22.0, 23.0, 15.0, 6.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9921875, -2.86981201171875, -2.7474365234375, -2.62506103515625, -2.502685546875, -2.38031005859375, -2.2579345703125, -2.13555908203125, -2.01318359375, -1.89080810546875, -1.7684326171875, -1.64605712890625, -1.523681640625, -1.40130615234375, -1.2789306640625, -1.15655517578125, -1.0341796875, -0.91180419921875, -0.7894287109375, -0.66705322265625, -0.544677734375, -0.42230224609375, -0.2999267578125, -0.17755126953125, -0.05517578125, 0.06719970703125, 0.1895751953125, 0.31195068359375, 0.434326171875, 0.55670166015625, 0.6790771484375, 0.80145263671875, 0.923828125, 1.04620361328125, 1.1685791015625, 1.29095458984375, 1.413330078125, 1.53570556640625, 1.6580810546875, 1.78045654296875, 1.90283203125, 2.02520751953125, 2.1475830078125, 2.26995849609375, 2.392333984375, 2.51470947265625, 2.6370849609375, 2.75946044921875, 2.8818359375, 3.00421142578125, 3.1265869140625, 3.24896240234375, 3.371337890625, 3.49371337890625, 3.6160888671875, 3.73846435546875, 3.86083984375, 3.98321533203125, 4.1055908203125, 4.22796630859375, 4.350341796875, 4.47271728515625, 4.5950927734375, 4.71746826171875, 4.83984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 17.0, 19.0, 45.0, 135.0, 515.0, 2798.0, 349.0, 101.0, 36.0, 19.0, 16.0, 10.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6344451904296875, -0.597991943359375, -0.5615386962890625, -0.52508544921875, -0.4886322021484375, -0.452178955078125, -0.4157257080078125, -0.3792724609375, -0.3428192138671875, -0.306365966796875, -0.2699127197265625, -0.23345947265625, -0.1970062255859375, -0.160552978515625, -0.1240997314453125, -0.087646484375, -0.0511932373046875, -0.014739990234375, 0.0217132568359375, 0.05816650390625, 0.0946197509765625, 0.131072998046875, 0.1675262451171875, 0.2039794921875, 0.2404327392578125, 0.276885986328125, 0.3133392333984375, 0.34979248046875, 0.3862457275390625, 0.422698974609375, 0.4591522216796875, 0.49560546875, 0.5320587158203125, 0.568511962890625, 0.6049652099609375, 0.64141845703125, 0.6778717041015625, 0.714324951171875, 0.7507781982421875, 0.7872314453125, 0.8236846923828125, 0.860137939453125, 0.8965911865234375, 0.93304443359375, 0.9694976806640625, 1.005950927734375, 1.0424041748046875, 1.078857421875, 1.1153106689453125, 1.151763916015625, 1.1882171630859375, 1.22467041015625, 1.2611236572265625, 1.297576904296875, 1.3340301513671875, 1.3704833984375, 1.4069366455078125, 1.443389892578125, 1.4798431396484375, 1.51629638671875, 1.5527496337890625, 1.589202880859375, 1.6256561279296875, 1.662109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 7.0, 9.0, 26.0, 64.0, 158.0, 261.0, 246.0, 141.0, 48.0, 22.0, 8.0, 5.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.11191463470459, -8.899765968322754, -8.687617301940918, -8.475468635559082, -8.263320922851562, -8.051172256469727, -7.839023590087891, -7.626874923706055, -7.414726257324219, -7.202577590942383, -6.990428924560547, -6.778280735015869, -6.566132068634033, -6.353983402252197, -6.1418352127075195, -5.929686546325684, -5.717537879943848, -5.505389213562012, -5.293240547180176, -5.081092357635498, -4.868943691253662, -4.656795024871826, -4.444646835327148, -4.2324981689453125, -4.020349502563477, -3.8082008361816406, -3.596052408218384, -3.383903980255127, -3.171755313873291, -2.959606647491455, -2.7474582195281982, -2.5353097915649414, -2.3231611251831055, -2.1110124588012695, -1.8988640308380127, -1.6867154836654663, -1.47456693649292, -1.2624183893203735, -1.0502698421478271, -0.8381212949752808, -0.6259727478027344, -0.413824200630188, -0.2016756534576416, 0.010472893714904785, 0.22262144088745117, 0.43476998805999756, 0.646918535232544, 0.8590670824050903, 1.0712156295776367, 1.283364176750183, 1.4955127239227295, 1.7076612710952759, 1.9198098182678223, 2.131958484649658, 2.344106912612915, 2.556255340576172, 2.768404006958008, 2.9805526733398438, 3.1927011013031006, 3.4048495292663574, 3.6169981956481934, 3.8291468620300293, 4.041295051574707, 4.253443717956543, 4.465592384338379]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 14.0, 14.0, 23.0, 35.0, 53.0, 67.0, 84.0, 100.0, 111.0, 103.0, 107.0, 94.0, 73.0, 40.0, 26.0, 18.0, 11.0, 15.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.850165367126465, -4.724785327911377, -4.599405288696289, -4.474025249481201, -4.348645210266113, -4.223265647888184, -4.0978851318359375, -3.9725053310394287, -3.84712553024292, -3.721745491027832, -3.596365451812744, -3.4709854125976562, -3.3456056118011475, -3.2202255725860596, -3.0948455333709717, -2.969465494155884, -2.844085454940796, -2.718705415725708, -2.59332537651062, -2.4679455757141113, -2.3425655364990234, -2.2171854972839355, -2.0918054580688477, -1.9664254188537598, -1.8410454988479614, -1.7156654596328735, -1.5902855396270752, -1.4649055004119873, -1.3395254611968994, -1.214145541191101, -1.0887655019760132, -0.9633855223655701, -0.8380053043365479, -0.7126253247261047, -0.5872453451156616, -0.46186530590057373, -0.3364853262901306, -0.2111053466796875, -0.08572530746459961, 0.039654672145843506, 0.16503465175628662, 0.29041463136672974, 0.41579464077949524, 0.5411746501922607, 0.6665546298027039, 0.791934609413147, 0.9173146486282349, 1.0426945686340332, 1.168074607849121, 1.293454647064209, 1.4188345670700073, 1.5442146062850952, 1.6695945262908936, 1.7949745655059814, 1.9203546047210693, 2.0457346439361572, 2.171114444732666, 2.296494483947754, 2.421874523162842, 2.5472545623779297, 2.6726343631744385, 2.7980144023895264, 2.9233944416046143, 3.048774480819702, 3.17415452003479]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 7.0, 13.0, 15.0, 19.0, 25.0, 46.0, 62.0, 124.0, 208.0, 420.0, 984.0, 3071.0, 14694.0, 166355.0, 762207.0, 86849.0, 9548.0, 2348.0, 778.0, 346.0, 157.0, 87.0, 63.0, 40.0, 25.0, 18.0, 16.0, 11.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.033203125, -2.947479248046875, -2.86175537109375, -2.776031494140625, -2.6903076171875, -2.604583740234375, -2.51885986328125, -2.433135986328125, -2.347412109375, -2.261688232421875, -2.17596435546875, -2.090240478515625, -2.0045166015625, -1.918792724609375, -1.83306884765625, -1.747344970703125, -1.66162109375, -1.575897216796875, -1.49017333984375, -1.404449462890625, -1.3187255859375, -1.233001708984375, -1.14727783203125, -1.061553955078125, -0.975830078125, -0.890106201171875, -0.80438232421875, -0.718658447265625, -0.6329345703125, -0.547210693359375, -0.46148681640625, -0.375762939453125, -0.2900390625, -0.204315185546875, -0.11859130859375, -0.032867431640625, 0.0528564453125, 0.138580322265625, 0.22430419921875, 0.310028076171875, 0.395751953125, 0.481475830078125, 0.56719970703125, 0.652923583984375, 0.7386474609375, 0.824371337890625, 0.91009521484375, 0.995819091796875, 1.08154296875, 1.167266845703125, 1.25299072265625, 1.338714599609375, 1.4244384765625, 1.510162353515625, 1.59588623046875, 1.681610107421875, 1.767333984375, 1.853057861328125, 1.93878173828125, 2.024505615234375, 2.1102294921875, 2.195953369140625, 2.28167724609375, 2.367401123046875, 2.453125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 15.0, 12.0, 19.0, 23.0, 30.0, 60.0, 53.0, 83.0, 67.0, 88.0, 86.0, 73.0, 87.0, 68.0, 61.0, 40.0, 46.0, 30.0, 23.0, 15.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.382568359375, -0.3726539611816406, -0.36273956298828125, -0.3528251647949219, -0.3429107666015625, -0.3329963684082031, -0.32308197021484375, -0.3131675720214844, -0.303253173828125, -0.2933387756347656, -0.28342437744140625, -0.2735099792480469, -0.2635955810546875, -0.2536811828613281, -0.24376678466796875, -0.23385238647460938, -0.22393798828125, -0.21402359008789062, -0.20410919189453125, -0.19419479370117188, -0.1842803955078125, -0.17436599731445312, -0.16445159912109375, -0.15453720092773438, -0.144622802734375, -0.13470840454101562, -0.12479400634765625, -0.11487960815429688, -0.1049652099609375, -0.09505081176757812, -0.08513641357421875, -0.07522201538085938, -0.0653076171875, -0.055393218994140625, -0.04547882080078125, -0.035564422607421875, -0.0256500244140625, -0.015735626220703125, -0.00582122802734375, 0.004093170166015625, 0.014007568359375, 0.023921966552734375, 0.03383636474609375, 0.043750762939453125, 0.0536651611328125, 0.06357955932617188, 0.07349395751953125, 0.08340835571289062, 0.09332275390625, 0.10323715209960938, 0.11315155029296875, 0.12306594848632812, 0.1329803466796875, 0.14289474487304688, 0.15280914306640625, 0.16272354125976562, 0.172637939453125, 0.18255233764648438, 0.19246673583984375, 0.20238113403320312, 0.2122955322265625, 0.22220993041992188, 0.23212432861328125, 0.24203872680664062, 0.251953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 12.0, 13.0, 30.0, 35.0, 67.0, 92.0, 189.0, 383.0, 1014.0, 2782.0, 9084.0, 34981.0, 173434.0, 571225.0, 200864.0, 39348.0, 9979.0, 3099.0, 1033.0, 410.0, 221.0, 114.0, 49.0, 25.0, 20.0, 18.0, 6.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4116973876953125, -1.368316650390625, -1.3249359130859375, -1.28155517578125, -1.2381744384765625, -1.194793701171875, -1.1514129638671875, -1.1080322265625, -1.0646514892578125, -1.021270751953125, -0.9778900146484375, -0.93450927734375, -0.8911285400390625, -0.847747802734375, -0.8043670654296875, -0.760986328125, -0.7176055908203125, -0.674224853515625, -0.6308441162109375, -0.58746337890625, -0.5440826416015625, -0.500701904296875, -0.4573211669921875, -0.4139404296875, -0.3705596923828125, -0.327178955078125, -0.2837982177734375, -0.24041748046875, -0.1970367431640625, -0.153656005859375, -0.1102752685546875, -0.06689453125, -0.0235137939453125, 0.019866943359375, 0.0632476806640625, 0.10662841796875, 0.1500091552734375, 0.193389892578125, 0.2367706298828125, 0.2801513671875, 0.3235321044921875, 0.366912841796875, 0.4102935791015625, 0.45367431640625, 0.4970550537109375, 0.540435791015625, 0.5838165283203125, 0.627197265625, 0.6705780029296875, 0.713958740234375, 0.7573394775390625, 0.80072021484375, 0.8441009521484375, 0.887481689453125, 0.9308624267578125, 0.9742431640625, 1.0176239013671875, 1.061004638671875, 1.1043853759765625, 1.14776611328125, 1.1911468505859375, 1.234527587890625, 1.2779083251953125, 1.3212890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 10.0, 12.0, 18.0, 14.0, 12.0, 21.0, 17.0, 30.0, 26.0, 39.0, 44.0, 36.0, 44.0, 45.0, 40.0, 45.0, 51.0, 36.0, 46.0, 36.0, 28.0, 30.0, 35.0, 28.0, 27.0, 30.0, 24.0, 15.0, 18.0, 23.0, 14.0, 6.0, 11.0, 12.0, 6.0, 6.0, 5.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0], "bins": [-0.76171875, -0.7396316528320312, -0.7175445556640625, -0.6954574584960938, -0.673370361328125, -0.6512832641601562, -0.6291961669921875, -0.6071090698242188, -0.58502197265625, -0.5629348754882812, -0.5408477783203125, -0.5187606811523438, -0.496673583984375, -0.47458648681640625, -0.4524993896484375, -0.43041229248046875, -0.4083251953125, -0.38623809814453125, -0.3641510009765625, -0.34206390380859375, -0.319976806640625, -0.29788970947265625, -0.2758026123046875, -0.25371551513671875, -0.23162841796875, -0.20954132080078125, -0.1874542236328125, -0.16536712646484375, -0.143280029296875, -0.12119293212890625, -0.0991058349609375, -0.07701873779296875, -0.054931640625, -0.03284454345703125, -0.0107574462890625, 0.01132965087890625, 0.033416748046875, 0.05550384521484375, 0.0775909423828125, 0.09967803955078125, 0.12176513671875, 0.14385223388671875, 0.1659393310546875, 0.18802642822265625, 0.210113525390625, 0.23220062255859375, 0.2542877197265625, 0.27637481689453125, 0.2984619140625, 0.32054901123046875, 0.3426361083984375, 0.36472320556640625, 0.386810302734375, 0.40889739990234375, 0.4309844970703125, 0.45307159423828125, 0.47515869140625, 0.49724578857421875, 0.5193328857421875, 0.5414199829101562, 0.563507080078125, 0.5855941772460938, 0.6076812744140625, 0.6297683715820312, 0.65185546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 8.0, 3.0, 10.0, 18.0, 18.0, 21.0, 56.0, 82.0, 112.0, 216.0, 413.0, 852.0, 2164.0, 6427.0, 28299.0, 204575.0, 632986.0, 142223.0, 21325.0, 5288.0, 1758.0, 779.0, 388.0, 206.0, 116.0, 68.0, 51.0, 21.0, 19.0, 19.0, 12.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5703125, -0.5487213134765625, -0.527130126953125, -0.5055389404296875, -0.48394775390625, -0.4623565673828125, -0.440765380859375, -0.4191741943359375, -0.3975830078125, -0.3759918212890625, -0.354400634765625, -0.3328094482421875, -0.31121826171875, -0.2896270751953125, -0.268035888671875, -0.2464447021484375, -0.224853515625, -0.2032623291015625, -0.181671142578125, -0.1600799560546875, -0.13848876953125, -0.1168975830078125, -0.095306396484375, -0.0737152099609375, -0.0521240234375, -0.0305328369140625, -0.008941650390625, 0.0126495361328125, 0.03424072265625, 0.0558319091796875, 0.077423095703125, 0.0990142822265625, 0.12060546875, 0.1421966552734375, 0.163787841796875, 0.1853790283203125, 0.20697021484375, 0.2285614013671875, 0.250152587890625, 0.2717437744140625, 0.2933349609375, 0.3149261474609375, 0.336517333984375, 0.3581085205078125, 0.37969970703125, 0.4012908935546875, 0.422882080078125, 0.4444732666015625, 0.466064453125, 0.4876556396484375, 0.509246826171875, 0.5308380126953125, 0.55242919921875, 0.5740203857421875, 0.595611572265625, 0.6172027587890625, 0.6387939453125, 0.6603851318359375, 0.681976318359375, 0.7035675048828125, 0.72515869140625, 0.7467498779296875, 0.768341064453125, 0.7899322509765625, 0.8115234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 3.0, 3.0, 5.0, 10.0, 10.0, 15.0, 32.0, 48.0, 106.0, 161.0, 201.0, 161.0, 110.0, 46.0, 33.0, 22.0, 15.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025963783264160156, -0.00025290995836257935, -0.00024618208408355713, -0.0002394542098045349, -0.0002327263355255127, -0.00022599846124649048, -0.00021927058696746826, -0.00021254271268844604, -0.00020581483840942383, -0.0001990869641304016, -0.0001923590898513794, -0.00018563121557235718, -0.00017890334129333496, -0.00017217546701431274, -0.00016544759273529053, -0.0001587197184562683, -0.0001519918441772461, -0.00014526396989822388, -0.00013853609561920166, -0.00013180822134017944, -0.00012508034706115723, -0.00011835247278213501, -0.00011162459850311279, -0.00010489672422409058, -9.816884994506836e-05, -9.144097566604614e-05, -8.471310138702393e-05, -7.798522710800171e-05, -7.125735282897949e-05, -6.452947854995728e-05, -5.780160427093506e-05, -5.107372999191284e-05, -4.4345855712890625e-05, -3.761798143386841e-05, -3.089010715484619e-05, -2.4162232875823975e-05, -1.7434358596801758e-05, -1.0706484317779541e-05, -3.978610038757324e-06, 2.7492642402648926e-06, 9.47713851928711e-06, 1.6205012798309326e-05, 2.2932887077331543e-05, 2.966076135635376e-05, 3.6388635635375977e-05, 4.311650991439819e-05, 4.984438419342041e-05, 5.657225847244263e-05, 6.330013275146484e-05, 7.002800703048706e-05, 7.675588130950928e-05, 8.34837555885315e-05, 9.021162986755371e-05, 9.693950414657593e-05, 0.00010366737842559814, 0.00011039525270462036, 0.00011712312698364258, 0.0001238510012626648, 0.000130578875541687, 0.00013730674982070923, 0.00014403462409973145, 0.00015076249837875366, 0.00015749037265777588, 0.0001642182469367981, 0.0001709461212158203]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 8.0, 8.0, 25.0, 36.0, 75.0, 180.0, 395.0, 1146.0, 3876.0, 26347.0, 548749.0, 441185.0, 21310.0, 3443.0, 1033.0, 406.0, 160.0, 67.0, 42.0, 28.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2021484375, -1.1704788208007812, -1.1388092041015625, -1.1071395874023438, -1.075469970703125, -1.0438003540039062, -1.0121307373046875, -0.9804611206054688, -0.94879150390625, -0.9171218872070312, -0.8854522705078125, -0.8537826538085938, -0.822113037109375, -0.7904434204101562, -0.7587738037109375, -0.7271041870117188, -0.6954345703125, -0.6637649536132812, -0.6320953369140625, -0.6004257202148438, -0.568756103515625, -0.5370864868164062, -0.5054168701171875, -0.47374725341796875, -0.44207763671875, -0.41040802001953125, -0.3787384033203125, -0.34706878662109375, -0.315399169921875, -0.28372955322265625, -0.2520599365234375, -0.22039031982421875, -0.188720703125, -0.15705108642578125, -0.1253814697265625, -0.09371185302734375, -0.062042236328125, -0.03037261962890625, 0.0012969970703125, 0.03296661376953125, 0.06463623046875, 0.09630584716796875, 0.1279754638671875, 0.15964508056640625, 0.191314697265625, 0.22298431396484375, 0.2546539306640625, 0.28632354736328125, 0.3179931640625, 0.34966278076171875, 0.3813323974609375, 0.41300201416015625, 0.444671630859375, 0.47634124755859375, 0.5080108642578125, 0.5396804809570312, 0.57135009765625, 0.6030197143554688, 0.6346893310546875, 0.6663589477539062, 0.698028564453125, 0.7296981811523438, 0.7613677978515625, 0.7930374145507812, 0.82470703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 1.0, 3.0, 10.0, 9.0, 30.0, 24.0, 31.0, 40.0, 49.0, 69.0, 75.0, 85.0, 110.0, 96.0, 92.0, 71.0, 54.0, 42.0, 26.0, 22.0, 21.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.5025253295898438, -0.4879608154296875, -0.47339630126953125, -0.458831787109375, -0.44426727294921875, -0.4297027587890625, -0.41513824462890625, -0.40057373046875, -0.38600921630859375, -0.3714447021484375, -0.35688018798828125, -0.342315673828125, -0.32775115966796875, -0.3131866455078125, -0.29862213134765625, -0.2840576171875, -0.26949310302734375, -0.2549285888671875, -0.24036407470703125, -0.225799560546875, -0.21123504638671875, -0.1966705322265625, -0.18210601806640625, -0.16754150390625, -0.15297698974609375, -0.1384124755859375, -0.12384796142578125, -0.109283447265625, -0.09471893310546875, -0.0801544189453125, -0.06558990478515625, -0.051025390625, -0.03646087646484375, -0.0218963623046875, -0.00733184814453125, 0.007232666015625, 0.02179718017578125, 0.0363616943359375, 0.05092620849609375, 0.06549072265625, 0.08005523681640625, 0.0946197509765625, 0.10918426513671875, 0.123748779296875, 0.13831329345703125, 0.1528778076171875, 0.16744232177734375, 0.1820068359375, 0.19657135009765625, 0.2111358642578125, 0.22570037841796875, 0.240264892578125, 0.25482940673828125, 0.2693939208984375, 0.28395843505859375, 0.29852294921875, 0.31308746337890625, 0.3276519775390625, 0.34221649169921875, 0.356781005859375, 0.37134552001953125, 0.3859100341796875, 0.40047454833984375, 0.4150390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 26.0, 188.0, 628.0, 156.0, 11.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.05990600585938, -70.73634338378906, -69.41277313232422, -68.0892105102539, -66.76564025878906, -65.44207763671875, -64.1185073852539, -62.794944763183594, -61.471378326416016, -60.14781188964844, -58.82424545288086, -57.50067901611328, -56.17711639404297, -54.85354995727539, -53.52998352050781, -52.206417083740234, -50.882850646972656, -49.55928421020508, -48.2357177734375, -46.91215133666992, -45.588584899902344, -44.26502227783203, -42.94145584106445, -41.617889404296875, -40.2943229675293, -38.97075653076172, -37.64719009399414, -36.32362365722656, -35.00006103515625, -33.67649459838867, -32.352928161621094, -31.029361724853516, -29.705791473388672, -28.382225036621094, -27.058658599853516, -25.73509407043457, -24.411527633666992, -23.087961196899414, -21.76439666748047, -20.44083023071289, -19.117263793945312, -17.793697357177734, -16.470130920410156, -15.146566390991211, -13.822999954223633, -12.499433517456055, -11.175868034362793, -9.852302551269531, -8.528736114501953, -7.205170154571533, -5.881604194641113, -4.558038234710693, -3.2344722747802734, -1.9109063148498535, -0.5873403549194336, 0.7362251281738281, 2.0597915649414062, 3.383357524871826, 4.706923484802246, 6.030489444732666, 7.354055404663086, 8.677621841430664, 10.001187324523926, 11.324752807617188, 12.648319244384766]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 7.0, 4.0, 6.0, 6.0, 12.0, 14.0, 11.0, 22.0, 17.0, 22.0, 17.0, 24.0, 39.0, 26.0, 37.0, 39.0, 47.0, 39.0, 38.0, 53.0, 47.0, 45.0, 50.0, 33.0, 37.0, 25.0, 37.0, 28.0, 21.0, 28.0, 35.0, 23.0, 15.0, 18.0, 14.0, 16.0, 13.0, 8.0, 7.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11401104927063, -2.999189853668213, -2.884368419647217, -2.7695472240448, -2.6547257900238037, -2.5399045944213867, -2.4250831604003906, -2.3102619647979736, -2.1954407691955566, -2.0806195735931396, -1.9657981395721436, -1.8509769439697266, -1.7361555099487305, -1.6213343143463135, -1.506512999534607, -1.3916916847229004, -1.2768702507019043, -1.1620489358901978, -1.0472276210784912, -0.9324063658714294, -0.8175850510597229, -0.7027637362480164, -0.5879424810409546, -0.47312116622924805, -0.3582998514175415, -0.24347855150699615, -0.1286572515964508, -0.01383596658706665, 0.10098534822463989, 0.21580666303634644, 0.3306279182434082, 0.44544923305511475, 0.5602707862854004, 0.6750921010971069, 0.7899134159088135, 0.9047346711158752, 1.0195560455322266, 1.1343772411346436, 1.24919855594635, 1.3640198707580566, 1.4788411855697632, 1.5936625003814697, 1.7084838151931763, 1.8233051300048828, 1.9381263256072998, 2.052947759628296, 2.167768955230713, 2.282590389251709, 2.397411584854126, 2.512232780456543, 2.627054214477539, 2.741875410079956, 2.856696844100952, 2.971518039703369, 3.0863394737243652, 3.2011606693267822, 3.315981864929199, 3.430803060531616, 3.5456244945526123, 3.6604456901550293, 3.7752671241760254, 3.8900883197784424, 4.004909515380859, 4.1197309494018555, 4.234552383422852]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 2.0, 11.0, 8.0, 14.0, 18.0, 15.0, 25.0, 46.0, 39.0, 56.0, 114.0, 157.0, 264.0, 480.0, 926.0, 2157.0, 6016.0, 25216.0, 436443.0, 3673174.0, 36403.0, 7587.0, 2590.0, 1075.0, 589.0, 283.0, 201.0, 105.0, 82.0, 40.0, 33.0, 28.0, 13.0, 18.0, 7.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.634765625, -3.53936767578125, -3.4439697265625, -3.34857177734375, -3.253173828125, -3.15777587890625, -3.0623779296875, -2.96697998046875, -2.87158203125, -2.77618408203125, -2.6807861328125, -2.58538818359375, -2.489990234375, -2.39459228515625, -2.2991943359375, -2.20379638671875, -2.1083984375, -2.01300048828125, -1.9176025390625, -1.82220458984375, -1.726806640625, -1.63140869140625, -1.5360107421875, -1.44061279296875, -1.34521484375, -1.24981689453125, -1.1544189453125, -1.05902099609375, -0.963623046875, -0.86822509765625, -0.7728271484375, -0.67742919921875, -0.58203125, -0.48663330078125, -0.3912353515625, -0.29583740234375, -0.200439453125, -0.10504150390625, -0.0096435546875, 0.08575439453125, 0.18115234375, 0.27655029296875, 0.3719482421875, 0.46734619140625, 0.562744140625, 0.65814208984375, 0.7535400390625, 0.84893798828125, 0.9443359375, 1.03973388671875, 1.1351318359375, 1.23052978515625, 1.325927734375, 1.42132568359375, 1.5167236328125, 1.61212158203125, 1.70751953125, 1.80291748046875, 1.8983154296875, 1.99371337890625, 2.089111328125, 2.18450927734375, 2.2799072265625, 2.37530517578125, 2.470703125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 17.0, 24.0, 27.0, 29.0, 46.0, 60.0, 68.0, 61.0, 69.0, 79.0, 69.0, 75.0, 62.0, 76.0, 55.0, 44.0, 32.0, 32.0, 24.0, 14.0, 12.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.37567138671875, -0.3658447265625, -0.35601806640625, -0.34619140625, -0.33636474609375, -0.3265380859375, -0.31671142578125, -0.306884765625, -0.29705810546875, -0.2872314453125, -0.27740478515625, -0.267578125, -0.25775146484375, -0.2479248046875, -0.23809814453125, -0.228271484375, -0.21844482421875, -0.2086181640625, -0.19879150390625, -0.18896484375, -0.17913818359375, -0.1693115234375, -0.15948486328125, -0.149658203125, -0.13983154296875, -0.1300048828125, -0.12017822265625, -0.1103515625, -0.10052490234375, -0.0906982421875, -0.08087158203125, -0.071044921875, -0.06121826171875, -0.0513916015625, -0.04156494140625, -0.03173828125, -0.02191162109375, -0.0120849609375, -0.00225830078125, 0.007568359375, 0.01739501953125, 0.0272216796875, 0.03704833984375, 0.046875, 0.05670166015625, 0.0665283203125, 0.07635498046875, 0.086181640625, 0.09600830078125, 0.1058349609375, 0.11566162109375, 0.12548828125, 0.13531494140625, 0.1451416015625, 0.15496826171875, 0.164794921875, 0.17462158203125, 0.1844482421875, 0.19427490234375, 0.2041015625, 0.21392822265625, 0.2237548828125, 0.23358154296875, 0.243408203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 8.0, 9.0, 12.0, 20.0, 27.0, 45.0, 46.0, 59.0, 85.0, 116.0, 160.0, 202.0, 348.0, 662.0, 1313.0, 3200.0, 11866.0, 81589.0, 3901253.0, 167107.0, 18093.0, 4446.0, 1614.0, 749.0, 387.0, 239.0, 182.0, 103.0, 92.0, 71.0, 50.0, 34.0, 22.0, 23.0, 14.0, 16.0, 3.0, 5.0, 1.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.27734375, -3.1878662109375, -3.098388671875, -3.0089111328125, -2.91943359375, -2.8299560546875, -2.740478515625, -2.6510009765625, -2.5615234375, -2.4720458984375, -2.382568359375, -2.2930908203125, -2.20361328125, -2.1141357421875, -2.024658203125, -1.9351806640625, -1.845703125, -1.7562255859375, -1.666748046875, -1.5772705078125, -1.48779296875, -1.3983154296875, -1.308837890625, -1.2193603515625, -1.1298828125, -1.0404052734375, -0.950927734375, -0.8614501953125, -0.77197265625, -0.6824951171875, -0.593017578125, -0.5035400390625, -0.4140625, -0.3245849609375, -0.235107421875, -0.1456298828125, -0.05615234375, 0.0333251953125, 0.122802734375, 0.2122802734375, 0.3017578125, 0.3912353515625, 0.480712890625, 0.5701904296875, 0.65966796875, 0.7491455078125, 0.838623046875, 0.9281005859375, 1.017578125, 1.1070556640625, 1.196533203125, 1.2860107421875, 1.37548828125, 1.4649658203125, 1.554443359375, 1.6439208984375, 1.7333984375, 1.8228759765625, 1.912353515625, 2.0018310546875, 2.09130859375, 2.1807861328125, 2.270263671875, 2.3597412109375, 2.44921875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 17.0, 31.0, 49.0, 140.0, 831.0, 2596.0, 209.0, 90.0, 36.0, 24.0, 15.0, 8.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.105743408203125, -1.06500244140625, -1.024261474609375, -0.9835205078125, -0.942779541015625, -0.90203857421875, -0.861297607421875, -0.820556640625, -0.779815673828125, -0.73907470703125, -0.698333740234375, -0.6575927734375, -0.616851806640625, -0.57611083984375, -0.535369873046875, -0.49462890625, -0.453887939453125, -0.41314697265625, -0.372406005859375, -0.3316650390625, -0.290924072265625, -0.25018310546875, -0.209442138671875, -0.168701171875, -0.127960205078125, -0.08721923828125, -0.046478271484375, -0.0057373046875, 0.035003662109375, 0.07574462890625, 0.116485595703125, 0.1572265625, 0.197967529296875, 0.23870849609375, 0.279449462890625, 0.3201904296875, 0.360931396484375, 0.40167236328125, 0.442413330078125, 0.483154296875, 0.523895263671875, 0.56463623046875, 0.605377197265625, 0.6461181640625, 0.686859130859375, 0.72760009765625, 0.768341064453125, 0.80908203125, 0.849822998046875, 0.89056396484375, 0.931304931640625, 0.9720458984375, 1.012786865234375, 1.05352783203125, 1.094268798828125, 1.135009765625, 1.175750732421875, 1.21649169921875, 1.257232666015625, 1.2979736328125, 1.338714599609375, 1.37945556640625, 1.420196533203125, 1.4609375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 9.0, 6.0, 35.0, 84.0, 164.0, 297.0, 231.0, 106.0, 38.0, 21.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.816176414489746, -9.580138206481934, -9.344099998474121, -9.108060836791992, -8.87202262878418, -8.635984420776367, -8.399946212768555, -8.163908004760742, -7.92786979675293, -7.691831588745117, -7.4557929039001465, -7.219754695892334, -6.9837164878845215, -6.747677803039551, -6.511639595031738, -6.275601387023926, -6.039562702178955, -5.803524494171143, -5.567485809326172, -5.331447601318359, -5.095409393310547, -4.859371185302734, -4.623332500457764, -4.387294292449951, -4.1512556076049805, -3.915217161178589, -3.6791789531707764, -3.4431405067443848, -3.2071022987365723, -2.9710638523101807, -2.735025405883789, -2.4989871978759766, -2.262948513031006, -2.0269100666046143, -1.7908718585968018, -1.5548334121704102, -1.318795084953308, -1.082756757736206, -0.8467183113098145, -0.6106799840927124, -0.37464165687561035, -0.1386032998561859, 0.09743505716323853, 0.33347344398498535, 0.5695117712020874, 0.8055500984191895, 1.041588544845581, 1.277626872062683, 1.5136651992797852, 1.7497035264968872, 1.9857418537139893, 2.221780300140381, 2.4578185081481934, 2.693856954574585, 2.9298954010009766, 3.165933609008789, 3.4019720554351807, 3.6380105018615723, 3.8740487098693848, 4.1100873947143555, 4.346125602722168, 4.5821638107299805, 4.818202018737793, 5.054240703582764, 5.290278911590576]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 6.0, 12.0, 10.0, 19.0, 46.0, 60.0, 56.0, 77.0, 97.0, 84.0, 86.0, 87.0, 86.0, 69.0, 58.0, 48.0, 26.0, 22.0, 18.0, 13.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.4029347896575928, -3.2981135845184326, -3.1932923793792725, -3.0884711742401123, -2.983649969100952, -2.878828763961792, -2.774007558822632, -2.6691863536834717, -2.5643651485443115, -2.4595439434051514, -2.354722738265991, -2.249901533126831, -2.145080327987671, -2.0402591228485107, -1.9354379177093506, -1.8306167125701904, -1.7257956266403198, -1.6209744215011597, -1.5161532163619995, -1.4113320112228394, -1.3065108060836792, -1.2016897201538086, -1.0968685150146484, -0.9920472502708435, -0.8872260451316833, -0.7824048399925232, -0.677583634853363, -0.5727624893188477, -0.4679412543773651, -0.36312007904052734, -0.2582988739013672, -0.15347766876220703, -0.048656463623046875, 0.056164734065532684, 0.16098593175411224, 0.2658071219921112, 0.37062832713127136, 0.47544950246810913, 0.5802707076072693, 0.6850919127464294, 0.7899131178855896, 0.8947343230247498, 0.9995555281639099, 1.1043766736984253, 1.2091978788375854, 1.3140190839767456, 1.4188402891159058, 1.523661494255066, 1.628482699394226, 1.7333039045333862, 1.8381251096725464, 1.9429463148117065, 2.047767400741577, 2.1525886058807373, 2.2574098110198975, 2.3622310161590576, 2.4670522212982178, 2.571873426437378, 2.676694631576538, 2.7815158367156982, 2.8863370418548584, 2.9911582469940186, 3.0959794521331787, 3.200800657272339, 3.305621862411499]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 8.0, 13.0, 10.0, 25.0, 31.0, 63.0, 51.0, 90.0, 135.0, 203.0, 310.0, 493.0, 968.0, 1877.0, 4108.0, 9721.0, 27333.0, 92556.0, 334862.0, 400888.0, 119885.0, 33660.0, 11614.0, 4798.0, 2086.0, 1137.0, 569.0, 349.0, 228.0, 142.0, 91.0, 69.0, 58.0, 21.0, 25.0, 13.0, 15.0, 13.0, 7.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.65234375, -1.6024169921875, -1.552490234375, -1.5025634765625, -1.45263671875, -1.4027099609375, -1.352783203125, -1.3028564453125, -1.2529296875, -1.2030029296875, -1.153076171875, -1.1031494140625, -1.05322265625, -1.0032958984375, -0.953369140625, -0.9034423828125, -0.853515625, -0.8035888671875, -0.753662109375, -0.7037353515625, -0.65380859375, -0.6038818359375, -0.553955078125, -0.5040283203125, -0.4541015625, -0.4041748046875, -0.354248046875, -0.3043212890625, -0.25439453125, -0.2044677734375, -0.154541015625, -0.1046142578125, -0.0546875, -0.0047607421875, 0.045166015625, 0.0950927734375, 0.14501953125, 0.1949462890625, 0.244873046875, 0.2947998046875, 0.3447265625, 0.3946533203125, 0.444580078125, 0.4945068359375, 0.54443359375, 0.5943603515625, 0.644287109375, 0.6942138671875, 0.744140625, 0.7940673828125, 0.843994140625, 0.8939208984375, 0.94384765625, 0.9937744140625, 1.043701171875, 1.0936279296875, 1.1435546875, 1.1934814453125, 1.243408203125, 1.2933349609375, 1.34326171875, 1.3931884765625, 1.443115234375, 1.4930419921875, 1.54296875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 9.0, 9.0, 20.0, 26.0, 18.0, 38.0, 46.0, 49.0, 54.0, 61.0, 75.0, 82.0, 94.0, 81.0, 70.0, 62.0, 52.0, 38.0, 28.0, 30.0, 27.0, 17.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44384765625, -0.43189239501953125, -0.4199371337890625, -0.40798187255859375, -0.396026611328125, -0.38407135009765625, -0.3721160888671875, -0.36016082763671875, -0.34820556640625, -0.33625030517578125, -0.3242950439453125, -0.31233978271484375, -0.300384521484375, -0.28842926025390625, -0.2764739990234375, -0.26451873779296875, -0.2525634765625, -0.24060821533203125, -0.2286529541015625, -0.21669769287109375, -0.204742431640625, -0.19278717041015625, -0.1808319091796875, -0.16887664794921875, -0.15692138671875, -0.14496612548828125, -0.1330108642578125, -0.12105560302734375, -0.109100341796875, -0.09714508056640625, -0.0851898193359375, -0.07323455810546875, -0.061279296875, -0.04932403564453125, -0.0373687744140625, -0.02541351318359375, -0.013458251953125, -0.00150299072265625, 0.0104522705078125, 0.02240753173828125, 0.03436279296875, 0.04631805419921875, 0.0582733154296875, 0.07022857666015625, 0.082183837890625, 0.09413909912109375, 0.1060943603515625, 0.11804962158203125, 0.1300048828125, 0.14196014404296875, 0.1539154052734375, 0.16587066650390625, 0.177825927734375, 0.18978118896484375, 0.2017364501953125, 0.21369171142578125, 0.22564697265625, 0.23760223388671875, 0.2495574951171875, 0.26151275634765625, 0.273468017578125, 0.28542327880859375, 0.2973785400390625, 0.30933380126953125, 0.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 10.0, 12.0, 25.0, 26.0, 30.0, 46.0, 58.0, 79.0, 118.0, 187.0, 278.0, 373.0, 608.0, 1089.0, 1731.0, 3423.0, 7123.0, 16398.0, 41049.0, 113093.0, 290814.0, 336069.0, 145252.0, 52198.0, 20162.0, 8644.0, 4121.0, 2164.0, 1199.0, 796.0, 425.0, 300.0, 196.0, 146.0, 88.0, 67.0, 45.0, 24.0, 18.0, 18.0, 13.0, 14.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.9765625, -0.9461593627929688, -0.9157562255859375, -0.8853530883789062, -0.854949951171875, -0.8245468139648438, -0.7941436767578125, -0.7637405395507812, -0.73333740234375, -0.7029342651367188, -0.6725311279296875, -0.6421279907226562, -0.611724853515625, -0.5813217163085938, -0.5509185791015625, -0.5205154418945312, -0.4901123046875, -0.45970916748046875, -0.4293060302734375, -0.39890289306640625, -0.368499755859375, -0.33809661865234375, -0.3076934814453125, -0.27729034423828125, -0.24688720703125, -0.21648406982421875, -0.1860809326171875, -0.15567779541015625, -0.125274658203125, -0.09487152099609375, -0.0644683837890625, -0.03406524658203125, -0.003662109375, 0.02674102783203125, 0.0571441650390625, 0.08754730224609375, 0.117950439453125, 0.14835357666015625, 0.1787567138671875, 0.20915985107421875, 0.23956298828125, 0.26996612548828125, 0.3003692626953125, 0.33077239990234375, 0.361175537109375, 0.39157867431640625, 0.4219818115234375, 0.45238494873046875, 0.4827880859375, 0.5131912231445312, 0.5435943603515625, 0.5739974975585938, 0.604400634765625, 0.6348037719726562, 0.6652069091796875, 0.6956100463867188, 0.72601318359375, 0.7564163208007812, 0.7868194580078125, 0.8172225952148438, 0.847625732421875, 0.8780288696289062, 0.9084320068359375, 0.9388351440429688, 0.96923828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 5.0, 9.0, 10.0, 12.0, 18.0, 17.0, 32.0, 20.0, 34.0, 37.0, 24.0, 37.0, 49.0, 38.0, 51.0, 44.0, 50.0, 46.0, 55.0, 62.0, 50.0, 35.0, 43.0, 40.0, 34.0, 28.0, 23.0, 15.0, 20.0, 14.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.208984375, -1.1733856201171875, -1.137786865234375, -1.1021881103515625, -1.06658935546875, -1.0309906005859375, -0.995391845703125, -0.9597930908203125, -0.9241943359375, -0.8885955810546875, -0.852996826171875, -0.8173980712890625, -0.78179931640625, -0.7462005615234375, -0.710601806640625, -0.6750030517578125, -0.639404296875, -0.6038055419921875, -0.568206787109375, -0.5326080322265625, -0.49700927734375, -0.4614105224609375, -0.425811767578125, -0.3902130126953125, -0.3546142578125, -0.3190155029296875, -0.283416748046875, -0.2478179931640625, -0.21221923828125, -0.1766204833984375, -0.141021728515625, -0.1054229736328125, -0.06982421875, -0.0342254638671875, 0.001373291015625, 0.0369720458984375, 0.07257080078125, 0.1081695556640625, 0.143768310546875, 0.1793670654296875, 0.2149658203125, 0.2505645751953125, 0.286163330078125, 0.3217620849609375, 0.35736083984375, 0.3929595947265625, 0.428558349609375, 0.4641571044921875, 0.499755859375, 0.5353546142578125, 0.570953369140625, 0.6065521240234375, 0.64215087890625, 0.6777496337890625, 0.713348388671875, 0.7489471435546875, 0.7845458984375, 0.8201446533203125, 0.855743408203125, 0.8913421630859375, 0.92694091796875, 0.9625396728515625, 0.998138427734375, 1.0337371826171875, 1.0693359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 5.0, 19.0, 29.0, 31.0, 61.0, 95.0, 171.0, 354.0, 809.0, 2305.0, 10504.0, 112622.0, 795024.0, 112131.0, 10501.0, 2337.0, 785.0, 345.0, 167.0, 104.0, 52.0, 34.0, 18.0, 12.0, 9.0, 6.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8585052490234375, -0.818572998046875, -0.7786407470703125, -0.73870849609375, -0.6987762451171875, -0.658843994140625, -0.6189117431640625, -0.5789794921875, -0.5390472412109375, -0.499114990234375, -0.4591827392578125, -0.41925048828125, -0.3793182373046875, -0.339385986328125, -0.2994537353515625, -0.259521484375, -0.2195892333984375, -0.179656982421875, -0.1397247314453125, -0.09979248046875, -0.0598602294921875, -0.019927978515625, 0.0200042724609375, 0.0599365234375, 0.0998687744140625, 0.139801025390625, 0.1797332763671875, 0.21966552734375, 0.2595977783203125, 0.299530029296875, 0.3394622802734375, 0.37939453125, 0.4193267822265625, 0.459259033203125, 0.4991912841796875, 0.53912353515625, 0.5790557861328125, 0.618988037109375, 0.6589202880859375, 0.6988525390625, 0.7387847900390625, 0.778717041015625, 0.8186492919921875, 0.85858154296875, 0.8985137939453125, 0.938446044921875, 0.9783782958984375, 1.018310546875, 1.0582427978515625, 1.098175048828125, 1.1381072998046875, 1.17803955078125, 1.2179718017578125, 1.257904052734375, 1.2978363037109375, 1.3377685546875, 1.3777008056640625, 1.417633056640625, 1.4575653076171875, 1.49749755859375, 1.5374298095703125, 1.577362060546875, 1.6172943115234375, 1.6572265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 1.0, 7.0, 4.0, 11.0, 13.0, 26.0, 35.0, 35.0, 48.0, 74.0, 77.0, 81.0, 100.0, 103.0, 80.0, 71.0, 54.0, 40.0, 32.0, 34.0, 19.0, 11.0, 13.0, 12.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011652708053588867, -0.00011247489601373672, -0.00010842271149158478, -0.00010437052696943283, -0.00010031834244728088, -9.626615792512894e-05, -9.221397340297699e-05, -8.816178888082504e-05, -8.41096043586731e-05, -8.005741983652115e-05, -7.60052353143692e-05, -7.195305079221725e-05, -6.790086627006531e-05, -6.384868174791336e-05, -5.9796497225761414e-05, -5.5744312703609467e-05, -5.169212818145752e-05, -4.763994365930557e-05, -4.3587759137153625e-05, -3.953557461500168e-05, -3.548339009284973e-05, -3.1431205570697784e-05, -2.7379021048545837e-05, -2.332683652639389e-05, -1.9274652004241943e-05, -1.5222467482089996e-05, -1.117028295993805e-05, -7.118098437786102e-06, -3.0659139156341553e-06, 9.862706065177917e-07, 5.038455128669739e-06, 9.090639650821686e-06, 1.3142824172973633e-05, 1.719500869512558e-05, 2.1247193217277527e-05, 2.5299377739429474e-05, 2.935156226158142e-05, 3.340374678373337e-05, 3.7455931305885315e-05, 4.150811582803726e-05, 4.556030035018921e-05, 4.9612484872341156e-05, 5.36646693944931e-05, 5.771685391664505e-05, 6.1769038438797e-05, 6.582122296094894e-05, 6.987340748310089e-05, 7.392559200525284e-05, 7.797777652740479e-05, 8.202996104955673e-05, 8.608214557170868e-05, 9.013433009386063e-05, 9.418651461601257e-05, 9.823869913816452e-05, 0.00010229088366031647, 0.00010634306818246841, 0.00011039525270462036, 0.00011444743722677231, 0.00011849962174892426, 0.0001225518062710762, 0.00012660399079322815, 0.0001306561753153801, 0.00013470835983753204, 0.000138760544359684, 0.00014281272888183594]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 8.0, 23.0, 25.0, 33.0, 58.0, 117.0, 192.0, 412.0, 836.0, 2035.0, 5752.0, 18874.0, 82765.0, 395586.0, 420713.0, 90853.0, 20282.0, 6018.0, 2170.0, 884.0, 418.0, 210.0, 117.0, 64.0, 38.0, 14.0, 14.0, 11.0, 11.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59375, -0.5709381103515625, -0.548126220703125, -0.5253143310546875, -0.50250244140625, -0.4796905517578125, -0.456878662109375, -0.4340667724609375, -0.4112548828125, -0.3884429931640625, -0.365631103515625, -0.3428192138671875, -0.32000732421875, -0.2971954345703125, -0.274383544921875, -0.2515716552734375, -0.228759765625, -0.2059478759765625, -0.183135986328125, -0.1603240966796875, -0.13751220703125, -0.1147003173828125, -0.091888427734375, -0.0690765380859375, -0.0462646484375, -0.0234527587890625, -0.000640869140625, 0.0221710205078125, 0.04498291015625, 0.0677947998046875, 0.090606689453125, 0.1134185791015625, 0.13623046875, 0.1590423583984375, 0.181854248046875, 0.2046661376953125, 0.22747802734375, 0.2502899169921875, 0.273101806640625, 0.2959136962890625, 0.3187255859375, 0.3415374755859375, 0.364349365234375, 0.3871612548828125, 0.40997314453125, 0.4327850341796875, 0.455596923828125, 0.4784088134765625, 0.501220703125, 0.5240325927734375, 0.546844482421875, 0.5696563720703125, 0.59246826171875, 0.6152801513671875, 0.638092041015625, 0.6609039306640625, 0.6837158203125, 0.7065277099609375, 0.729339599609375, 0.7521514892578125, 0.77496337890625, 0.7977752685546875, 0.820587158203125, 0.8433990478515625, 0.8662109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 15.0, 16.0, 11.0, 17.0, 23.0, 24.0, 36.0, 52.0, 63.0, 55.0, 71.0, 80.0, 70.0, 83.0, 66.0, 60.0, 52.0, 30.0, 40.0, 23.0, 21.0, 11.0, 18.0, 16.0, 7.0, 5.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5751953125, -0.5532302856445312, -0.5312652587890625, -0.5093002319335938, -0.487335205078125, -0.46537017822265625, -0.4434051513671875, -0.42144012451171875, -0.39947509765625, -0.37751007080078125, -0.3555450439453125, -0.33358001708984375, -0.311614990234375, -0.28964996337890625, -0.2676849365234375, -0.24571990966796875, -0.2237548828125, -0.20178985595703125, -0.1798248291015625, -0.15785980224609375, -0.135894775390625, -0.11392974853515625, -0.0919647216796875, -0.06999969482421875, -0.04803466796875, -0.02606964111328125, -0.0041046142578125, 0.01786041259765625, 0.039825439453125, 0.06179046630859375, 0.0837554931640625, 0.10572052001953125, 0.127685546875, 0.14965057373046875, 0.1716156005859375, 0.19358062744140625, 0.215545654296875, 0.23751068115234375, 0.2594757080078125, 0.28144073486328125, 0.30340576171875, 0.32537078857421875, 0.3473358154296875, 0.36930084228515625, 0.391265869140625, 0.41323089599609375, 0.4351959228515625, 0.45716094970703125, 0.4791259765625, 0.5010910034179688, 0.5230560302734375, 0.5450210571289062, 0.566986083984375, 0.5889511108398438, 0.6109161376953125, 0.6328811645507812, 0.65484619140625, 0.6768112182617188, 0.6987762451171875, 0.7207412719726562, 0.742706298828125, 0.7646713256835938, 0.7866363525390625, 0.8086013793945312, 0.83056640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 9.0, 6.0, 9.0, 27.0, 44.0, 103.0, 142.0, 183.0, 198.0, 120.0, 80.0, 41.0, 22.0, 16.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37784194946289, -17.83738136291504, -17.296920776367188, -16.756460189819336, -16.215999603271484, -15.675539016723633, -15.135077476501465, -14.594616889953613, -14.054156303405762, -13.51369571685791, -12.973235130310059, -12.432774543762207, -11.892313003540039, -11.351852416992188, -10.811391830444336, -10.270931243896484, -9.730470657348633, -9.190010070800781, -8.64954948425293, -8.109088897705078, -7.568627834320068, -7.028167247772217, -6.487706184387207, -5.9472455978393555, -5.406785011291504, -4.866324424743652, -4.325863838195801, -3.785402774810791, -3.2449421882629395, -2.704481601715088, -2.1640207767486572, -1.6235599517822266, -1.083099365234375, -0.5426386594772339, -0.0021779537200927734, 0.5382827520370483, 1.0787434577941895, 1.619204044342041, 2.1596648693084717, 2.7001256942749023, 3.240586280822754, 3.7810468673706055, 4.321507453918457, 4.861968517303467, 5.402429103851318, 5.94288969039917, 6.48335075378418, 7.023811340332031, 7.564271926879883, 8.104732513427734, 8.645193099975586, 9.185653686523438, 9.726114273071289, 10.26657485961914, 10.807036399841309, 11.34749698638916, 11.887957572937012, 12.428418159484863, 12.968878746032715, 13.509339332580566, 14.049800872802734, 14.590261459350586, 15.130722045898438, 15.671182632446289, 16.21164321899414]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 5.0, 8.0, 2.0, 3.0, 12.0, 14.0, 18.0, 13.0, 15.0, 19.0, 28.0, 30.0, 30.0, 39.0, 33.0, 49.0, 32.0, 35.0, 44.0, 37.0, 51.0, 42.0, 42.0, 39.0, 40.0, 33.0, 32.0, 26.0, 34.0, 22.0, 26.0, 24.0, 17.0, 25.0, 12.0, 12.0, 10.0, 12.0, 6.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.618541717529297, -4.451461315155029, -4.2843804359436035, -4.117300033569336, -3.9502196311950684, -3.7831389904022217, -3.616058349609375, -3.4489779472351074, -3.2818973064422607, -3.114816665649414, -2.9477362632751465, -2.7806556224823, -2.613574981689453, -2.4464945793151855, -2.279413938522339, -2.112333297729492, -1.9452528953552246, -1.7781723737716675, -1.6110918521881104, -1.4440112113952637, -1.2769306898117065, -1.1098501682281494, -0.9427695274353027, -0.7756890058517456, -0.6086084842681885, -0.44152793288230896, -0.27444738149642944, -0.10736680030822754, 0.05971372127532959, 0.22679424285888672, 0.3938748836517334, 0.5609554052352905, 0.7280359268188477, 0.8951164484024048, 1.062196969985962, 1.2292776107788086, 1.3963581323623657, 1.5634386539459229, 1.7305192947387695, 1.8975998163223267, 2.064680337905884, 2.2317609786987305, 2.398841381072998, 2.5659220218658447, 2.7330026626586914, 2.900083065032959, 3.0671637058258057, 3.2342443466186523, 3.40132474899292, 3.5684053897857666, 3.735485792160034, 3.902566432952881, 4.069646835327148, 4.236727714538574, 4.403808116912842, 4.570888519287109, 4.737969398498535, 4.905049800872803, 5.0721306800842285, 5.239211082458496, 5.406291484832764, 5.573371887207031, 5.740452766418457, 5.907533168792725, 6.074613571166992]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 11.0, 14.0, 22.0, 27.0, 33.0, 37.0, 80.0, 120.0, 186.0, 397.0, 903.0, 2534.0, 9410.0, 54807.0, 3906856.0, 193248.0, 18314.0, 4375.0, 1566.0, 664.0, 298.0, 158.0, 78.0, 52.0, 31.0, 17.0, 10.0, 10.0, 7.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.4149169921875, -4.294677734375, -4.1744384765625, -4.05419921875, -3.9339599609375, -3.813720703125, -3.6934814453125, -3.5732421875, -3.4530029296875, -3.332763671875, -3.2125244140625, -3.09228515625, -2.9720458984375, -2.851806640625, -2.7315673828125, -2.611328125, -2.4910888671875, -2.370849609375, -2.2506103515625, -2.13037109375, -2.0101318359375, -1.889892578125, -1.7696533203125, -1.6494140625, -1.5291748046875, -1.408935546875, -1.2886962890625, -1.16845703125, -1.0482177734375, -0.927978515625, -0.8077392578125, -0.6875, -0.5672607421875, -0.447021484375, -0.3267822265625, -0.20654296875, -0.0863037109375, 0.033935546875, 0.1541748046875, 0.2744140625, 0.3946533203125, 0.514892578125, 0.6351318359375, 0.75537109375, 0.8756103515625, 0.995849609375, 1.1160888671875, 1.236328125, 1.3565673828125, 1.476806640625, 1.5970458984375, 1.71728515625, 1.8375244140625, 1.957763671875, 2.0780029296875, 2.1982421875, 2.3184814453125, 2.438720703125, 2.5589599609375, 2.67919921875, 2.7994384765625, 2.919677734375, 3.0399169921875, 3.16015625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 5.0, 11.0, 18.0, 35.0, 33.0, 37.0, 51.0, 71.0, 67.0, 72.0, 69.0, 86.0, 81.0, 70.0, 54.0, 42.0, 42.0, 39.0, 26.0, 26.0, 18.0, 17.0, 12.0, 6.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.473388671875, -0.46105194091796875, -0.4487152099609375, -0.43637847900390625, -0.424041748046875, -0.41170501708984375, -0.3993682861328125, -0.38703155517578125, -0.37469482421875, -0.36235809326171875, -0.3500213623046875, -0.33768463134765625, -0.325347900390625, -0.31301116943359375, -0.3006744384765625, -0.28833770751953125, -0.2760009765625, -0.26366424560546875, -0.2513275146484375, -0.23899078369140625, -0.226654052734375, -0.21431732177734375, -0.2019805908203125, -0.18964385986328125, -0.17730712890625, -0.16497039794921875, -0.1526336669921875, -0.14029693603515625, -0.127960205078125, -0.11562347412109375, -0.1032867431640625, -0.09095001220703125, -0.07861328125, -0.06627655029296875, -0.0539398193359375, -0.04160308837890625, -0.029266357421875, -0.01692962646484375, -0.0045928955078125, 0.00774383544921875, 0.02008056640625, 0.03241729736328125, 0.0447540283203125, 0.05709075927734375, 0.069427490234375, 0.08176422119140625, 0.0941009521484375, 0.10643768310546875, 0.1187744140625, 0.13111114501953125, 0.1434478759765625, 0.15578460693359375, 0.168121337890625, 0.18045806884765625, 0.1927947998046875, 0.20513153076171875, 0.21746826171875, 0.22980499267578125, 0.2421417236328125, 0.25447845458984375, 0.266815185546875, 0.27915191650390625, 0.2914886474609375, 0.30382537841796875, 0.316162109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 24.0, 35.0, 40.0, 68.0, 144.0, 204.0, 298.0, 547.0, 957.0, 1722.0, 3493.0, 7797.0, 22851.0, 107109.0, 3618390.0, 363212.0, 44113.0, 12625.0, 5066.0, 2426.0, 1287.0, 700.0, 442.0, 282.0, 177.0, 88.0, 63.0, 42.0, 32.0, 20.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.30908203125, -2.2314453125, -2.15380859375, -2.076171875, -1.99853515625, -1.9208984375, -1.84326171875, -1.765625, -1.68798828125, -1.6103515625, -1.53271484375, -1.455078125, -1.37744140625, -1.2998046875, -1.22216796875, -1.14453125, -1.06689453125, -0.9892578125, -0.91162109375, -0.833984375, -0.75634765625, -0.6787109375, -0.60107421875, -0.5234375, -0.44580078125, -0.3681640625, -0.29052734375, -0.212890625, -0.13525390625, -0.0576171875, 0.02001953125, 0.09765625, 0.17529296875, 0.2529296875, 0.33056640625, 0.408203125, 0.48583984375, 0.5634765625, 0.64111328125, 0.71875, 0.79638671875, 0.8740234375, 0.95166015625, 1.029296875, 1.10693359375, 1.1845703125, 1.26220703125, 1.33984375, 1.41748046875, 1.4951171875, 1.57275390625, 1.650390625, 1.72802734375, 1.8056640625, 1.88330078125, 1.9609375, 2.03857421875, 2.1162109375, 2.19384765625, 2.271484375, 2.34912109375, 2.4267578125, 2.50439453125, 2.58203125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 6.0, 16.0, 15.0, 36.0, 45.0, 92.0, 193.0, 1185.0, 1987.0, 239.0, 98.0, 59.0, 36.0, 17.0, 12.0, 11.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4560546875, -1.4076080322265625, -1.359161376953125, -1.3107147216796875, -1.26226806640625, -1.2138214111328125, -1.165374755859375, -1.1169281005859375, -1.0684814453125, -1.0200347900390625, -0.971588134765625, -0.9231414794921875, -0.87469482421875, -0.8262481689453125, -0.777801513671875, -0.7293548583984375, -0.680908203125, -0.6324615478515625, -0.584014892578125, -0.5355682373046875, -0.48712158203125, -0.4386749267578125, -0.390228271484375, -0.3417816162109375, -0.2933349609375, -0.2448883056640625, -0.196441650390625, -0.1479949951171875, -0.09954833984375, -0.0511016845703125, -0.002655029296875, 0.0457916259765625, 0.09423828125, 0.1426849365234375, 0.191131591796875, 0.2395782470703125, 0.28802490234375, 0.3364715576171875, 0.384918212890625, 0.4333648681640625, 0.4818115234375, 0.5302581787109375, 0.578704833984375, 0.6271514892578125, 0.67559814453125, 0.7240447998046875, 0.772491455078125, 0.8209381103515625, 0.869384765625, 0.9178314208984375, 0.966278076171875, 1.0147247314453125, 1.06317138671875, 1.1116180419921875, 1.160064697265625, 1.2085113525390625, 1.2569580078125, 1.3054046630859375, 1.353851318359375, 1.4022979736328125, 1.45074462890625, 1.4991912841796875, 1.547637939453125, 1.5960845947265625, 1.64453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 5.0, 7.0, 8.0, 15.0, 18.0, 33.0, 67.0, 96.0, 130.0, 157.0, 164.0, 126.0, 76.0, 40.0, 25.0, 13.0, 4.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.89401626586914, -11.650848388671875, -11.40768051147461, -11.164512634277344, -10.921344757080078, -10.678177833557129, -10.435009956359863, -10.191842079162598, -9.948674201965332, -9.705506324768066, -9.4623384475708, -9.219170570373535, -8.976003646850586, -8.73283576965332, -8.489667892456055, -8.246500015258789, -8.003332138061523, -7.760164260864258, -7.516996383666992, -7.273828983306885, -7.030661106109619, -6.7874932289123535, -6.544325828552246, -6.3011579513549805, -6.057990074157715, -5.814822196960449, -5.571654319763184, -5.328486919403076, -5.0853190422058105, -4.842151165008545, -4.5989837646484375, -4.355815887451172, -4.112648010253906, -3.8694801330566406, -3.626312494277954, -3.3831448554992676, -3.139976978302002, -2.8968091011047363, -2.65364146232605, -2.4104738235473633, -2.1673057079315186, -1.9241379499435425, -1.6809701919555664, -1.4378024339675903, -1.1946346759796143, -0.9514669179916382, -0.7082991600036621, -0.46513140201568604, -0.22196364402770996, 0.021204113960266113, 0.2643718719482422, 0.5075396299362183, 0.7507073879241943, 0.9938751459121704, 1.2370429039001465, 1.4802106618881226, 1.7233784198760986, 1.9665461778640747, 2.209713935852051, 2.4528818130493164, 2.696049451828003, 2.9392170906066895, 3.182384967803955, 3.4255528450012207, 3.6687204837799072]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 6.0, 4.0, 12.0, 3.0, 11.0, 7.0, 13.0, 6.0, 25.0, 20.0, 26.0, 33.0, 17.0, 35.0, 19.0, 28.0, 33.0, 41.0, 37.0, 29.0, 40.0, 40.0, 36.0, 39.0, 36.0, 39.0, 29.0, 33.0, 36.0, 24.0, 31.0, 20.0, 19.0, 21.0, 15.0, 18.0, 25.0, 17.0, 15.0, 6.0, 6.0, 7.0, 3.0, 6.0, 9.0, 3.0, 4.0, 5.0, 5.0], "bins": [-3.4690258502960205, -3.374457836151123, -3.2798898220062256, -3.185321807861328, -3.0907537937164307, -2.996185779571533, -2.9016177654266357, -2.8070497512817383, -2.712481737136841, -2.6179137229919434, -2.523345708847046, -2.4287776947021484, -2.334209680557251, -2.2396416664123535, -2.145073652267456, -2.0505056381225586, -1.9559376239776611, -1.8613696098327637, -1.7668015956878662, -1.6722335815429688, -1.5776655673980713, -1.4830975532531738, -1.3885295391082764, -1.293961524963379, -1.1993935108184814, -1.104825496673584, -1.0102574825286865, -0.9156894683837891, -0.8211214542388916, -0.7265534400939941, -0.6319854259490967, -0.5374174118041992, -0.44284939765930176, -0.3482813835144043, -0.25371336936950684, -0.15914535522460938, -0.06457734107971191, 0.029990673065185547, 0.12455868721008301, 0.21912670135498047, 0.31369471549987793, 0.4082627296447754, 0.5028307437896729, 0.5973987579345703, 0.6919667720794678, 0.7865347862243652, 0.8811028003692627, 0.9756708145141602, 1.0702388286590576, 1.164806842803955, 1.2593748569488525, 1.35394287109375, 1.4485108852386475, 1.543078899383545, 1.6376469135284424, 1.7322149276733398, 1.8267829418182373, 1.9213509559631348, 2.0159189701080322, 2.1104869842529297, 2.205054998397827, 2.2996230125427246, 2.394191026687622, 2.4887590408325195, 2.583327054977417]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 8.0, 10.0, 22.0, 20.0, 31.0, 81.0, 120.0, 191.0, 345.0, 653.0, 1430.0, 3375.0, 8606.0, 25118.0, 81781.0, 292408.0, 427797.0, 142939.0, 41009.0, 13507.0, 5009.0, 2058.0, 985.0, 427.0, 222.0, 148.0, 97.0, 47.0, 33.0, 26.0, 12.0, 7.0, 2.0, 8.0, 3.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.48828125, -2.4231719970703125, -2.358062744140625, -2.2929534912109375, -2.22784423828125, -2.1627349853515625, -2.097625732421875, -2.0325164794921875, -1.9674072265625, -1.9022979736328125, -1.837188720703125, -1.7720794677734375, -1.70697021484375, -1.6418609619140625, -1.576751708984375, -1.5116424560546875, -1.446533203125, -1.3814239501953125, -1.316314697265625, -1.2512054443359375, -1.18609619140625, -1.1209869384765625, -1.055877685546875, -0.9907684326171875, -0.9256591796875, -0.8605499267578125, -0.795440673828125, -0.7303314208984375, -0.66522216796875, -0.6001129150390625, -0.535003662109375, -0.4698944091796875, -0.40478515625, -0.3396759033203125, -0.274566650390625, -0.2094573974609375, -0.14434814453125, -0.0792388916015625, -0.014129638671875, 0.0509796142578125, 0.1160888671875, 0.1811981201171875, 0.246307373046875, 0.3114166259765625, 0.37652587890625, 0.4416351318359375, 0.506744384765625, 0.5718536376953125, 0.636962890625, 0.7020721435546875, 0.767181396484375, 0.8322906494140625, 0.89739990234375, 0.9625091552734375, 1.027618408203125, 1.0927276611328125, 1.1578369140625, 1.2229461669921875, 1.288055419921875, 1.3531646728515625, 1.41827392578125, 1.4833831787109375, 1.548492431640625, 1.6136016845703125, 1.6787109375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 15.0, 9.0, 22.0, 25.0, 25.0, 37.0, 38.0, 33.0, 39.0, 53.0, 54.0, 61.0, 54.0, 52.0, 53.0, 57.0, 51.0, 52.0, 27.0, 55.0, 28.0, 31.0, 27.0, 23.0, 14.0, 6.0, 11.0, 4.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5048828125, -0.4917030334472656, -0.47852325439453125, -0.4653434753417969, -0.4521636962890625, -0.4389839172363281, -0.42580413818359375, -0.4126243591308594, -0.399444580078125, -0.3862648010253906, -0.37308502197265625, -0.3599052429199219, -0.3467254638671875, -0.3335456848144531, -0.32036590576171875, -0.3071861267089844, -0.29400634765625, -0.2808265686035156, -0.26764678955078125, -0.2544670104980469, -0.2412872314453125, -0.22810745239257812, -0.21492767333984375, -0.20174789428710938, -0.188568115234375, -0.17538833618164062, -0.16220855712890625, -0.14902877807617188, -0.1358489990234375, -0.12266921997070312, -0.10948944091796875, -0.09630966186523438, -0.0831298828125, -0.06995010375976562, -0.05677032470703125, -0.043590545654296875, -0.0304107666015625, -0.017230987548828125, -0.00405120849609375, 0.009128570556640625, 0.022308349609375, 0.035488128662109375, 0.04866790771484375, 0.061847686767578125, 0.0750274658203125, 0.08820724487304688, 0.10138702392578125, 0.11456680297851562, 0.12774658203125, 0.14092636108398438, 0.15410614013671875, 0.16728591918945312, 0.1804656982421875, 0.19364547729492188, 0.20682525634765625, 0.22000503540039062, 0.233184814453125, 0.24636459350585938, 0.25954437255859375, 0.2727241516113281, 0.2859039306640625, 0.2990837097167969, 0.31226348876953125, 0.3254432678222656, 0.338623046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 10.0, 15.0, 21.0, 43.0, 60.0, 65.0, 91.0, 149.0, 230.0, 394.0, 598.0, 942.0, 1640.0, 2760.0, 5438.0, 11095.0, 24942.0, 63037.0, 186896.0, 410550.0, 215347.0, 71212.0, 27619.0, 11920.0, 5917.0, 3012.0, 1721.0, 1047.0, 580.0, 387.0, 268.0, 181.0, 121.0, 65.0, 41.0, 34.0, 29.0, 15.0, 8.0, 16.0, 7.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6748046875, -1.6233673095703125, -1.571929931640625, -1.5204925537109375, -1.46905517578125, -1.4176177978515625, -1.366180419921875, -1.3147430419921875, -1.2633056640625, -1.2118682861328125, -1.160430908203125, -1.1089935302734375, -1.05755615234375, -1.0061187744140625, -0.954681396484375, -0.9032440185546875, -0.851806640625, -0.8003692626953125, -0.748931884765625, -0.6974945068359375, -0.64605712890625, -0.5946197509765625, -0.543182373046875, -0.4917449951171875, -0.4403076171875, -0.3888702392578125, -0.337432861328125, -0.2859954833984375, -0.23455810546875, -0.1831207275390625, -0.131683349609375, -0.0802459716796875, -0.02880859375, 0.0226287841796875, 0.074066162109375, 0.1255035400390625, 0.17694091796875, 0.2283782958984375, 0.279815673828125, 0.3312530517578125, 0.3826904296875, 0.4341278076171875, 0.485565185546875, 0.5370025634765625, 0.58843994140625, 0.6398773193359375, 0.691314697265625, 0.7427520751953125, 0.794189453125, 0.8456268310546875, 0.897064208984375, 0.9485015869140625, 0.99993896484375, 1.0513763427734375, 1.102813720703125, 1.1542510986328125, 1.2056884765625, 1.2571258544921875, 1.308563232421875, 1.3600006103515625, 1.41143798828125, 1.4628753662109375, 1.514312744140625, 1.5657501220703125, 1.6171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 6.0, 10.0, 11.0, 7.0, 13.0, 8.0, 24.0, 17.0, 22.0, 26.0, 46.0, 33.0, 38.0, 37.0, 46.0, 34.0, 42.0, 41.0, 39.0, 27.0, 43.0, 28.0, 40.0, 29.0, 43.0, 41.0, 35.0, 30.0, 24.0, 19.0, 24.0, 16.0, 11.0, 16.0, 14.0, 7.0, 6.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.904296875, -1.84930419921875, -1.7943115234375, -1.73931884765625, -1.684326171875, -1.62933349609375, -1.5743408203125, -1.51934814453125, -1.46435546875, -1.40936279296875, -1.3543701171875, -1.29937744140625, -1.244384765625, -1.18939208984375, -1.1343994140625, -1.07940673828125, -1.0244140625, -0.96942138671875, -0.9144287109375, -0.85943603515625, -0.804443359375, -0.74945068359375, -0.6944580078125, -0.63946533203125, -0.58447265625, -0.52947998046875, -0.4744873046875, -0.41949462890625, -0.364501953125, -0.30950927734375, -0.2545166015625, -0.19952392578125, -0.14453125, -0.08953857421875, -0.0345458984375, 0.02044677734375, 0.075439453125, 0.13043212890625, 0.1854248046875, 0.24041748046875, 0.29541015625, 0.35040283203125, 0.4053955078125, 0.46038818359375, 0.515380859375, 0.57037353515625, 0.6253662109375, 0.68035888671875, 0.7353515625, 0.79034423828125, 0.8453369140625, 0.90032958984375, 0.955322265625, 1.01031494140625, 1.0653076171875, 1.12030029296875, 1.17529296875, 1.23028564453125, 1.2852783203125, 1.34027099609375, 1.395263671875, 1.45025634765625, 1.5052490234375, 1.56024169921875, 1.615234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 10.0, 14.0, 19.0, 28.0, 39.0, 53.0, 90.0, 168.0, 314.0, 658.0, 1375.0, 3725.0, 12960.0, 82493.0, 735658.0, 181335.0, 20690.0, 5307.0, 1926.0, 785.0, 380.0, 200.0, 109.0, 56.0, 35.0, 36.0, 24.0, 12.0, 12.0, 12.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83984375, -1.7817230224609375, -1.723602294921875, -1.6654815673828125, -1.60736083984375, -1.5492401123046875, -1.491119384765625, -1.4329986572265625, -1.3748779296875, -1.3167572021484375, -1.258636474609375, -1.2005157470703125, -1.14239501953125, -1.0842742919921875, -1.026153564453125, -0.9680328369140625, -0.909912109375, -0.8517913818359375, -0.793670654296875, -0.7355499267578125, -0.67742919921875, -0.6193084716796875, -0.561187744140625, -0.5030670166015625, -0.4449462890625, -0.3868255615234375, -0.328704833984375, -0.2705841064453125, -0.21246337890625, -0.1543426513671875, -0.096221923828125, -0.0381011962890625, 0.02001953125, 0.0781402587890625, 0.136260986328125, 0.1943817138671875, 0.25250244140625, 0.3106231689453125, 0.368743896484375, 0.4268646240234375, 0.4849853515625, 0.5431060791015625, 0.601226806640625, 0.6593475341796875, 0.71746826171875, 0.7755889892578125, 0.833709716796875, 0.8918304443359375, 0.949951171875, 1.0080718994140625, 1.066192626953125, 1.1243133544921875, 1.18243408203125, 1.2405548095703125, 1.298675537109375, 1.3567962646484375, 1.4149169921875, 1.4730377197265625, 1.531158447265625, 1.5892791748046875, 1.64739990234375, 1.7055206298828125, 1.763641357421875, 1.8217620849609375, 1.8798828125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 17.0, 17.0, 28.0, 24.0, 44.0, 68.0, 82.0, 106.0, 111.0, 119.0, 87.0, 65.0, 49.0, 32.0, 32.0, 27.0, 11.0, 10.0, 12.0, 7.0, 6.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00015747547149658203, -0.00015026144683361053, -0.00014304742217063904, -0.00013583339750766754, -0.00012861937284469604, -0.00012140534818172455, -0.00011419132351875305, -0.00010697729885578156, -9.976327419281006e-05, -9.254924952983856e-05, -8.533522486686707e-05, -7.812120020389557e-05, -7.090717554092407e-05, -6.369315087795258e-05, -5.647912621498108e-05, -4.926510155200958e-05, -4.2051076889038086e-05, -3.483705222606659e-05, -2.7623027563095093e-05, -2.0409002900123596e-05, -1.31949782371521e-05, -5.980953574180603e-06, 1.2330710887908936e-06, 8.44709575176239e-06, 1.5661120414733887e-05, 2.2875145077705383e-05, 3.008916974067688e-05, 3.7303194403648376e-05, 4.451721906661987e-05, 5.173124372959137e-05, 5.8945268392562866e-05, 6.615929305553436e-05, 7.337331771850586e-05, 8.058734238147736e-05, 8.780136704444885e-05, 9.501539170742035e-05, 0.00010222941637039185, 0.00010944344103336334, 0.00011665746569633484, 0.00012387149035930634, 0.00013108551502227783, 0.00013829953968524933, 0.00014551356434822083, 0.00015272758901119232, 0.00015994161367416382, 0.00016715563833713531, 0.0001743696630001068, 0.0001815836876630783, 0.0001887977123260498, 0.0001960117369890213, 0.0002032257616519928, 0.0002104397863149643, 0.0002176538109779358, 0.0002248678356409073, 0.00023208186030387878, 0.00023929588496685028, 0.0002465099096298218, 0.0002537239342927933, 0.00026093795895576477, 0.00026815198361873627, 0.00027536600828170776, 0.00028258003294467926, 0.00028979405760765076, 0.00029700808227062225, 0.00030422210693359375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 7.0, 15.0, 18.0, 22.0, 35.0, 63.0, 80.0, 92.0, 211.0, 288.0, 517.0, 1040.0, 2297.0, 5996.0, 22471.0, 131826.0, 653678.0, 187760.0, 29424.0, 7361.0, 2637.0, 1159.0, 609.0, 333.0, 195.0, 136.0, 73.0, 58.0, 36.0, 33.0, 25.0, 11.0, 8.0, 11.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4150390625, -1.371612548828125, -1.32818603515625, -1.284759521484375, -1.2413330078125, -1.197906494140625, -1.15447998046875, -1.111053466796875, -1.067626953125, -1.024200439453125, -0.98077392578125, -0.937347412109375, -0.8939208984375, -0.850494384765625, -0.80706787109375, -0.763641357421875, -0.72021484375, -0.676788330078125, -0.63336181640625, -0.589935302734375, -0.5465087890625, -0.503082275390625, -0.45965576171875, -0.416229248046875, -0.372802734375, -0.329376220703125, -0.28594970703125, -0.242523193359375, -0.1990966796875, -0.155670166015625, -0.11224365234375, -0.068817138671875, -0.025390625, 0.018035888671875, 0.06146240234375, 0.104888916015625, 0.1483154296875, 0.191741943359375, 0.23516845703125, 0.278594970703125, 0.322021484375, 0.365447998046875, 0.40887451171875, 0.452301025390625, 0.4957275390625, 0.539154052734375, 0.58258056640625, 0.626007080078125, 0.66943359375, 0.712860107421875, 0.75628662109375, 0.799713134765625, 0.8431396484375, 0.886566162109375, 0.92999267578125, 0.973419189453125, 1.016845703125, 1.060272216796875, 1.10369873046875, 1.147125244140625, 1.1905517578125, 1.233978271484375, 1.27740478515625, 1.320831298828125, 1.3642578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 10.0, 10.0, 17.0, 19.0, 36.0, 42.0, 43.0, 70.0, 90.0, 124.0, 124.0, 112.0, 72.0, 51.0, 37.0, 40.0, 23.0, 18.0, 18.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6697998046875, -1.620849609375, -1.5718994140625, -1.52294921875, -1.4739990234375, -1.425048828125, -1.3760986328125, -1.3271484375, -1.2781982421875, -1.229248046875, -1.1802978515625, -1.13134765625, -1.0823974609375, -1.033447265625, -0.9844970703125, -0.935546875, -0.8865966796875, -0.837646484375, -0.7886962890625, -0.73974609375, -0.6907958984375, -0.641845703125, -0.5928955078125, -0.5439453125, -0.4949951171875, -0.446044921875, -0.3970947265625, -0.34814453125, -0.2991943359375, -0.250244140625, -0.2012939453125, -0.15234375, -0.1033935546875, -0.054443359375, -0.0054931640625, 0.04345703125, 0.0924072265625, 0.141357421875, 0.1903076171875, 0.2392578125, 0.2882080078125, 0.337158203125, 0.3861083984375, 0.43505859375, 0.4840087890625, 0.532958984375, 0.5819091796875, 0.630859375, 0.6798095703125, 0.728759765625, 0.7777099609375, 0.82666015625, 0.8756103515625, 0.924560546875, 0.9735107421875, 1.0224609375, 1.0714111328125, 1.120361328125, 1.1693115234375, 1.21826171875, 1.2672119140625, 1.316162109375, 1.3651123046875, 1.4140625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 28.0, 112.0, 291.0, 367.0, 159.0, 30.0, 18.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-107.14361572265625, -105.20366668701172, -103.26371002197266, -101.32376098632812, -99.3838119506836, -97.44386291503906, -95.50390625, -93.56395721435547, -91.62400817871094, -89.6840591430664, -87.74410247802734, -85.80415344238281, -83.86420440673828, -81.92425537109375, -79.98429870605469, -78.04434967041016, -76.10440063476562, -74.1644515991211, -72.22449493408203, -70.2845458984375, -68.34459686279297, -66.40464782714844, -64.46469116210938, -62.524742126464844, -60.58478546142578, -58.644832611083984, -56.70488357543945, -54.764930725097656, -52.824981689453125, -50.88502883911133, -48.94507598876953, -47.005126953125, -45.06517791748047, -43.12522506713867, -41.18527603149414, -39.245323181152344, -37.30537414550781, -35.365421295166016, -33.42546844482422, -31.485519409179688, -29.545570373535156, -27.605619430541992, -25.665668487548828, -23.72571563720703, -21.7857666015625, -19.845813751220703, -17.90586280822754, -15.965911865234375, -14.025960922241211, -12.086009979248047, -10.146059036254883, -8.206107139587402, -6.266156196594238, -4.326205253601074, -2.3862533569335938, -0.4463024139404297, 1.4936485290527344, 3.4335997104644775, 5.373550891876221, 7.313502311706543, 9.253453254699707, 11.193404197692871, 13.133356094360352, 15.073307037353516, 17.01325798034668]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 12.0, 5.0, 5.0, 15.0, 11.0, 12.0, 17.0, 15.0, 23.0, 25.0, 30.0, 28.0, 36.0, 39.0, 46.0, 48.0, 47.0, 40.0, 45.0, 43.0, 47.0, 61.0, 35.0, 49.0, 40.0, 26.0, 31.0, 18.0, 21.0, 12.0, 17.0, 16.0, 14.0, 12.0, 8.0, 7.0, 6.0, 10.0, 9.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.62202262878418, -10.280797004699707, -9.939571380615234, -9.598345756530762, -9.257120132446289, -8.915895462036133, -8.57466983795166, -8.233444213867188, -7.892218589782715, -7.550992965698242, -7.2097673416137695, -6.868542194366455, -6.527316570281982, -6.18609094619751, -5.844865798950195, -5.503640174865723, -5.16241455078125, -4.821188926696777, -4.479963302612305, -4.13873815536499, -3.7975125312805176, -3.456286907196045, -3.1150615215301514, -2.773836135864258, -2.432610511779785, -2.0913848876953125, -1.750159502029419, -1.4089339971542358, -1.0677084922790527, -0.7264829874038696, -0.3852574825286865, -0.04403209686279297, 0.2971944808959961, 0.6384199857711792, 0.9796454906463623, 1.3208709955215454, 1.6620965003967285, 2.003322124481201, 2.3445475101470947, 2.6857728958129883, 3.026998519897461, 3.3682241439819336, 3.709449529647827, 4.050674915313721, 4.391900539398193, 4.733126163482666, 5.0743513107299805, 5.415576934814453, 5.756802558898926, 6.098028182983398, 6.439253807067871, 6.7804789543151855, 7.121704578399658, 7.462930202484131, 7.804155349731445, 8.145380973815918, 8.48660659790039, 8.827832221984863, 9.169057846069336, 9.510283470153809, 9.851509094238281, 10.192733764648438, 10.53395938873291, 10.875185012817383, 11.216410636901855]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 9.0, 13.0, 11.0, 11.0, 27.0, 32.0, 57.0, 81.0, 181.0, 359.0, 938.0, 2895.0, 13084.0, 4040402.0, 123701.0, 8869.0, 2168.0, 721.0, 331.0, 126.0, 87.0, 43.0, 48.0, 24.0, 14.0, 12.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.00390625, -6.81903076171875, -6.6341552734375, -6.44927978515625, -6.264404296875, -6.07952880859375, -5.8946533203125, -5.70977783203125, -5.52490234375, -5.34002685546875, -5.1551513671875, -4.97027587890625, -4.785400390625, -4.60052490234375, -4.4156494140625, -4.23077392578125, -4.0458984375, -3.86102294921875, -3.6761474609375, -3.49127197265625, -3.306396484375, -3.12152099609375, -2.9366455078125, -2.75177001953125, -2.56689453125, -2.38201904296875, -2.1971435546875, -2.01226806640625, -1.827392578125, -1.64251708984375, -1.4576416015625, -1.27276611328125, -1.087890625, -0.90301513671875, -0.7181396484375, -0.53326416015625, -0.348388671875, -0.16351318359375, 0.0213623046875, 0.20623779296875, 0.39111328125, 0.57598876953125, 0.7608642578125, 0.94573974609375, 1.130615234375, 1.31549072265625, 1.5003662109375, 1.68524169921875, 1.8701171875, 2.05499267578125, 2.2398681640625, 2.42474365234375, 2.609619140625, 2.79449462890625, 2.9793701171875, 3.16424560546875, 3.34912109375, 3.53399658203125, 3.7188720703125, 3.90374755859375, 4.088623046875, 4.27349853515625, 4.4583740234375, 4.64324951171875, 4.828125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 9.0, 11.0, 9.0, 17.0, 17.0, 29.0, 36.0, 42.0, 46.0, 48.0, 53.0, 65.0, 72.0, 66.0, 62.0, 61.0, 57.0, 52.0, 43.0, 42.0, 26.0, 29.0, 27.0, 14.0, 18.0, 13.0, 4.0, 4.0, 6.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6806640625, -0.66046142578125, -0.6402587890625, -0.62005615234375, -0.599853515625, -0.57965087890625, -0.5594482421875, -0.53924560546875, -0.51904296875, -0.49884033203125, -0.4786376953125, -0.45843505859375, -0.438232421875, -0.41802978515625, -0.3978271484375, -0.37762451171875, -0.357421875, -0.33721923828125, -0.3170166015625, -0.29681396484375, -0.276611328125, -0.25640869140625, -0.2362060546875, -0.21600341796875, -0.19580078125, -0.17559814453125, -0.1553955078125, -0.13519287109375, -0.114990234375, -0.09478759765625, -0.0745849609375, -0.05438232421875, -0.0341796875, -0.01397705078125, 0.0062255859375, 0.02642822265625, 0.046630859375, 0.06683349609375, 0.0870361328125, 0.10723876953125, 0.12744140625, 0.14764404296875, 0.1678466796875, 0.18804931640625, 0.208251953125, 0.22845458984375, 0.2486572265625, 0.26885986328125, 0.2890625, 0.30926513671875, 0.3294677734375, 0.34967041015625, 0.369873046875, 0.39007568359375, 0.4102783203125, 0.43048095703125, 0.45068359375, 0.47088623046875, 0.4910888671875, 0.51129150390625, 0.531494140625, 0.55169677734375, 0.5718994140625, 0.59210205078125, 0.6123046875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 11.0, 28.0, 27.0, 33.0, 37.0, 50.0, 62.0, 114.0, 103.0, 146.0, 239.0, 282.0, 447.0, 654.0, 964.0, 1563.0, 2750.0, 5309.0, 12146.0, 38124.0, 3930307.0, 157470.0, 23990.0, 8896.0, 4085.0, 2203.0, 1297.0, 847.0, 585.0, 379.0, 287.0, 200.0, 151.0, 109.0, 104.0, 53.0, 43.0, 37.0, 39.0, 23.0, 16.0, 14.0, 12.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.865234375, -3.739837646484375, -3.61444091796875, -3.489044189453125, -3.3636474609375, -3.238250732421875, -3.11285400390625, -2.987457275390625, -2.862060546875, -2.736663818359375, -2.61126708984375, -2.485870361328125, -2.3604736328125, -2.235076904296875, -2.10968017578125, -1.984283447265625, -1.85888671875, -1.733489990234375, -1.60809326171875, -1.482696533203125, -1.3572998046875, -1.231903076171875, -1.10650634765625, -0.981109619140625, -0.855712890625, -0.730316162109375, -0.60491943359375, -0.479522705078125, -0.3541259765625, -0.228729248046875, -0.10333251953125, 0.022064208984375, 0.1474609375, 0.272857666015625, 0.39825439453125, 0.523651123046875, 0.6490478515625, 0.774444580078125, 0.89984130859375, 1.025238037109375, 1.150634765625, 1.276031494140625, 1.40142822265625, 1.526824951171875, 1.6522216796875, 1.777618408203125, 1.90301513671875, 2.028411865234375, 2.15380859375, 2.279205322265625, 2.40460205078125, 2.529998779296875, 2.6553955078125, 2.780792236328125, 2.90618896484375, 3.031585693359375, 3.156982421875, 3.282379150390625, 3.40777587890625, 3.533172607421875, 3.6585693359375, 3.783966064453125, 3.90936279296875, 4.034759521484375, 4.16015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 5.0, 6.0, 9.0, 19.0, 12.0, 21.0, 56.0, 261.0, 3519.0, 72.0, 39.0, 19.0, 5.0, 7.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.142059326171875, -1.10150146484375, -1.060943603515625, -1.0203857421875, -0.979827880859375, -0.93927001953125, -0.898712158203125, -0.858154296875, -0.817596435546875, -0.77703857421875, -0.736480712890625, -0.6959228515625, -0.655364990234375, -0.61480712890625, -0.574249267578125, -0.53369140625, -0.493133544921875, -0.45257568359375, -0.412017822265625, -0.3714599609375, -0.330902099609375, -0.29034423828125, -0.249786376953125, -0.209228515625, -0.168670654296875, -0.12811279296875, -0.087554931640625, -0.0469970703125, -0.006439208984375, 0.03411865234375, 0.074676513671875, 0.115234375, 0.155792236328125, 0.19635009765625, 0.236907958984375, 0.2774658203125, 0.318023681640625, 0.35858154296875, 0.399139404296875, 0.439697265625, 0.480255126953125, 0.52081298828125, 0.561370849609375, 0.6019287109375, 0.642486572265625, 0.68304443359375, 0.723602294921875, 0.76416015625, 0.804718017578125, 0.84527587890625, 0.885833740234375, 0.9263916015625, 0.966949462890625, 1.00750732421875, 1.048065185546875, 1.088623046875, 1.129180908203125, 1.16973876953125, 1.210296630859375, 1.2508544921875, 1.291412353515625, 1.33197021484375, 1.372528076171875, 1.4130859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 11.0, 7.0, 16.0, 27.0, 51.0, 87.0, 114.0, 125.0, 139.0, 106.0, 101.0, 73.0, 47.0, 28.0, 25.0, 16.0, 5.0, 8.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7021236419677734, -2.581059217453003, -2.4599947929382324, -2.338930606842041, -2.2178661823272705, -2.0968017578125, -1.9757373332977295, -1.854672908782959, -1.733608603477478, -1.6125441789627075, -1.4914798736572266, -1.370415449142456, -1.2493510246276855, -1.1282867193222046, -1.007222294807434, -0.8861579298973083, -0.7650935649871826, -0.6440292000770569, -0.5229648351669312, -0.40190041065216064, -0.2808360457420349, -0.15977168083190918, -0.03870725631713867, 0.08235710859298706, 0.2034214735031128, 0.3244858384132385, 0.44555023312568665, 0.5666146278381348, 0.6876789927482605, 0.8087433576583862, 0.9298077821731567, 1.0508720874786377, 1.1719365119934082, 1.2930009365081787, 1.4140652418136597, 1.5351296663284302, 1.6561939716339111, 1.7772583961486816, 1.8983228206634521, 2.0193872451782227, 2.140451431274414, 2.2615158557891846, 2.382580280303955, 2.5036444664001465, 2.624708890914917, 2.7457733154296875, 2.866837739944458, 2.9879021644592285, 3.108966588973999, 3.2300310134887695, 3.35109543800354, 3.4721598625183105, 3.593224048614502, 3.7142884731292725, 3.835352897644043, 3.9564173221588135, 4.077481746673584, 4.198545932769775, 4.319610595703125, 4.440674781799316, 4.561739444732666, 4.682803630828857, 4.803868293762207, 4.924932479858398, 5.04599666595459]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 4.0, 7.0, 8.0, 10.0, 11.0, 16.0, 8.0, 16.0, 13.0, 20.0, 29.0, 34.0, 27.0, 29.0, 42.0, 50.0, 40.0, 44.0, 44.0, 55.0, 41.0, 58.0, 48.0, 42.0, 34.0, 32.0, 27.0, 22.0, 23.0, 19.0, 19.0, 12.0, 23.0, 17.0, 15.0, 14.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7838761806488037, -1.725106120109558, -1.6663360595703125, -1.607565999031067, -1.5487959384918213, -1.4900259971618652, -1.4312559366226196, -1.372485876083374, -1.3137158155441284, -1.2549457550048828, -1.1961756944656372, -1.1374056339263916, -1.0786356925964355, -1.0198655128479004, -0.9610955715179443, -0.9023255109786987, -0.8435554504394531, -0.7847853899002075, -0.7260153293609619, -0.6672453284263611, -0.6084752678871155, -0.5497052073478699, -0.49093517661094666, -0.43216514587402344, -0.37339508533477783, -0.3146250247955322, -0.255854994058609, -0.1970849484205246, -0.13831490278244019, -0.07954484224319458, -0.020774811506271362, 0.037995219230651855, 0.09676527976989746, 0.15553532540798187, 0.21430537104606628, 0.2730754017829895, 0.3318454623222351, 0.3906155228614807, 0.44938555359840393, 0.5081555843353271, 0.5669256448745728, 0.6256957054138184, 0.684465765953064, 0.7432357668876648, 0.8020058274269104, 0.860775887966156, 0.9195458889007568, 0.9783159494400024, 1.037086009979248, 1.0958560705184937, 1.1546261310577393, 1.2133961915969849, 1.2721662521362305, 1.3309361934661865, 1.3897062540054321, 1.4484763145446777, 1.5072463750839233, 1.566016435623169, 1.6247864961624146, 1.6835565567016602, 1.7423264980316162, 1.8010966777801514, 1.8598666191101074, 1.918636679649353, 1.9774067401885986]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 7.0, 14.0, 22.0, 26.0, 38.0, 59.0, 61.0, 109.0, 170.0, 253.0, 382.0, 538.0, 920.0, 1470.0, 2398.0, 4103.0, 7171.0, 13239.0, 24883.0, 47818.0, 92906.0, 168912.0, 236647.0, 199047.0, 117233.0, 60481.0, 31414.0, 16407.0, 9076.0, 4981.0, 2900.0, 1737.0, 1133.0, 674.0, 462.0, 291.0, 165.0, 119.0, 92.0, 53.0, 41.0, 27.0, 30.0, 14.0, 8.0, 6.0, 4.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.4526519775390625, -1.405303955078125, -1.3579559326171875, -1.31060791015625, -1.2632598876953125, -1.215911865234375, -1.1685638427734375, -1.1212158203125, -1.0738677978515625, -1.026519775390625, -0.9791717529296875, -0.93182373046875, -0.8844757080078125, -0.837127685546875, -0.7897796630859375, -0.742431640625, -0.6950836181640625, -0.647735595703125, -0.6003875732421875, -0.55303955078125, -0.5056915283203125, -0.458343505859375, -0.4109954833984375, -0.3636474609375, -0.3162994384765625, -0.268951416015625, -0.2216033935546875, -0.17425537109375, -0.1269073486328125, -0.079559326171875, -0.0322113037109375, 0.01513671875, 0.0624847412109375, 0.109832763671875, 0.1571807861328125, 0.20452880859375, 0.2518768310546875, 0.299224853515625, 0.3465728759765625, 0.3939208984375, 0.4412689208984375, 0.488616943359375, 0.5359649658203125, 0.58331298828125, 0.6306610107421875, 0.678009033203125, 0.7253570556640625, 0.772705078125, 0.8200531005859375, 0.867401123046875, 0.9147491455078125, 0.96209716796875, 1.0094451904296875, 1.056793212890625, 1.1041412353515625, 1.1514892578125, 1.1988372802734375, 1.246185302734375, 1.2935333251953125, 1.34088134765625, 1.3882293701171875, 1.435577392578125, 1.4829254150390625, 1.5302734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 16.0, 18.0, 17.0, 25.0, 25.0, 23.0, 41.0, 43.0, 44.0, 58.0, 56.0, 58.0, 68.0, 56.0, 57.0, 52.0, 38.0, 41.0, 44.0, 34.0, 33.0, 19.0, 19.0, 25.0, 14.0, 13.0, 10.0, 8.0, 7.0, 9.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8125, -0.7878799438476562, -0.7632598876953125, -0.7386398315429688, -0.714019775390625, -0.6893997192382812, -0.6647796630859375, -0.6401596069335938, -0.61553955078125, -0.5909194946289062, -0.5662994384765625, -0.5416793823242188, -0.517059326171875, -0.49243927001953125, -0.4678192138671875, -0.44319915771484375, -0.4185791015625, -0.39395904541015625, -0.3693389892578125, -0.34471893310546875, -0.320098876953125, -0.29547882080078125, -0.2708587646484375, -0.24623870849609375, -0.22161865234375, -0.19699859619140625, -0.1723785400390625, -0.14775848388671875, -0.123138427734375, -0.09851837158203125, -0.0738983154296875, -0.04927825927734375, -0.024658203125, -3.814697265625e-05, 0.0245819091796875, 0.04920196533203125, 0.073822021484375, 0.09844207763671875, 0.1230621337890625, 0.14768218994140625, 0.17230224609375, 0.19692230224609375, 0.2215423583984375, 0.24616241455078125, 0.270782470703125, 0.29540252685546875, 0.3200225830078125, 0.34464263916015625, 0.3692626953125, 0.39388275146484375, 0.4185028076171875, 0.44312286376953125, 0.467742919921875, 0.49236297607421875, 0.5169830322265625, 0.5416030883789062, 0.56622314453125, 0.5908432006835938, 0.6154632568359375, 0.6400833129882812, 0.664703369140625, 0.6893234252929688, 0.7139434814453125, 0.7385635375976562, 0.76318359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 17.0, 41.0, 62.0, 107.0, 186.0, 490.0, 967.0, 2560.0, 7888.0, 31926.0, 183849.0, 597598.0, 179305.0, 31508.0, 7645.0, 2523.0, 991.0, 395.0, 220.0, 104.0, 63.0, 34.0, 22.0, 11.0, 13.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.458984375, -3.305206298828125, -3.15142822265625, -2.997650146484375, -2.8438720703125, -2.690093994140625, -2.53631591796875, -2.382537841796875, -2.228759765625, -2.074981689453125, -1.92120361328125, -1.767425537109375, -1.6136474609375, -1.459869384765625, -1.30609130859375, -1.152313232421875, -0.99853515625, -0.844757080078125, -0.69097900390625, -0.537200927734375, -0.3834228515625, -0.229644775390625, -0.07586669921875, 0.077911376953125, 0.231689453125, 0.385467529296875, 0.53924560546875, 0.693023681640625, 0.8468017578125, 1.000579833984375, 1.15435791015625, 1.308135986328125, 1.4619140625, 1.615692138671875, 1.76947021484375, 1.923248291015625, 2.0770263671875, 2.230804443359375, 2.38458251953125, 2.538360595703125, 2.692138671875, 2.845916748046875, 2.99969482421875, 3.153472900390625, 3.3072509765625, 3.461029052734375, 3.61480712890625, 3.768585205078125, 3.92236328125, 4.076141357421875, 4.22991943359375, 4.383697509765625, 4.5374755859375, 4.691253662109375, 4.84503173828125, 4.998809814453125, 5.152587890625, 5.306365966796875, 5.46014404296875, 5.613922119140625, 5.7677001953125, 5.921478271484375, 6.07525634765625, 6.229034423828125, 6.3828125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 7.0, 11.0, 13.0, 17.0, 16.0, 14.0, 16.0, 19.0, 18.0, 20.0, 33.0, 30.0, 26.0, 41.0, 40.0, 52.0, 34.0, 33.0, 41.0, 44.0, 52.0, 31.0, 40.0, 34.0, 39.0, 36.0, 31.0, 30.0, 26.0, 24.0, 16.0, 23.0, 16.0, 9.0, 13.0, 10.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.470703125, -3.349639892578125, -3.22857666015625, -3.107513427734375, -2.9864501953125, -2.865386962890625, -2.74432373046875, -2.623260498046875, -2.502197265625, -2.381134033203125, -2.26007080078125, -2.139007568359375, -2.0179443359375, -1.896881103515625, -1.77581787109375, -1.654754638671875, -1.53369140625, -1.412628173828125, -1.29156494140625, -1.170501708984375, -1.0494384765625, -0.928375244140625, -0.80731201171875, -0.686248779296875, -0.565185546875, -0.444122314453125, -0.32305908203125, -0.201995849609375, -0.0809326171875, 0.040130615234375, 0.16119384765625, 0.282257080078125, 0.4033203125, 0.524383544921875, 0.64544677734375, 0.766510009765625, 0.8875732421875, 1.008636474609375, 1.12969970703125, 1.250762939453125, 1.371826171875, 1.492889404296875, 1.61395263671875, 1.735015869140625, 1.8560791015625, 1.977142333984375, 2.09820556640625, 2.219268798828125, 2.34033203125, 2.461395263671875, 2.58245849609375, 2.703521728515625, 2.8245849609375, 2.945648193359375, 3.06671142578125, 3.187774658203125, 3.308837890625, 3.429901123046875, 3.55096435546875, 3.672027587890625, 3.7930908203125, 3.914154052734375, 4.03521728515625, 4.156280517578125, 4.27734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 15.0, 8.0, 26.0, 33.0, 53.0, 77.0, 126.0, 216.0, 352.0, 757.0, 2025.0, 7289.0, 73556.0, 892236.0, 61478.0, 6675.0, 1990.0, 719.0, 353.0, 206.0, 115.0, 74.0, 43.0, 37.0, 20.0, 14.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.27734375, -4.149566650390625, -4.02178955078125, -3.894012451171875, -3.7662353515625, -3.638458251953125, -3.51068115234375, -3.382904052734375, -3.255126953125, -3.127349853515625, -2.99957275390625, -2.871795654296875, -2.7440185546875, -2.616241455078125, -2.48846435546875, -2.360687255859375, -2.23291015625, -2.105133056640625, -1.97735595703125, -1.849578857421875, -1.7218017578125, -1.594024658203125, -1.46624755859375, -1.338470458984375, -1.210693359375, -1.082916259765625, -0.95513916015625, -0.827362060546875, -0.6995849609375, -0.571807861328125, -0.44403076171875, -0.316253662109375, -0.1884765625, -0.060699462890625, 0.06707763671875, 0.194854736328125, 0.3226318359375, 0.450408935546875, 0.57818603515625, 0.705963134765625, 0.833740234375, 0.961517333984375, 1.08929443359375, 1.217071533203125, 1.3448486328125, 1.472625732421875, 1.60040283203125, 1.728179931640625, 1.85595703125, 1.983734130859375, 2.11151123046875, 2.239288330078125, 2.3670654296875, 2.494842529296875, 2.62261962890625, 2.750396728515625, 2.878173828125, 3.005950927734375, 3.13372802734375, 3.261505126953125, 3.3892822265625, 3.517059326171875, 3.64483642578125, 3.772613525390625, 3.900390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 32.0, 59.0, 79.0, 158.0, 198.0, 174.0, 124.0, 68.0, 39.0, 18.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004527568817138672, -0.0004329271614551544, -0.00041309744119644165, -0.0003932677209377289, -0.0003734380006790161, -0.00035360828042030334, -0.0003337785601615906, -0.0003139488399028778, -0.00029411911964416504, -0.00027428939938545227, -0.0002544596791267395, -0.00023462995886802673, -0.00021480023860931396, -0.0001949705183506012, -0.00017514079809188843, -0.00015531107783317566, -0.0001354813575744629, -0.00011565163731575012, -9.582191705703735e-05, -7.599219679832458e-05, -5.6162476539611816e-05, -3.633275628089905e-05, -1.650303602218628e-05, 3.3266842365264893e-06, 2.3156404495239258e-05, 4.2986124753952026e-05, 6.28158450126648e-05, 8.264556527137756e-05, 0.00010247528553009033, 0.0001223050057888031, 0.00014213472604751587, 0.00016196444630622864, 0.0001817941665649414, 0.00020162388682365417, 0.00022145360708236694, 0.0002412833273410797, 0.0002611130475997925, 0.00028094276785850525, 0.000300772488117218, 0.0003206022083759308, 0.00034043192863464355, 0.0003602616488933563, 0.0003800913691520691, 0.00039992108941078186, 0.00041975080966949463, 0.0004395805299282074, 0.00045941025018692017, 0.00047923997044563293, 0.0004990696907043457, 0.0005188994109630585, 0.0005387291312217712, 0.000558558851480484, 0.0005783885717391968, 0.0005982182919979095, 0.0006180480122566223, 0.0006378777325153351, 0.0006577074527740479, 0.0006775371730327606, 0.0006973668932914734, 0.0007171966135501862, 0.0007370263338088989, 0.0007568560540676117, 0.0007766857743263245, 0.0007965154945850372, 0.00081634521484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 20.0, 26.0, 44.0, 66.0, 109.0, 218.0, 394.0, 781.0, 2173.0, 7758.0, 57445.0, 765624.0, 193054.0, 14919.0, 3613.0, 1188.0, 472.0, 251.0, 138.0, 87.0, 48.0, 24.0, 20.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.251953125, -3.15545654296875, -3.0589599609375, -2.96246337890625, -2.865966796875, -2.76947021484375, -2.6729736328125, -2.57647705078125, -2.47998046875, -2.38348388671875, -2.2869873046875, -2.19049072265625, -2.093994140625, -1.99749755859375, -1.9010009765625, -1.80450439453125, -1.7080078125, -1.61151123046875, -1.5150146484375, -1.41851806640625, -1.322021484375, -1.22552490234375, -1.1290283203125, -1.03253173828125, -0.93603515625, -0.83953857421875, -0.7430419921875, -0.64654541015625, -0.550048828125, -0.45355224609375, -0.3570556640625, -0.26055908203125, -0.1640625, -0.06756591796875, 0.0289306640625, 0.12542724609375, 0.221923828125, 0.31842041015625, 0.4149169921875, 0.51141357421875, 0.60791015625, 0.70440673828125, 0.8009033203125, 0.89739990234375, 0.993896484375, 1.09039306640625, 1.1868896484375, 1.28338623046875, 1.3798828125, 1.47637939453125, 1.5728759765625, 1.66937255859375, 1.765869140625, 1.86236572265625, 1.9588623046875, 2.05535888671875, 2.15185546875, 2.24835205078125, 2.3448486328125, 2.44134521484375, 2.537841796875, 2.63433837890625, 2.7308349609375, 2.82733154296875, 2.923828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 9.0, 5.0, 5.0, 13.0, 19.0, 34.0, 60.0, 126.0, 169.0, 201.0, 141.0, 106.0, 43.0, 31.0, 13.0, 9.0, 3.0, 6.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.97705078125, -4.8173828125, -4.65771484375, -4.498046875, -4.33837890625, -4.1787109375, -4.01904296875, -3.859375, -3.69970703125, -3.5400390625, -3.38037109375, -3.220703125, -3.06103515625, -2.9013671875, -2.74169921875, -2.58203125, -2.42236328125, -2.2626953125, -2.10302734375, -1.943359375, -1.78369140625, -1.6240234375, -1.46435546875, -1.3046875, -1.14501953125, -0.9853515625, -0.82568359375, -0.666015625, -0.50634765625, -0.3466796875, -0.18701171875, -0.02734375, 0.13232421875, 0.2919921875, 0.45166015625, 0.611328125, 0.77099609375, 0.9306640625, 1.09033203125, 1.25, 1.40966796875, 1.5693359375, 1.72900390625, 1.888671875, 2.04833984375, 2.2080078125, 2.36767578125, 2.52734375, 2.68701171875, 2.8466796875, 3.00634765625, 3.166015625, 3.32568359375, 3.4853515625, 3.64501953125, 3.8046875, 3.96435546875, 4.1240234375, 4.28369140625, 4.443359375, 4.60302734375, 4.7626953125, 4.92236328125, 5.08203125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 9.0, 17.0, 34.0, 64.0, 113.0, 161.0, 206.0, 181.0, 102.0, 52.0, 29.0, 16.0, 9.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.5879135131836, -72.87418365478516, -71.16046142578125, -69.44673156738281, -67.73300170898438, -66.01927947998047, -64.30554962158203, -62.591819763183594, -60.87809371948242, -59.16436767578125, -57.45063781738281, -55.73691177368164, -54.02318572998047, -52.30945587158203, -50.59572982788086, -48.88200378417969, -47.16827392578125, -45.45454788208008, -43.74081802368164, -42.02709197998047, -40.3133659362793, -38.59963607788086, -36.88591003417969, -35.17218017578125, -33.458457946777344, -31.74472999572754, -30.031003952026367, -28.317276000976562, -26.603548049926758, -24.889820098876953, -23.17609405517578, -21.462366104125977, -19.748638153076172, -18.034910202026367, -16.321184158325195, -14.60745620727539, -12.893728256225586, -11.180001258850098, -9.46627426147461, -7.752546310424805, -6.038819313049316, -4.32509183883667, -2.6113646030426025, -0.8976373672485352, 0.8160901069641113, 2.529817581176758, 4.243544578552246, 5.957272529602051, 7.670999526977539, 9.384726524353027, 11.098454475402832, 12.81218147277832, 14.525909423828125, 16.239635467529297, 17.9533634185791, 19.667091369628906, 21.380817413330078, 23.094545364379883, 24.808271408081055, 26.52199935913086, 28.235727310180664, 29.94945526123047, 31.66318130493164, 33.37690734863281, 35.09063720703125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 14.0, 16.0, 13.0, 13.0, 20.0, 30.0, 26.0, 20.0, 27.0, 36.0, 36.0, 26.0, 31.0, 27.0, 59.0, 47.0, 44.0, 49.0, 52.0, 32.0, 45.0, 27.0, 29.0, 29.0, 30.0, 28.0, 31.0, 22.0, 22.0, 20.0, 14.0, 7.0, 7.0, 13.0, 4.0, 9.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.776704788208008, -20.143341064453125, -19.50997543334961, -18.876611709594727, -18.243247985839844, -17.609882354736328, -16.976518630981445, -16.343154907226562, -15.709790229797363, -15.076425552368164, -14.443061828613281, -13.809697151184082, -13.176332473754883, -12.54296875, -11.9096040725708, -11.276239395141602, -10.642875671386719, -10.00951099395752, -9.376147270202637, -8.742782592773438, -8.109418869018555, -7.4760541915893555, -6.842689514160156, -6.209325313568115, -5.575961112976074, -4.942596912384033, -4.309232711791992, -3.675868034362793, -3.042503833770752, -2.409139633178711, -1.7757751941680908, -1.1424107551574707, -0.5090446472167969, 0.12431967258453369, 0.7576839923858643, 1.3910483121871948, 2.0244126319885254, 2.6577768325805664, 3.2911412715911865, 3.9245057106018066, 4.557869911193848, 5.191234111785889, 5.82459831237793, 6.457962989807129, 7.09132719039917, 7.724691390991211, 8.35805606842041, 8.99142074584961, 9.624784469604492, 10.258149147033691, 10.891512870788574, 11.524877548217773, 12.158241271972656, 12.791605949401855, 13.424970626831055, 14.058334350585938, 14.691699028015137, 15.325063705444336, 15.958427429199219, 16.5917911529541, 17.225156784057617, 17.8585205078125, 18.491884231567383, 19.1252498626709, 19.75861358642578]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 15.0, 8.0, 12.0, 19.0, 24.0, 39.0, 59.0, 98.0, 122.0, 229.0, 344.0, 544.0, 1039.0, 1991.0, 4528.0, 14418.0, 99154.0, 4028617.0, 29190.0, 7601.0, 2923.0, 1367.0, 734.0, 433.0, 258.0, 164.0, 110.0, 79.0, 51.0, 30.0, 23.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.943359375, -3.817108154296875, -3.69085693359375, -3.564605712890625, -3.4383544921875, -3.312103271484375, -3.18585205078125, -3.059600830078125, -2.933349609375, -2.807098388671875, -2.68084716796875, -2.554595947265625, -2.4283447265625, -2.302093505859375, -2.17584228515625, -2.049591064453125, -1.92333984375, -1.797088623046875, -1.67083740234375, -1.544586181640625, -1.4183349609375, -1.292083740234375, -1.16583251953125, -1.039581298828125, -0.913330078125, -0.787078857421875, -0.66082763671875, -0.534576416015625, -0.4083251953125, -0.282073974609375, -0.15582275390625, -0.029571533203125, 0.0966796875, 0.222930908203125, 0.34918212890625, 0.475433349609375, 0.6016845703125, 0.727935791015625, 0.85418701171875, 0.980438232421875, 1.106689453125, 1.232940673828125, 1.35919189453125, 1.485443115234375, 1.6116943359375, 1.737945556640625, 1.86419677734375, 1.990447998046875, 2.11669921875, 2.242950439453125, 2.36920166015625, 2.495452880859375, 2.6217041015625, 2.747955322265625, 2.87420654296875, 3.000457763671875, 3.126708984375, 3.252960205078125, 3.37921142578125, 3.505462646484375, 3.6317138671875, 3.757965087890625, 3.88421630859375, 4.010467529296875, 4.13671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 6.0, 3.0, 7.0, 12.0, 7.0, 11.0, 27.0, 28.0, 39.0, 34.0, 60.0, 71.0, 72.0, 92.0, 90.0, 79.0, 73.0, 62.0, 52.0, 41.0, 36.0, 29.0, 15.0, 19.0, 13.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0], "bins": [-1.88671875, -1.843170166015625, -1.79962158203125, -1.756072998046875, -1.7125244140625, -1.668975830078125, -1.62542724609375, -1.581878662109375, -1.538330078125, -1.494781494140625, -1.45123291015625, -1.407684326171875, -1.3641357421875, -1.320587158203125, -1.27703857421875, -1.233489990234375, -1.18994140625, -1.146392822265625, -1.10284423828125, -1.059295654296875, -1.0157470703125, -0.972198486328125, -0.92864990234375, -0.885101318359375, -0.841552734375, -0.798004150390625, -0.75445556640625, -0.710906982421875, -0.6673583984375, -0.623809814453125, -0.58026123046875, -0.536712646484375, -0.4931640625, -0.449615478515625, -0.40606689453125, -0.362518310546875, -0.3189697265625, -0.275421142578125, -0.23187255859375, -0.188323974609375, -0.144775390625, -0.101226806640625, -0.05767822265625, -0.014129638671875, 0.0294189453125, 0.072967529296875, 0.11651611328125, 0.160064697265625, 0.20361328125, 0.247161865234375, 0.29071044921875, 0.334259033203125, 0.3778076171875, 0.421356201171875, 0.46490478515625, 0.508453369140625, 0.552001953125, 0.595550537109375, 0.63909912109375, 0.682647705078125, 0.7261962890625, 0.769744873046875, 0.81329345703125, 0.856842041015625, 0.900390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 9.0, 10.0, 10.0, 16.0, 21.0, 31.0, 52.0, 53.0, 82.0, 124.0, 144.0, 207.0, 326.0, 394.0, 587.0, 886.0, 1449.0, 2705.0, 5562.0, 15010.0, 81207.0, 4017004.0, 46117.0, 11456.0, 4447.0, 2284.0, 1347.0, 856.0, 537.0, 390.0, 266.0, 184.0, 122.0, 100.0, 77.0, 51.0, 41.0, 22.0, 17.0, 9.0, 13.0, 13.0, 10.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.3828125, -7.15478515625, -6.9267578125, -6.69873046875, -6.470703125, -6.24267578125, -6.0146484375, -5.78662109375, -5.55859375, -5.33056640625, -5.1025390625, -4.87451171875, -4.646484375, -4.41845703125, -4.1904296875, -3.96240234375, -3.734375, -3.50634765625, -3.2783203125, -3.05029296875, -2.822265625, -2.59423828125, -2.3662109375, -2.13818359375, -1.91015625, -1.68212890625, -1.4541015625, -1.22607421875, -0.998046875, -0.77001953125, -0.5419921875, -0.31396484375, -0.0859375, 0.14208984375, 0.3701171875, 0.59814453125, 0.826171875, 1.05419921875, 1.2822265625, 1.51025390625, 1.73828125, 1.96630859375, 2.1943359375, 2.42236328125, 2.650390625, 2.87841796875, 3.1064453125, 3.33447265625, 3.5625, 3.79052734375, 4.0185546875, 4.24658203125, 4.474609375, 4.70263671875, 4.9306640625, 5.15869140625, 5.38671875, 5.61474609375, 5.8427734375, 6.07080078125, 6.298828125, 6.52685546875, 6.7548828125, 6.98291015625, 7.2109375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 4.0, 12.0, 9.0, 14.0, 22.0, 62.0, 366.0, 3382.0, 98.0, 37.0, 17.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.587890625, -2.5199127197265625, -2.451934814453125, -2.3839569091796875, -2.31597900390625, -2.2480010986328125, -2.180023193359375, -2.1120452880859375, -2.0440673828125, -1.9760894775390625, -1.908111572265625, -1.8401336669921875, -1.77215576171875, -1.7041778564453125, -1.636199951171875, -1.5682220458984375, -1.500244140625, -1.4322662353515625, -1.364288330078125, -1.2963104248046875, -1.22833251953125, -1.1603546142578125, -1.092376708984375, -1.0243988037109375, -0.9564208984375, -0.8884429931640625, -0.820465087890625, -0.7524871826171875, -0.68450927734375, -0.6165313720703125, -0.548553466796875, -0.4805755615234375, -0.41259765625, -0.3446197509765625, -0.276641845703125, -0.2086639404296875, -0.14068603515625, -0.0727081298828125, -0.004730224609375, 0.0632476806640625, 0.1312255859375, 0.1992034912109375, 0.267181396484375, 0.3351593017578125, 0.40313720703125, 0.4711151123046875, 0.539093017578125, 0.6070709228515625, 0.675048828125, 0.7430267333984375, 0.811004638671875, 0.8789825439453125, 0.94696044921875, 1.0149383544921875, 1.082916259765625, 1.1508941650390625, 1.2188720703125, 1.2868499755859375, 1.354827880859375, 1.4228057861328125, 1.49078369140625, 1.5587615966796875, 1.626739501953125, 1.6947174072265625, 1.7626953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 7.0, 1.0, 7.0, 9.0, 20.0, 42.0, 61.0, 90.0, 146.0, 194.0, 174.0, 124.0, 66.0, 32.0, 17.0, 8.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.433637619018555, -14.051681518554688, -13.669726371765137, -13.28777027130127, -12.905814170837402, -12.523858070373535, -12.141902923583984, -11.759946823120117, -11.37799072265625, -10.996034622192383, -10.614079475402832, -10.232123374938965, -9.850167274475098, -9.46821117401123, -9.08625602722168, -8.704299926757812, -8.322343826293945, -7.940388202667236, -7.558432102203369, -7.17647647857666, -6.794520378112793, -6.412564754486084, -6.030609130859375, -5.648653030395508, -5.266697883605957, -4.884742259979248, -4.502786159515381, -4.120830535888672, -3.7388744354248047, -3.3569188117980957, -2.9749629497528076, -2.5930070877075195, -2.2110509872436523, -1.8290951251983643, -1.4471392631530762, -1.0651835203170776, -0.6832276582717896, -0.30127179622650146, 0.08068394660949707, 0.46263980865478516, 0.8445956707000732, 1.2265515327453613, 1.6085073947906494, 1.990463137626648, 2.3724188804626465, 2.7543749809265137, 3.1363306045532227, 3.5182864665985107, 3.900242328643799, 4.282197952270508, 4.664154052734375, 5.046109676361084, 5.428065776824951, 5.81002140045166, 6.191977500915527, 6.573933124542236, 6.955888748168945, 7.337844371795654, 7.7198004722595215, 8.10175609588623, 8.483712196350098, 8.865668296813965, 9.247623443603516, 9.629579544067383, 10.01153564453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 5.0, 6.0, 6.0, 8.0, 16.0, 14.0, 17.0, 18.0, 15.0, 17.0, 26.0, 28.0, 29.0, 35.0, 41.0, 35.0, 39.0, 48.0, 51.0, 49.0, 37.0, 45.0, 46.0, 42.0, 42.0, 32.0, 27.0, 25.0, 30.0, 22.0, 29.0, 16.0, 18.0, 13.0, 13.0, 14.0, 10.0, 8.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.744624614715576, -3.6153879165649414, -3.4861512184143066, -3.356914758682251, -3.227678060531616, -3.0984413623809814, -2.969204902648926, -2.839968204498291, -2.7107315063476562, -2.5814948081970215, -2.4522581100463867, -2.323021650314331, -2.1937849521636963, -2.0645482540130615, -1.9353116750717163, -1.806075096130371, -1.6768383979797363, -1.5476016998291016, -1.4183651208877563, -1.2891285419464111, -1.1598918437957764, -1.0306551456451416, -0.9014185667037964, -0.7721819281578064, -0.6429452896118164, -0.5137086510658264, -0.3844720125198364, -0.25523537397384644, -0.12599873542785645, 0.003237903118133545, 0.13247454166412354, 0.2617111802101135, 0.3909473419189453, 0.5201839804649353, 0.6494206190109253, 0.7786572575569153, 0.9078938961029053, 1.03713059425354, 1.1663671731948853, 1.2956037521362305, 1.4248404502868652, 1.5540771484375, 1.6833137273788452, 1.8125503063201904, 1.9417870044708252, 2.07102370262146, 2.2002601623535156, 2.3294968605041504, 2.458733558654785, 2.58797025680542, 2.7172069549560547, 2.8464434146881104, 2.975680112838745, 3.10491681098938, 3.2341532707214355, 3.3633899688720703, 3.492626667022705, 3.62186336517334, 3.7511000633239746, 3.8803365230560303, 4.009572982788086, 4.138809680938721, 4.2680463790893555, 4.39728307723999, 4.526519775390625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 14.0, 27.0, 21.0, 15.0, 38.0, 67.0, 78.0, 103.0, 186.0, 213.0, 348.0, 582.0, 886.0, 1460.0, 2340.0, 4163.0, 7424.0, 14245.0, 27821.0, 56742.0, 120447.0, 230341.0, 267519.0, 159495.0, 76801.0, 36517.0, 18137.0, 9493.0, 5150.0, 2992.0, 1751.0, 1057.0, 699.0, 418.0, 311.0, 189.0, 117.0, 91.0, 76.0, 53.0, 30.0, 27.0, 20.0, 10.0, 12.0, 6.0, 1.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.240234375, -2.166046142578125, -2.09185791015625, -2.017669677734375, -1.9434814453125, -1.869293212890625, -1.79510498046875, -1.720916748046875, -1.646728515625, -1.572540283203125, -1.49835205078125, -1.424163818359375, -1.3499755859375, -1.275787353515625, -1.20159912109375, -1.127410888671875, -1.05322265625, -0.979034423828125, -0.90484619140625, -0.830657958984375, -0.7564697265625, -0.682281494140625, -0.60809326171875, -0.533905029296875, -0.459716796875, -0.385528564453125, -0.31134033203125, -0.237152099609375, -0.1629638671875, -0.088775634765625, -0.01458740234375, 0.059600830078125, 0.1337890625, 0.207977294921875, 0.28216552734375, 0.356353759765625, 0.4305419921875, 0.504730224609375, 0.57891845703125, 0.653106689453125, 0.727294921875, 0.801483154296875, 0.87567138671875, 0.949859619140625, 1.0240478515625, 1.098236083984375, 1.17242431640625, 1.246612548828125, 1.32080078125, 1.394989013671875, 1.46917724609375, 1.543365478515625, 1.6175537109375, 1.691741943359375, 1.76593017578125, 1.840118408203125, 1.914306640625, 1.988494873046875, 2.06268310546875, 2.136871337890625, 2.2110595703125, 2.285247802734375, 2.35943603515625, 2.433624267578125, 2.5078125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 9.0, 5.0, 8.0, 7.0, 7.0, 10.0, 15.0, 11.0, 27.0, 18.0, 41.0, 50.0, 42.0, 57.0, 63.0, 64.0, 86.0, 64.0, 71.0, 55.0, 49.0, 37.0, 45.0, 30.0, 28.0, 26.0, 22.0, 16.0, 17.0, 9.0, 7.0, 10.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8251953125, -1.7757720947265625, -1.726348876953125, -1.6769256591796875, -1.62750244140625, -1.5780792236328125, -1.528656005859375, -1.4792327880859375, -1.4298095703125, -1.3803863525390625, -1.330963134765625, -1.2815399169921875, -1.23211669921875, -1.1826934814453125, -1.133270263671875, -1.0838470458984375, -1.034423828125, -0.9850006103515625, -0.935577392578125, -0.8861541748046875, -0.83673095703125, -0.7873077392578125, -0.737884521484375, -0.6884613037109375, -0.6390380859375, -0.5896148681640625, -0.540191650390625, -0.4907684326171875, -0.44134521484375, -0.3919219970703125, -0.342498779296875, -0.2930755615234375, -0.24365234375, -0.1942291259765625, -0.144805908203125, -0.0953826904296875, -0.04595947265625, 0.0034637451171875, 0.052886962890625, 0.1023101806640625, 0.1517333984375, 0.2011566162109375, 0.250579833984375, 0.3000030517578125, 0.34942626953125, 0.3988494873046875, 0.448272705078125, 0.4976959228515625, 0.547119140625, 0.5965423583984375, 0.645965576171875, 0.6953887939453125, 0.74481201171875, 0.7942352294921875, 0.843658447265625, 0.8930816650390625, 0.9425048828125, 0.9919281005859375, 1.041351318359375, 1.0907745361328125, 1.14019775390625, 1.1896209716796875, 1.239044189453125, 1.2884674072265625, 1.337890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 17.0, 17.0, 24.0, 34.0, 63.0, 90.0, 176.0, 352.0, 811.0, 2568.0, 9258.0, 52966.0, 533361.0, 398287.0, 39330.0, 7546.0, 2146.0, 740.0, 319.0, 163.0, 102.0, 66.0, 36.0, 25.0, 10.0, 16.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5546875, -6.28076171875, -6.0068359375, -5.73291015625, -5.458984375, -5.18505859375, -4.9111328125, -4.63720703125, -4.36328125, -4.08935546875, -3.8154296875, -3.54150390625, -3.267578125, -2.99365234375, -2.7197265625, -2.44580078125, -2.171875, -1.89794921875, -1.6240234375, -1.35009765625, -1.076171875, -0.80224609375, -0.5283203125, -0.25439453125, 0.01953125, 0.29345703125, 0.5673828125, 0.84130859375, 1.115234375, 1.38916015625, 1.6630859375, 1.93701171875, 2.2109375, 2.48486328125, 2.7587890625, 3.03271484375, 3.306640625, 3.58056640625, 3.8544921875, 4.12841796875, 4.40234375, 4.67626953125, 4.9501953125, 5.22412109375, 5.498046875, 5.77197265625, 6.0458984375, 6.31982421875, 6.59375, 6.86767578125, 7.1416015625, 7.41552734375, 7.689453125, 7.96337890625, 8.2373046875, 8.51123046875, 8.78515625, 9.05908203125, 9.3330078125, 9.60693359375, 9.880859375, 10.15478515625, 10.4287109375, 10.70263671875, 10.9765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 7.0, 6.0, 6.0, 6.0, 10.0, 19.0, 26.0, 27.0, 37.0, 37.0, 34.0, 40.0, 54.0, 53.0, 48.0, 64.0, 67.0, 44.0, 51.0, 60.0, 43.0, 37.0, 36.0, 34.0, 30.0, 16.0, 19.0, 13.0, 12.0, 13.0, 7.0, 12.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.6953125, -8.45477294921875, -8.2142333984375, -7.97369384765625, -7.733154296875, -7.49261474609375, -7.2520751953125, -7.01153564453125, -6.77099609375, -6.53045654296875, -6.2899169921875, -6.04937744140625, -5.808837890625, -5.56829833984375, -5.3277587890625, -5.08721923828125, -4.8466796875, -4.60614013671875, -4.3656005859375, -4.12506103515625, -3.884521484375, -3.64398193359375, -3.4034423828125, -3.16290283203125, -2.92236328125, -2.68182373046875, -2.4412841796875, -2.20074462890625, -1.960205078125, -1.71966552734375, -1.4791259765625, -1.23858642578125, -0.998046875, -0.75750732421875, -0.5169677734375, -0.27642822265625, -0.035888671875, 0.20465087890625, 0.4451904296875, 0.68572998046875, 0.92626953125, 1.16680908203125, 1.4073486328125, 1.64788818359375, 1.888427734375, 2.12896728515625, 2.3695068359375, 2.61004638671875, 2.8505859375, 3.09112548828125, 3.3316650390625, 3.57220458984375, 3.812744140625, 4.05328369140625, 4.2938232421875, 4.53436279296875, 4.77490234375, 5.01544189453125, 5.2559814453125, 5.49652099609375, 5.737060546875, 5.97760009765625, 6.2181396484375, 6.45867919921875, 6.69921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 5.0, 1.0, 10.0, 9.0, 8.0, 12.0, 24.0, 33.0, 46.0, 59.0, 92.0, 115.0, 201.0, 318.0, 500.0, 976.0, 2180.0, 5601.0, 19951.0, 124984.0, 686867.0, 170479.0, 24405.0, 6589.0, 2358.0, 1132.0, 564.0, 333.0, 219.0, 133.0, 108.0, 64.0, 44.0, 28.0, 24.0, 13.0, 13.0, 11.0, 11.0, 3.0, 11.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.0546875, -2.957916259765625, -2.86114501953125, -2.764373779296875, -2.6676025390625, -2.570831298828125, -2.47406005859375, -2.377288818359375, -2.280517578125, -2.183746337890625, -2.08697509765625, -1.990203857421875, -1.8934326171875, -1.796661376953125, -1.69989013671875, -1.603118896484375, -1.50634765625, -1.409576416015625, -1.31280517578125, -1.216033935546875, -1.1192626953125, -1.022491455078125, -0.92572021484375, -0.828948974609375, -0.732177734375, -0.635406494140625, -0.53863525390625, -0.441864013671875, -0.3450927734375, -0.248321533203125, -0.15155029296875, -0.054779052734375, 0.0419921875, 0.138763427734375, 0.23553466796875, 0.332305908203125, 0.4290771484375, 0.525848388671875, 0.62261962890625, 0.719390869140625, 0.816162109375, 0.912933349609375, 1.00970458984375, 1.106475830078125, 1.2032470703125, 1.300018310546875, 1.39678955078125, 1.493560791015625, 1.59033203125, 1.687103271484375, 1.78387451171875, 1.880645751953125, 1.9774169921875, 2.074188232421875, 2.17095947265625, 2.267730712890625, 2.364501953125, 2.461273193359375, 2.55804443359375, 2.654815673828125, 2.7515869140625, 2.848358154296875, 2.94512939453125, 3.041900634765625, 3.138671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 18.0, 16.0, 35.0, 46.0, 93.0, 114.0, 161.0, 163.0, 139.0, 72.0, 44.0, 37.0, 15.0, 4.0, 8.0, 5.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004634857177734375, -0.00044229626655578613, -0.00042110681533813477, -0.0003999173641204834, -0.00037872791290283203, -0.00035753846168518066, -0.0003363490104675293, -0.00031515955924987793, -0.00029397010803222656, -0.0002727806568145752, -0.00025159120559692383, -0.00023040175437927246, -0.0002092123031616211, -0.00018802285194396973, -0.00016683340072631836, -0.000145643949508667, -0.00012445449829101562, -0.00010326504707336426, -8.207559585571289e-05, -6.0886144638061523e-05, -3.9696693420410156e-05, -1.850724220275879e-05, 2.682209014892578e-06, 2.3871660232543945e-05, 4.506111145019531e-05, 6.625056266784668e-05, 8.744001388549805e-05, 0.00010862946510314941, 0.00012981891632080078, 0.00015100836753845215, 0.00017219781875610352, 0.00019338726997375488, 0.00021457672119140625, 0.00023576617240905762, 0.000256955623626709, 0.00027814507484436035, 0.0002993345260620117, 0.0003205239772796631, 0.00034171342849731445, 0.0003629028797149658, 0.0003840923309326172, 0.00040528178215026855, 0.0004264712333679199, 0.0004476606845855713, 0.00046885013580322266, 0.000490039587020874, 0.0005112290382385254, 0.0005324184894561768, 0.0005536079406738281, 0.0005747973918914795, 0.0005959868431091309, 0.0006171762943267822, 0.0006383657455444336, 0.000659555196762085, 0.0006807446479797363, 0.0007019340991973877, 0.0007231235504150391, 0.0007443130016326904, 0.0007655024528503418, 0.0007866919040679932, 0.0008078813552856445, 0.0008290708065032959, 0.0008502602577209473, 0.0008714497089385986, 0.00089263916015625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 6.0, 13.0, 8.0, 20.0, 23.0, 38.0, 48.0, 90.0, 144.0, 237.0, 540.0, 1256.0, 3819.0, 17071.0, 228786.0, 734936.0, 50384.0, 7463.0, 2037.0, 778.0, 373.0, 178.0, 109.0, 57.0, 57.0, 25.0, 19.0, 14.0, 11.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.0223388671875, -2.892333984375, -2.7623291015625, -2.63232421875, -2.5023193359375, -2.372314453125, -2.2423095703125, -2.1123046875, -1.9822998046875, -1.852294921875, -1.7222900390625, -1.59228515625, -1.4622802734375, -1.332275390625, -1.2022705078125, -1.072265625, -0.9422607421875, -0.812255859375, -0.6822509765625, -0.55224609375, -0.4222412109375, -0.292236328125, -0.1622314453125, -0.0322265625, 0.0977783203125, 0.227783203125, 0.3577880859375, 0.48779296875, 0.6177978515625, 0.747802734375, 0.8778076171875, 1.0078125, 1.1378173828125, 1.267822265625, 1.3978271484375, 1.52783203125, 1.6578369140625, 1.787841796875, 1.9178466796875, 2.0478515625, 2.1778564453125, 2.307861328125, 2.4378662109375, 2.56787109375, 2.6978759765625, 2.827880859375, 2.9578857421875, 3.087890625, 3.2178955078125, 3.347900390625, 3.4779052734375, 3.60791015625, 3.7379150390625, 3.867919921875, 3.9979248046875, 4.1279296875, 4.2579345703125, 4.387939453125, 4.5179443359375, 4.64794921875, 4.7779541015625, 4.907958984375, 5.0379638671875, 5.16796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 10.0, 9.0, 24.0, 17.0, 33.0, 41.0, 71.0, 86.0, 96.0, 80.0, 94.0, 85.0, 88.0, 68.0, 51.0, 41.0, 23.0, 20.0, 16.0, 11.0, 7.0, 5.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.461822509765625, -3.36309814453125, -3.264373779296875, -3.1656494140625, -3.066925048828125, -2.96820068359375, -2.869476318359375, -2.770751953125, -2.672027587890625, -2.57330322265625, -2.474578857421875, -2.3758544921875, -2.277130126953125, -2.17840576171875, -2.079681396484375, -1.98095703125, -1.882232666015625, -1.78350830078125, -1.684783935546875, -1.5860595703125, -1.487335205078125, -1.38861083984375, -1.289886474609375, -1.191162109375, -1.092437744140625, -0.99371337890625, -0.894989013671875, -0.7962646484375, -0.697540283203125, -0.59881591796875, -0.500091552734375, -0.4013671875, -0.302642822265625, -0.20391845703125, -0.105194091796875, -0.0064697265625, 0.092254638671875, 0.19097900390625, 0.289703369140625, 0.388427734375, 0.487152099609375, 0.58587646484375, 0.684600830078125, 0.7833251953125, 0.882049560546875, 0.98077392578125, 1.079498291015625, 1.17822265625, 1.276947021484375, 1.37567138671875, 1.474395751953125, 1.5731201171875, 1.671844482421875, 1.77056884765625, 1.869293212890625, 1.968017578125, 2.066741943359375, 2.16546630859375, 2.264190673828125, 2.3629150390625, 2.461639404296875, 2.56036376953125, 2.659088134765625, 2.7578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 15.0, 25.0, 106.0, 250.0, 320.0, 179.0, 80.0, 18.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-172.21542358398438, -168.31869506835938, -164.42196655273438, -160.5252227783203, -156.6284942626953, -152.7317657470703, -148.8350372314453, -144.93829345703125, -141.04156494140625, -137.14483642578125, -133.24810791015625, -129.3513641357422, -125.45463562011719, -121.55790710449219, -117.66117858886719, -113.76444244384766, -109.86771392822266, -105.97098541259766, -102.07424926757812, -98.17752075195312, -94.2807846069336, -90.3840560913086, -86.48731994628906, -82.59059143066406, -78.69386291503906, -74.79713439941406, -70.90039825439453, -67.00366973876953, -63.10693359375, -59.210205078125, -55.313472747802734, -51.41674041748047, -47.52001190185547, -43.6232795715332, -39.72654724121094, -35.82981872558594, -31.93308448791504, -28.036352157592773, -24.13962173461914, -20.242889404296875, -16.34615707397461, -12.449424743652344, -8.552693367004395, -4.655961990356445, -0.7592296600341797, 3.137502670288086, 7.034233093261719, 10.930965423583984, 14.82769775390625, 18.724430084228516, 22.62116241455078, 26.517892837524414, 30.41462516784668, 34.31135559082031, 38.20808792114258, 42.104820251464844, 46.00155258178711, 49.898284912109375, 53.79501724243164, 57.691749572753906, 61.588478088378906, 65.48521423339844, 69.38194274902344, 73.27867126464844, 77.17540740966797]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 10.0, 5.0, 12.0, 13.0, 21.0, 22.0, 19.0, 24.0, 27.0, 35.0, 36.0, 41.0, 46.0, 52.0, 55.0, 59.0, 58.0, 64.0, 62.0, 35.0, 47.0, 32.0, 32.0, 32.0, 26.0, 29.0, 19.0, 17.0, 12.0, 14.0, 9.0, 10.0, 3.0, 1.0, 8.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.93239974975586, -28.862197875976562, -27.7919979095459, -26.7217960357666, -25.651594161987305, -24.58139419555664, -23.511192321777344, -22.440990447998047, -21.37078857421875, -20.300586700439453, -19.23038673400879, -18.160184860229492, -17.089982986450195, -16.01978302001953, -14.949581146240234, -13.879379272460938, -12.809179306030273, -11.738978385925293, -10.668776512145996, -9.598575592041016, -8.528373718261719, -7.458172798156738, -6.387971878051758, -5.317770481109619, -4.2475690841674805, -3.177367687225342, -2.1071665287017822, -1.0369653701782227, 0.033236026763916016, 1.1034374237060547, 2.173638343811035, 3.243839740753174, 4.3140411376953125, 5.384242534637451, 6.45444393157959, 7.52464485168457, 8.594846725463867, 9.665047645568848, 10.735248565673828, 11.805450439453125, 12.875651359558105, 13.945852279663086, 15.016054153442383, 16.086254119873047, 17.156455993652344, 18.22665786743164, 19.296859741210938, 20.3670597076416, 21.4372615814209, 22.507463455200195, 23.57766342163086, 24.647865295410156, 25.718067169189453, 26.78826904296875, 27.858469009399414, 28.92867088317871, 29.998870849609375, 31.069072723388672, 32.13927459716797, 33.20947265625, 34.2796745300293, 35.349876403808594, 36.42007827758789, 37.49028015136719, 38.560482025146484]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 1.0, 6.0, 5.0, 6.0, 14.0, 19.0, 23.0, 49.0, 62.0, 127.0, 199.0, 386.0, 747.0, 1773.0, 4900.0, 30886.0, 4134614.0, 14250.0, 3450.0, 1316.0, 640.0, 336.0, 185.0, 99.0, 71.0, 38.0, 18.0, 21.0, 11.0, 6.0, 6.0, 9.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.6378173828125, -9.330322265625, -9.0228271484375, -8.71533203125, -8.4078369140625, -8.100341796875, -7.7928466796875, -7.4853515625, -7.1778564453125, -6.870361328125, -6.5628662109375, -6.25537109375, -5.9478759765625, -5.640380859375, -5.3328857421875, -5.025390625, -4.7178955078125, -4.410400390625, -4.1029052734375, -3.79541015625, -3.4879150390625, -3.180419921875, -2.8729248046875, -2.5654296875, -2.2579345703125, -1.950439453125, -1.6429443359375, -1.33544921875, -1.0279541015625, -0.720458984375, -0.4129638671875, -0.10546875, 0.2020263671875, 0.509521484375, 0.8170166015625, 1.12451171875, 1.4320068359375, 1.739501953125, 2.0469970703125, 2.3544921875, 2.6619873046875, 2.969482421875, 3.2769775390625, 3.58447265625, 3.8919677734375, 4.199462890625, 4.5069580078125, 4.814453125, 5.1219482421875, 5.429443359375, 5.7369384765625, 6.04443359375, 6.3519287109375, 6.659423828125, 6.9669189453125, 7.2744140625, 7.5819091796875, 7.889404296875, 8.1968994140625, 8.50439453125, 8.8118896484375, 9.119384765625, 9.4268798828125, 9.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 15.0, 10.0, 19.0, 19.0, 24.0, 36.0, 42.0, 79.0, 73.0, 109.0, 88.0, 91.0, 89.0, 80.0, 62.0, 43.0, 32.0, 25.0, 20.0, 10.0, 8.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.38671875, -2.306549072265625, -2.22637939453125, -2.146209716796875, -2.0660400390625, -1.985870361328125, -1.90570068359375, -1.825531005859375, -1.745361328125, -1.665191650390625, -1.58502197265625, -1.504852294921875, -1.4246826171875, -1.344512939453125, -1.26434326171875, -1.184173583984375, -1.10400390625, -1.023834228515625, -0.94366455078125, -0.863494873046875, -0.7833251953125, -0.703155517578125, -0.62298583984375, -0.542816162109375, -0.462646484375, -0.382476806640625, -0.30230712890625, -0.222137451171875, -0.1419677734375, -0.061798095703125, 0.01837158203125, 0.098541259765625, 0.1787109375, 0.258880615234375, 0.33905029296875, 0.419219970703125, 0.4993896484375, 0.579559326171875, 0.65972900390625, 0.739898681640625, 0.820068359375, 0.900238037109375, 0.98040771484375, 1.060577392578125, 1.1407470703125, 1.220916748046875, 1.30108642578125, 1.381256103515625, 1.46142578125, 1.541595458984375, 1.62176513671875, 1.701934814453125, 1.7821044921875, 1.862274169921875, 1.94244384765625, 2.022613525390625, 2.102783203125, 2.182952880859375, 2.26312255859375, 2.343292236328125, 2.4234619140625, 2.503631591796875, 2.58380126953125, 2.663970947265625, 2.744140625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 4.0, 13.0, 14.0, 19.0, 19.0, 23.0, 35.0, 50.0, 67.0, 116.0, 156.0, 231.0, 355.0, 522.0, 742.0, 1131.0, 1688.0, 2876.0, 5554.0, 14746.0, 177759.0, 3955611.0, 17787.0, 6049.0, 3100.0, 1873.0, 1185.0, 801.0, 526.0, 368.0, 251.0, 167.0, 126.0, 101.0, 63.0, 48.0, 30.0, 27.0, 17.0, 7.0, 9.0, 4.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6875, -7.41357421875, -7.1396484375, -6.86572265625, -6.591796875, -6.31787109375, -6.0439453125, -5.77001953125, -5.49609375, -5.22216796875, -4.9482421875, -4.67431640625, -4.400390625, -4.12646484375, -3.8525390625, -3.57861328125, -3.3046875, -3.03076171875, -2.7568359375, -2.48291015625, -2.208984375, -1.93505859375, -1.6611328125, -1.38720703125, -1.11328125, -0.83935546875, -0.5654296875, -0.29150390625, -0.017578125, 0.25634765625, 0.5302734375, 0.80419921875, 1.078125, 1.35205078125, 1.6259765625, 1.89990234375, 2.173828125, 2.44775390625, 2.7216796875, 2.99560546875, 3.26953125, 3.54345703125, 3.8173828125, 4.09130859375, 4.365234375, 4.63916015625, 4.9130859375, 5.18701171875, 5.4609375, 5.73486328125, 6.0087890625, 6.28271484375, 6.556640625, 6.83056640625, 7.1044921875, 7.37841796875, 7.65234375, 7.92626953125, 8.2001953125, 8.47412109375, 8.748046875, 9.02197265625, 9.2958984375, 9.56982421875, 9.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 17.0, 23.0, 61.0, 3721.0, 150.0, 26.0, 17.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.20831298828125, -2.1314697265625, -2.05462646484375, -1.977783203125, -1.90093994140625, -1.8240966796875, -1.74725341796875, -1.67041015625, -1.59356689453125, -1.5167236328125, -1.43988037109375, -1.363037109375, -1.28619384765625, -1.2093505859375, -1.13250732421875, -1.0556640625, -0.97882080078125, -0.9019775390625, -0.82513427734375, -0.748291015625, -0.67144775390625, -0.5946044921875, -0.51776123046875, -0.44091796875, -0.36407470703125, -0.2872314453125, -0.21038818359375, -0.133544921875, -0.05670166015625, 0.0201416015625, 0.09698486328125, 0.173828125, 0.25067138671875, 0.3275146484375, 0.40435791015625, 0.481201171875, 0.55804443359375, 0.6348876953125, 0.71173095703125, 0.78857421875, 0.86541748046875, 0.9422607421875, 1.01910400390625, 1.095947265625, 1.17279052734375, 1.2496337890625, 1.32647705078125, 1.4033203125, 1.48016357421875, 1.5570068359375, 1.63385009765625, 1.710693359375, 1.78753662109375, 1.8643798828125, 1.94122314453125, 2.01806640625, 2.09490966796875, 2.1717529296875, 2.24859619140625, 2.325439453125, 2.40228271484375, 2.4791259765625, 2.55596923828125, 2.6328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 8.0, 9.0, 31.0, 67.0, 177.0, 192.0, 211.0, 134.0, 81.0, 47.0, 20.0, 10.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.363758087158203, -17.943307876586914, -17.522857666015625, -17.10240936279297, -16.68195915222168, -16.26150894165039, -15.841058731079102, -15.420608520507812, -15.000158309936523, -14.579708099365234, -14.159258842468262, -13.738808631896973, -13.318358421325684, -12.897909164428711, -12.477458953857422, -12.057008743286133, -11.63655948638916, -11.216109275817871, -10.795660018920898, -10.37520980834961, -9.95475959777832, -9.534309387207031, -9.113860130310059, -8.69340991973877, -8.272960662841797, -7.852510929107666, -7.432060718536377, -7.011610984802246, -6.591160774230957, -6.170711040496826, -5.750261306762695, -5.329811096191406, -4.909359931945801, -4.48891019821167, -4.068459987640381, -3.64801025390625, -3.22756028175354, -2.80711030960083, -2.386660575866699, -1.9662106037139893, -1.5457606315612793, -1.1253106594085693, -0.7048608064651489, -0.2844109535217285, 0.13603901863098145, 0.5564889907836914, 0.9769387245178223, 1.3973886966705322, 1.8178386688232422, 2.238288640975952, 2.658738613128662, 3.079188346862793, 3.499638319015503, 3.920088291168213, 4.340538024902344, 4.760988235473633, 5.181437969207764, 5.6018877029418945, 6.022337913513184, 6.4427876472473145, 6.863237380981445, 7.283687591552734, 7.704137325286865, 8.124587059020996, 8.545037269592285]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 8.0, 9.0, 8.0, 8.0, 12.0, 9.0, 16.0, 18.0, 21.0, 24.0, 17.0, 27.0, 26.0, 32.0, 28.0, 36.0, 32.0, 37.0, 45.0, 29.0, 34.0, 33.0, 49.0, 41.0, 37.0, 40.0, 29.0, 38.0, 29.0, 24.0, 29.0, 33.0, 19.0, 21.0, 12.0, 16.0, 16.0, 10.0, 5.0, 9.0, 6.0, 3.0, 3.0, 6.0, 5.0, 3.0, 5.0, 4.0, 1.0], "bins": [-4.406777858734131, -4.285886764526367, -4.1649956703186035, -4.04410457611084, -3.923213481903076, -3.8023223876953125, -3.681431293487549, -3.560540199279785, -3.4396491050720215, -3.318758010864258, -3.197866916656494, -3.0769758224487305, -2.956084728240967, -2.835193634033203, -2.7143025398254395, -2.593411445617676, -2.472520351409912, -2.3516292572021484, -2.2307381629943848, -2.109847068786621, -1.9889559745788574, -1.8680648803710938, -1.74717378616333, -1.6262826919555664, -1.5053918361663818, -1.3845007419586182, -1.2636096477508545, -1.1427185535430908, -1.0218274593353271, -0.9009364247322083, -0.7800453305244446, -0.6591542363166809, -0.5382630825042725, -0.4173719882965088, -0.2964808940887451, -0.17558982968330383, -0.05469873547554016, 0.06619232892990112, 0.1870834231376648, 0.30797451734542847, 0.42886561155319214, 0.5497567057609558, 0.6706477999687195, 0.7915388345718384, 0.912429928779602, 1.0333210229873657, 1.1542121171951294, 1.275103211402893, 1.3959943056106567, 1.5168853998184204, 1.637776494026184, 1.7586675882339478, 1.8795586824417114, 2.0004496574401855, 2.121340751647949, 2.242231845855713, 2.3631229400634766, 2.4840140342712402, 2.604905128479004, 2.7257962226867676, 2.8466873168945312, 2.967578411102295, 3.0884695053100586, 3.2093605995178223, 3.330251693725586]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 10.0, 13.0, 10.0, 19.0, 34.0, 52.0, 98.0, 130.0, 274.0, 407.0, 820.0, 1864.0, 4650.0, 13536.0, 46968.0, 199232.0, 529657.0, 185852.0, 44070.0, 12881.0, 4278.0, 1850.0, 854.0, 413.0, 213.0, 125.0, 76.0, 49.0, 34.0, 19.0, 15.0, 15.0, 14.0, 9.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-6.4453125, -6.26861572265625, -6.0919189453125, -5.91522216796875, -5.738525390625, -5.56182861328125, -5.3851318359375, -5.20843505859375, -5.03173828125, -4.85504150390625, -4.6783447265625, -4.50164794921875, -4.324951171875, -4.14825439453125, -3.9715576171875, -3.79486083984375, -3.6181640625, -3.44146728515625, -3.2647705078125, -3.08807373046875, -2.911376953125, -2.73468017578125, -2.5579833984375, -2.38128662109375, -2.20458984375, -2.02789306640625, -1.8511962890625, -1.67449951171875, -1.497802734375, -1.32110595703125, -1.1444091796875, -0.96771240234375, -0.791015625, -0.61431884765625, -0.4376220703125, -0.26092529296875, -0.084228515625, 0.09246826171875, 0.2691650390625, 0.44586181640625, 0.62255859375, 0.79925537109375, 0.9759521484375, 1.15264892578125, 1.329345703125, 1.50604248046875, 1.6827392578125, 1.85943603515625, 2.0361328125, 2.21282958984375, 2.3895263671875, 2.56622314453125, 2.742919921875, 2.91961669921875, 3.0963134765625, 3.27301025390625, 3.44970703125, 3.62640380859375, 3.8031005859375, 3.97979736328125, 4.156494140625, 4.33319091796875, 4.5098876953125, 4.68658447265625, 4.86328125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 15.0, 15.0, 23.0, 22.0, 32.0, 41.0, 55.0, 75.0, 80.0, 89.0, 98.0, 75.0, 69.0, 75.0, 61.0, 46.0, 38.0, 26.0, 11.0, 9.0, 15.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.173828125, -3.08428955078125, -2.9947509765625, -2.90521240234375, -2.815673828125, -2.72613525390625, -2.6365966796875, -2.54705810546875, -2.45751953125, -2.36798095703125, -2.2784423828125, -2.18890380859375, -2.099365234375, -2.00982666015625, -1.9202880859375, -1.83074951171875, -1.7412109375, -1.65167236328125, -1.5621337890625, -1.47259521484375, -1.383056640625, -1.29351806640625, -1.2039794921875, -1.11444091796875, -1.02490234375, -0.93536376953125, -0.8458251953125, -0.75628662109375, -0.666748046875, -0.57720947265625, -0.4876708984375, -0.39813232421875, -0.30859375, -0.21905517578125, -0.1295166015625, -0.03997802734375, 0.049560546875, 0.13909912109375, 0.2286376953125, 0.31817626953125, 0.40771484375, 0.49725341796875, 0.5867919921875, 0.67633056640625, 0.765869140625, 0.85540771484375, 0.9449462890625, 1.03448486328125, 1.1240234375, 1.21356201171875, 1.3031005859375, 1.39263916015625, 1.482177734375, 1.57171630859375, 1.6612548828125, 1.75079345703125, 1.84033203125, 1.92987060546875, 2.0194091796875, 2.10894775390625, 2.198486328125, 2.28802490234375, 2.3775634765625, 2.46710205078125, 2.556640625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 8.0, 7.0, 5.0, 4.0, 7.0, 15.0, 13.0, 17.0, 25.0, 36.0, 49.0, 88.0, 137.0, 238.0, 439.0, 885.0, 2101.0, 5518.0, 19177.0, 93377.0, 551613.0, 306183.0, 50048.0, 11862.0, 3650.0, 1455.0, 685.0, 344.0, 188.0, 116.0, 68.0, 43.0, 43.0, 34.0, 15.0, 8.0, 15.0, 3.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.33984375, -6.13409423828125, -5.9283447265625, -5.72259521484375, -5.516845703125, -5.31109619140625, -5.1053466796875, -4.89959716796875, -4.69384765625, -4.48809814453125, -4.2823486328125, -4.07659912109375, -3.870849609375, -3.66510009765625, -3.4593505859375, -3.25360107421875, -3.0478515625, -2.84210205078125, -2.6363525390625, -2.43060302734375, -2.224853515625, -2.01910400390625, -1.8133544921875, -1.60760498046875, -1.40185546875, -1.19610595703125, -0.9903564453125, -0.78460693359375, -0.578857421875, -0.37310791015625, -0.1673583984375, 0.03839111328125, 0.244140625, 0.44989013671875, 0.6556396484375, 0.86138916015625, 1.067138671875, 1.27288818359375, 1.4786376953125, 1.68438720703125, 1.89013671875, 2.09588623046875, 2.3016357421875, 2.50738525390625, 2.713134765625, 2.91888427734375, 3.1246337890625, 3.33038330078125, 3.5361328125, 3.74188232421875, 3.9476318359375, 4.15338134765625, 4.359130859375, 4.56488037109375, 4.7706298828125, 4.97637939453125, 5.18212890625, 5.38787841796875, 5.5936279296875, 5.79937744140625, 6.005126953125, 6.21087646484375, 6.4166259765625, 6.62237548828125, 6.828125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 9.0, 11.0, 13.0, 16.0, 19.0, 17.0, 26.0, 25.0, 32.0, 31.0, 55.0, 50.0, 62.0, 50.0, 44.0, 59.0, 53.0, 48.0, 46.0, 55.0, 42.0, 41.0, 34.0, 35.0, 29.0, 20.0, 12.0, 18.0, 13.0, 4.0, 11.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.1458740234375, -7.838623046875, -7.5313720703125, -7.22412109375, -6.9168701171875, -6.609619140625, -6.3023681640625, -5.9951171875, -5.6878662109375, -5.380615234375, -5.0733642578125, -4.76611328125, -4.4588623046875, -4.151611328125, -3.8443603515625, -3.537109375, -3.2298583984375, -2.922607421875, -2.6153564453125, -2.30810546875, -2.0008544921875, -1.693603515625, -1.3863525390625, -1.0791015625, -0.7718505859375, -0.464599609375, -0.1573486328125, 0.14990234375, 0.4571533203125, 0.764404296875, 1.0716552734375, 1.37890625, 1.6861572265625, 1.993408203125, 2.3006591796875, 2.60791015625, 2.9151611328125, 3.222412109375, 3.5296630859375, 3.8369140625, 4.1441650390625, 4.451416015625, 4.7586669921875, 5.06591796875, 5.3731689453125, 5.680419921875, 5.9876708984375, 6.294921875, 6.6021728515625, 6.909423828125, 7.2166748046875, 7.52392578125, 7.8311767578125, 8.138427734375, 8.4456787109375, 8.7529296875, 9.0601806640625, 9.367431640625, 9.6746826171875, 9.98193359375, 10.2891845703125, 10.596435546875, 10.9036865234375, 11.2109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 15.0, 35.0, 66.0, 127.0, 273.0, 677.0, 3172.0, 39592.0, 972174.0, 28585.0, 2668.0, 651.0, 266.0, 95.0, 52.0, 30.0, 24.0, 11.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.203125, -7.880859375, -7.55859375, -7.236328125, -6.9140625, -6.591796875, -6.26953125, -5.947265625, -5.625, -5.302734375, -4.98046875, -4.658203125, -4.3359375, -4.013671875, -3.69140625, -3.369140625, -3.046875, -2.724609375, -2.40234375, -2.080078125, -1.7578125, -1.435546875, -1.11328125, -0.791015625, -0.46875, -0.146484375, 0.17578125, 0.498046875, 0.8203125, 1.142578125, 1.46484375, 1.787109375, 2.109375, 2.431640625, 2.75390625, 3.076171875, 3.3984375, 3.720703125, 4.04296875, 4.365234375, 4.6875, 5.009765625, 5.33203125, 5.654296875, 5.9765625, 6.298828125, 6.62109375, 6.943359375, 7.265625, 7.587890625, 7.91015625, 8.232421875, 8.5546875, 8.876953125, 9.19921875, 9.521484375, 9.84375, 10.166015625, 10.48828125, 10.810546875, 11.1328125, 11.455078125, 11.77734375, 12.099609375, 12.421875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 10.0, 9.0, 23.0, 45.0, 111.0, 252.0, 284.0, 143.0, 57.0, 31.0, 21.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001247406005859375, -0.0012013912200927734, -0.0011553764343261719, -0.0011093616485595703, -0.0010633468627929688, -0.0010173320770263672, -0.0009713172912597656, -0.0009253025054931641, -0.0008792877197265625, -0.0008332729339599609, -0.0007872581481933594, -0.0007412433624267578, -0.0006952285766601562, -0.0006492137908935547, -0.0006031990051269531, -0.0005571842193603516, -0.00051116943359375, -0.00046515464782714844, -0.0004191398620605469, -0.0003731250762939453, -0.00032711029052734375, -0.0002810955047607422, -0.00023508071899414062, -0.00018906593322753906, -0.0001430511474609375, -9.703636169433594e-05, -5.1021575927734375e-05, -5.0067901611328125e-06, 4.100799560546875e-05, 8.702278137207031e-05, 0.00013303756713867188, 0.00017905235290527344, 0.000225067138671875, 0.00027108192443847656, 0.0003170967102050781, 0.0003631114959716797, 0.00040912628173828125, 0.0004551410675048828, 0.0005011558532714844, 0.0005471706390380859, 0.0005931854248046875, 0.0006392002105712891, 0.0006852149963378906, 0.0007312297821044922, 0.0007772445678710938, 0.0008232593536376953, 0.0008692741394042969, 0.0009152889251708984, 0.0009613037109375, 0.0010073184967041016, 0.0010533332824707031, 0.0010993480682373047, 0.0011453628540039062, 0.0011913776397705078, 0.0012373924255371094, 0.001283407211303711, 0.0013294219970703125, 0.001375436782836914, 0.0014214515686035156, 0.0014674663543701172, 0.0015134811401367188, 0.0015594959259033203, 0.0016055107116699219, 0.0016515254974365234, 0.001697540283203125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 1.0, 9.0, 9.0, 13.0, 16.0, 14.0, 28.0, 49.0, 63.0, 93.0, 188.0, 359.0, 817.0, 1945.0, 5804.0, 30985.0, 829497.0, 160679.0, 12253.0, 3240.0, 1259.0, 547.0, 283.0, 157.0, 87.0, 55.0, 31.0, 25.0, 11.0, 5.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.2734375, -8.0543212890625, -7.835205078125, -7.6160888671875, -7.39697265625, -7.1778564453125, -6.958740234375, -6.7396240234375, -6.5205078125, -6.3013916015625, -6.082275390625, -5.8631591796875, -5.64404296875, -5.4249267578125, -5.205810546875, -4.9866943359375, -4.767578125, -4.5484619140625, -4.329345703125, -4.1102294921875, -3.89111328125, -3.6719970703125, -3.452880859375, -3.2337646484375, -3.0146484375, -2.7955322265625, -2.576416015625, -2.3572998046875, -2.13818359375, -1.9190673828125, -1.699951171875, -1.4808349609375, -1.26171875, -1.0426025390625, -0.823486328125, -0.6043701171875, -0.38525390625, -0.1661376953125, 0.052978515625, 0.2720947265625, 0.4912109375, 0.7103271484375, 0.929443359375, 1.1485595703125, 1.36767578125, 1.5867919921875, 1.805908203125, 2.0250244140625, 2.244140625, 2.4632568359375, 2.682373046875, 2.9014892578125, 3.12060546875, 3.3397216796875, 3.558837890625, 3.7779541015625, 3.9970703125, 4.2161865234375, 4.435302734375, 4.6544189453125, 4.87353515625, 5.0926513671875, 5.311767578125, 5.5308837890625, 5.75]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 6.0, 17.0, 22.0, 38.0, 56.0, 101.0, 129.0, 148.0, 138.0, 132.0, 67.0, 31.0, 21.0, 17.0, 15.0, 14.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.08203125, -5.8836669921875, -5.685302734375, -5.4869384765625, -5.28857421875, -5.0902099609375, -4.891845703125, -4.6934814453125, -4.4951171875, -4.2967529296875, -4.098388671875, -3.9000244140625, -3.70166015625, -3.5032958984375, -3.304931640625, -3.1065673828125, -2.908203125, -2.7098388671875, -2.511474609375, -2.3131103515625, -2.11474609375, -1.9163818359375, -1.718017578125, -1.5196533203125, -1.3212890625, -1.1229248046875, -0.924560546875, -0.7261962890625, -0.52783203125, -0.3294677734375, -0.131103515625, 0.0672607421875, 0.265625, 0.4639892578125, 0.662353515625, 0.8607177734375, 1.05908203125, 1.2574462890625, 1.455810546875, 1.6541748046875, 1.8525390625, 2.0509033203125, 2.249267578125, 2.4476318359375, 2.64599609375, 2.8443603515625, 3.042724609375, 3.2410888671875, 3.439453125, 3.6378173828125, 3.836181640625, 4.0345458984375, 4.23291015625, 4.4312744140625, 4.629638671875, 4.8280029296875, 5.0263671875, 5.2247314453125, 5.423095703125, 5.6214599609375, 5.81982421875, 6.0181884765625, 6.216552734375, 6.4149169921875, 6.61328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 17.0, 18.0, 53.0, 60.0, 98.0, 119.0, 151.0, 144.0, 118.0, 73.0, 61.0, 30.0, 16.0, 11.0, 8.0, 5.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.47226333618164, -26.52532958984375, -24.578393936157227, -22.631458282470703, -20.684524536132812, -18.737590789794922, -16.7906551361084, -14.843720436096191, -12.896785736083984, -10.949851036071777, -9.00291633605957, -7.055981636047363, -5.109046936035156, -3.162112236022949, -1.2151775360107422, 0.7317571640014648, 2.678691864013672, 4.625626564025879, 6.572561264038086, 8.519495964050293, 10.4664306640625, 12.413365364074707, 14.360300064086914, 16.307235717773438, 18.254169464111328, 20.20110321044922, 22.148038864135742, 24.094974517822266, 26.041908264160156, 27.988842010498047, 29.93577766418457, 31.882713317871094, 33.82964324951172, 35.77657699584961, 37.7235107421875, 39.670448303222656, 41.61738204956055, 43.56431579589844, 45.511253356933594, 47.458187103271484, 49.405120849609375, 51.352054595947266, 53.298988342285156, 55.24592590332031, 57.1928596496582, 59.139793395996094, 61.08673095703125, 63.03366470336914, 64.98059844970703, 66.92753601074219, 68.87446594238281, 70.82140350341797, 72.76834106445312, 74.71527099609375, 76.6622085571289, 78.60913848876953, 80.55607604980469, 82.50301361083984, 84.44994354248047, 86.39688110351562, 88.34381103515625, 90.2907485961914, 92.23768615722656, 94.18461608886719, 96.13155364990234]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 5.0, 10.0, 12.0, 20.0, 29.0, 25.0, 30.0, 24.0, 57.0, 61.0, 65.0, 88.0, 76.0, 86.0, 82.0, 72.0, 39.0, 49.0, 45.0, 22.0, 24.0, 21.0, 13.0, 13.0, 7.0, 10.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.255859375, -76.07733154296875, -73.89879608154297, -71.72026062011719, -69.54173278808594, -67.36320495605469, -65.1846694946289, -63.00613784790039, -60.827606201171875, -58.64907455444336, -56.470542907714844, -54.29201126098633, -52.11347961425781, -49.9349479675293, -47.75641632080078, -45.577884674072266, -43.39935302734375, -41.220821380615234, -39.04228973388672, -36.8637580871582, -34.68522644042969, -32.50669479370117, -30.328163146972656, -28.14963150024414, -25.971099853515625, -23.79256820678711, -21.614036560058594, -19.435504913330078, -17.256973266601562, -15.078441619873047, -12.899909973144531, -10.721378326416016, -8.5428466796875, -6.364315032958984, -4.185783386230469, -2.007251739501953, 0.1712799072265625, 2.349811553955078, 4.528343200683594, 6.706874847412109, 8.885406494140625, 11.06393814086914, 13.242469787597656, 15.421001434326172, 17.599533081054688, 19.778064727783203, 21.95659637451172, 24.135128021240234, 26.31365966796875, 28.492191314697266, 30.67072296142578, 32.8492546081543, 35.02778625488281, 37.20631790161133, 39.384849548339844, 41.56338119506836, 43.741912841796875, 45.92044448852539, 48.098976135253906, 50.27750778198242, 52.45603942871094, 54.63457107543945, 56.81310272216797, 58.991634368896484, 61.170166015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 11.0, 3.0, 17.0, 28.0, 20.0, 36.0, 49.0, 76.0, 118.0, 244.0, 421.0, 814.0, 1747.0, 4674.0, 17104.0, 3677397.0, 467188.0, 16345.0, 4448.0, 1730.0, 844.0, 385.0, 200.0, 127.0, 84.0, 58.0, 27.0, 27.0, 12.0, 13.0, 7.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.2520751953125, -6.972900390625, -6.6937255859375, -6.41455078125, -6.1353759765625, -5.856201171875, -5.5770263671875, -5.2978515625, -5.0186767578125, -4.739501953125, -4.4603271484375, -4.18115234375, -3.9019775390625, -3.622802734375, -3.3436279296875, -3.064453125, -2.7852783203125, -2.506103515625, -2.2269287109375, -1.94775390625, -1.6685791015625, -1.389404296875, -1.1102294921875, -0.8310546875, -0.5518798828125, -0.272705078125, 0.0064697265625, 0.28564453125, 0.5648193359375, 0.843994140625, 1.1231689453125, 1.40234375, 1.6815185546875, 1.960693359375, 2.2398681640625, 2.51904296875, 2.7982177734375, 3.077392578125, 3.3565673828125, 3.6357421875, 3.9149169921875, 4.194091796875, 4.4732666015625, 4.75244140625, 5.0316162109375, 5.310791015625, 5.5899658203125, 5.869140625, 6.1483154296875, 6.427490234375, 6.7066650390625, 6.98583984375, 7.2650146484375, 7.544189453125, 7.8233642578125, 8.1025390625, 8.3817138671875, 8.660888671875, 8.9400634765625, 9.21923828125, 9.4984130859375, 9.777587890625, 10.0567626953125, 10.3359375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 8.0, 13.0, 23.0, 20.0, 36.0, 65.0, 80.0, 84.0, 100.0, 108.0, 98.0, 117.0, 61.0, 44.0, 32.0, 20.0, 20.0, 14.0, 12.0, 7.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.96875, -2.860198974609375, -2.75164794921875, -2.643096923828125, -2.5345458984375, -2.425994873046875, -2.31744384765625, -2.208892822265625, -2.100341796875, -1.991790771484375, -1.88323974609375, -1.774688720703125, -1.6661376953125, -1.557586669921875, -1.44903564453125, -1.340484619140625, -1.23193359375, -1.123382568359375, -1.01483154296875, -0.906280517578125, -0.7977294921875, -0.689178466796875, -0.58062744140625, -0.472076416015625, -0.363525390625, -0.254974365234375, -0.14642333984375, -0.037872314453125, 0.0706787109375, 0.179229736328125, 0.28778076171875, 0.396331787109375, 0.5048828125, 0.613433837890625, 0.72198486328125, 0.830535888671875, 0.9390869140625, 1.047637939453125, 1.15618896484375, 1.264739990234375, 1.373291015625, 1.481842041015625, 1.59039306640625, 1.698944091796875, 1.8074951171875, 1.916046142578125, 2.02459716796875, 2.133148193359375, 2.24169921875, 2.350250244140625, 2.45880126953125, 2.567352294921875, 2.6759033203125, 2.784454345703125, 2.89300537109375, 3.001556396484375, 3.110107421875, 3.218658447265625, 3.32720947265625, 3.435760498046875, 3.5443115234375, 3.652862548828125, 3.76141357421875, 3.869964599609375, 3.978515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 8.0, 4.0, 7.0, 15.0, 21.0, 23.0, 34.0, 33.0, 46.0, 76.0, 124.0, 241.0, 447.0, 933.0, 2490.0, 14842.0, 4123935.0, 44556.0, 3873.0, 1320.0, 553.0, 235.0, 144.0, 90.0, 44.0, 47.0, 35.0, 26.0, 14.0, 10.0, 14.0, 12.0, 7.0, 2.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.26513671875, -21.5146484375, -20.76416015625, -20.013671875, -19.26318359375, -18.5126953125, -17.76220703125, -17.01171875, -16.26123046875, -15.5107421875, -14.76025390625, -14.009765625, -13.25927734375, -12.5087890625, -11.75830078125, -11.0078125, -10.25732421875, -9.5068359375, -8.75634765625, -8.005859375, -7.25537109375, -6.5048828125, -5.75439453125, -5.00390625, -4.25341796875, -3.5029296875, -2.75244140625, -2.001953125, -1.25146484375, -0.5009765625, 0.24951171875, 1.0, 1.75048828125, 2.5009765625, 3.25146484375, 4.001953125, 4.75244140625, 5.5029296875, 6.25341796875, 7.00390625, 7.75439453125, 8.5048828125, 9.25537109375, 10.005859375, 10.75634765625, 11.5068359375, 12.25732421875, 13.0078125, 13.75830078125, 14.5087890625, 15.25927734375, 16.009765625, 16.76025390625, 17.5107421875, 18.26123046875, 19.01171875, 19.76220703125, 20.5126953125, 21.26318359375, 22.013671875, 22.76416015625, 23.5146484375, 24.26513671875, 25.015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 9.0, 26.0, 42.0, 144.0, 3498.0, 253.0, 48.0, 22.0, 6.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.85882568359375, -6.6199951171875, -6.38116455078125, -6.142333984375, -5.90350341796875, -5.6646728515625, -5.42584228515625, -5.18701171875, -4.94818115234375, -4.7093505859375, -4.47052001953125, -4.231689453125, -3.99285888671875, -3.7540283203125, -3.51519775390625, -3.2763671875, -3.03753662109375, -2.7987060546875, -2.55987548828125, -2.321044921875, -2.08221435546875, -1.8433837890625, -1.60455322265625, -1.36572265625, -1.12689208984375, -0.8880615234375, -0.64923095703125, -0.410400390625, -0.17156982421875, 0.0672607421875, 0.30609130859375, 0.544921875, 0.78375244140625, 1.0225830078125, 1.26141357421875, 1.500244140625, 1.73907470703125, 1.9779052734375, 2.21673583984375, 2.45556640625, 2.69439697265625, 2.9332275390625, 3.17205810546875, 3.410888671875, 3.64971923828125, 3.8885498046875, 4.12738037109375, 4.3662109375, 4.60504150390625, 4.8438720703125, 5.08270263671875, 5.321533203125, 5.56036376953125, 5.7991943359375, 6.03802490234375, 6.27685546875, 6.51568603515625, 6.7545166015625, 6.99334716796875, 7.232177734375, 7.47100830078125, 7.7098388671875, 7.94866943359375, 8.1875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 9.0, 7.0, 19.0, 22.0, 48.0, 63.0, 139.0, 175.0, 183.0, 121.0, 109.0, 53.0, 26.0, 15.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.48661422729492, -37.54632568359375, -36.60603713989258, -35.66575241088867, -34.7254638671875, -33.78517532348633, -32.844886779785156, -31.904598236083984, -30.964311599731445, -30.024023056030273, -29.083736419677734, -28.143447875976562, -27.20315933227539, -26.26287269592285, -25.32258415222168, -24.38229751586914, -23.44200897216797, -22.501720428466797, -21.561433792114258, -20.621145248413086, -19.680858612060547, -18.740570068359375, -17.800281524658203, -16.85999298095703, -15.919706344604492, -14.979418754577637, -14.039131164550781, -13.09884262084961, -12.158555030822754, -11.218267440795898, -10.277978897094727, -9.337691307067871, -8.397401809692383, -7.457114219665527, -6.516826152801514, -5.5765380859375, -4.6362504959106445, -3.695962905883789, -2.7556748390197754, -1.8153867721557617, -0.8750991821289062, 0.06518864631652832, 1.005476474761963, 1.9457643032073975, 2.886052131652832, 3.8263397216796875, 4.766627788543701, 5.706915855407715, 6.64720344543457, 7.587491035461426, 8.527778625488281, 9.468067169189453, 10.408354759216309, 11.348642349243164, 12.288930892944336, 13.229218482971191, 14.169506072998047, 15.109793663024902, 16.050081253051758, 16.99036979675293, 17.93065643310547, 18.87094497680664, 19.811233520507812, 20.751522064208984, 21.691808700561523]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 12.0, 10.0, 27.0, 19.0, 23.0, 28.0, 41.0, 43.0, 57.0, 50.0, 54.0, 36.0, 62.0, 62.0, 51.0, 58.0, 46.0, 51.0, 57.0, 41.0, 28.0, 20.0, 21.0, 20.0, 18.0, 14.0, 9.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.763521194458008, -19.256900787353516, -18.750280380249023, -18.24365997314453, -17.73703956604004, -17.230419158935547, -16.723798751831055, -16.217178344726562, -15.71055793762207, -15.203937530517578, -14.697317123413086, -14.190696716308594, -13.684076309204102, -13.17745590209961, -12.670835494995117, -12.164215087890625, -11.657593727111816, -11.150973320007324, -10.644352912902832, -10.13773250579834, -9.631112098693848, -9.124491691589355, -8.617870330810547, -8.111249923706055, -7.604629993438721, -7.0980095863342285, -6.591389179229736, -6.084768295288086, -5.578147888183594, -5.071527481079102, -4.564907073974609, -4.058286666870117, -3.5516672134399414, -3.045046806335449, -2.538426399230957, -2.0318057537078857, -1.5251853466033936, -1.0185649394989014, -0.5119442939758301, -0.005323886871337891, 0.5012965202331543, 1.0079169273376465, 1.5145374536514282, 2.02115797996521, 2.527778387069702, 3.0343987941741943, 3.5410194396972656, 4.047639846801758, 4.55426025390625, 5.060880661010742, 5.567501068115234, 6.074121475219727, 6.580741882324219, 7.087362289428711, 7.593983173370361, 8.100603103637695, 8.607223510742188, 9.11384391784668, 9.620464324951172, 10.127084732055664, 10.633705139160156, 11.140325546264648, 11.64694595336914, 12.153566360473633, 12.660187721252441]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 12.0, 19.0, 23.0, 37.0, 40.0, 84.0, 137.0, 247.0, 543.0, 1012.0, 2379.0, 6516.0, 21460.0, 91978.0, 454655.0, 369855.0, 72226.0, 17711.0, 5567.0, 2106.0, 922.0, 449.0, 247.0, 138.0, 87.0, 32.0, 24.0, 18.0, 11.0, 9.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25, -6.0089111328125, -5.767822265625, -5.5267333984375, -5.28564453125, -5.0445556640625, -4.803466796875, -4.5623779296875, -4.3212890625, -4.0802001953125, -3.839111328125, -3.5980224609375, -3.35693359375, -3.1158447265625, -2.874755859375, -2.6336669921875, -2.392578125, -2.1514892578125, -1.910400390625, -1.6693115234375, -1.42822265625, -1.1871337890625, -0.946044921875, -0.7049560546875, -0.4638671875, -0.2227783203125, 0.018310546875, 0.2593994140625, 0.50048828125, 0.7415771484375, 0.982666015625, 1.2237548828125, 1.46484375, 1.7059326171875, 1.947021484375, 2.1881103515625, 2.42919921875, 2.6702880859375, 2.911376953125, 3.1524658203125, 3.3935546875, 3.6346435546875, 3.875732421875, 4.1168212890625, 4.35791015625, 4.5989990234375, 4.840087890625, 5.0811767578125, 5.322265625, 5.5633544921875, 5.804443359375, 6.0455322265625, 6.28662109375, 6.5277099609375, 6.768798828125, 7.0098876953125, 7.2509765625, 7.4920654296875, 7.733154296875, 7.9742431640625, 8.21533203125, 8.4564208984375, 8.697509765625, 8.9385986328125, 9.1796875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 13.0, 14.0, 19.0, 23.0, 29.0, 34.0, 38.0, 55.0, 53.0, 64.0, 72.0, 86.0, 74.0, 78.0, 68.0, 52.0, 45.0, 30.0, 39.0, 25.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.953125, -2.850555419921875, -2.74798583984375, -2.645416259765625, -2.5428466796875, -2.440277099609375, -2.33770751953125, -2.235137939453125, -2.132568359375, -2.029998779296875, -1.92742919921875, -1.824859619140625, -1.7222900390625, -1.619720458984375, -1.51715087890625, -1.414581298828125, -1.31201171875, -1.209442138671875, -1.10687255859375, -1.004302978515625, -0.9017333984375, -0.799163818359375, -0.69659423828125, -0.594024658203125, -0.491455078125, -0.388885498046875, -0.28631591796875, -0.183746337890625, -0.0811767578125, 0.021392822265625, 0.12396240234375, 0.226531982421875, 0.3291015625, 0.431671142578125, 0.53424072265625, 0.636810302734375, 0.7393798828125, 0.841949462890625, 0.94451904296875, 1.047088623046875, 1.149658203125, 1.252227783203125, 1.35479736328125, 1.457366943359375, 1.5599365234375, 1.662506103515625, 1.76507568359375, 1.867645263671875, 1.97021484375, 2.072784423828125, 2.17535400390625, 2.277923583984375, 2.3804931640625, 2.483062744140625, 2.58563232421875, 2.688201904296875, 2.790771484375, 2.893341064453125, 2.99591064453125, 3.098480224609375, 3.2010498046875, 3.303619384765625, 3.40618896484375, 3.508758544921875, 3.611328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 7.0, 18.0, 25.0, 39.0, 70.0, 156.0, 252.0, 673.0, 2140.0, 15117.0, 732073.0, 287307.0, 8046.0, 1540.0, 540.0, 230.0, 125.0, 78.0, 37.0, 26.0, 13.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.875, -21.209716796875, -20.54443359375, -19.879150390625, -19.2138671875, -18.548583984375, -17.88330078125, -17.218017578125, -16.552734375, -15.887451171875, -15.22216796875, -14.556884765625, -13.8916015625, -13.226318359375, -12.56103515625, -11.895751953125, -11.23046875, -10.565185546875, -9.89990234375, -9.234619140625, -8.5693359375, -7.904052734375, -7.23876953125, -6.573486328125, -5.908203125, -5.242919921875, -4.57763671875, -3.912353515625, -3.2470703125, -2.581787109375, -1.91650390625, -1.251220703125, -0.5859375, 0.079345703125, 0.74462890625, 1.409912109375, 2.0751953125, 2.740478515625, 3.40576171875, 4.071044921875, 4.736328125, 5.401611328125, 6.06689453125, 6.732177734375, 7.3974609375, 8.062744140625, 8.72802734375, 9.393310546875, 10.05859375, 10.723876953125, 11.38916015625, 12.054443359375, 12.7197265625, 13.385009765625, 14.05029296875, 14.715576171875, 15.380859375, 16.046142578125, 16.71142578125, 17.376708984375, 18.0419921875, 18.707275390625, 19.37255859375, 20.037841796875, 20.703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 5.0, 10.0, 13.0, 13.0, 27.0, 49.0, 60.0, 98.0, 110.0, 98.0, 100.0, 98.0, 99.0, 77.0, 49.0, 34.0, 26.0, 15.0, 8.0, 10.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.4287109375, -23.669921875, -22.9111328125, -22.15234375, -21.3935546875, -20.634765625, -19.8759765625, -19.1171875, -18.3583984375, -17.599609375, -16.8408203125, -16.08203125, -15.3232421875, -14.564453125, -13.8056640625, -13.046875, -12.2880859375, -11.529296875, -10.7705078125, -10.01171875, -9.2529296875, -8.494140625, -7.7353515625, -6.9765625, -6.2177734375, -5.458984375, -4.7001953125, -3.94140625, -3.1826171875, -2.423828125, -1.6650390625, -0.90625, -0.1474609375, 0.611328125, 1.3701171875, 2.12890625, 2.8876953125, 3.646484375, 4.4052734375, 5.1640625, 5.9228515625, 6.681640625, 7.4404296875, 8.19921875, 8.9580078125, 9.716796875, 10.4755859375, 11.234375, 11.9931640625, 12.751953125, 13.5107421875, 14.26953125, 15.0283203125, 15.787109375, 16.5458984375, 17.3046875, 18.0634765625, 18.822265625, 19.5810546875, 20.33984375, 21.0986328125, 21.857421875, 22.6162109375, 23.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 4.0, 4.0, 12.0, 9.0, 19.0, 31.0, 51.0, 69.0, 142.0, 269.0, 586.0, 1461.0, 4445.0, 20054.0, 198979.0, 736943.0, 70577.0, 10270.0, 2705.0, 988.0, 433.0, 192.0, 117.0, 65.0, 42.0, 20.0, 18.0, 8.0, 4.0, 6.0, 8.0, 6.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.469207763671875, -3.34661865234375, -3.224029541015625, -3.1014404296875, -2.978851318359375, -2.85626220703125, -2.733673095703125, -2.611083984375, -2.488494873046875, -2.36590576171875, -2.243316650390625, -2.1207275390625, -1.998138427734375, -1.87554931640625, -1.752960205078125, -1.63037109375, -1.507781982421875, -1.38519287109375, -1.262603759765625, -1.1400146484375, -1.017425537109375, -0.89483642578125, -0.772247314453125, -0.649658203125, -0.527069091796875, -0.40447998046875, -0.281890869140625, -0.1593017578125, -0.036712646484375, 0.08587646484375, 0.208465576171875, 0.3310546875, 0.453643798828125, 0.57623291015625, 0.698822021484375, 0.8214111328125, 0.944000244140625, 1.06658935546875, 1.189178466796875, 1.311767578125, 1.434356689453125, 1.55694580078125, 1.679534912109375, 1.8021240234375, 1.924713134765625, 2.04730224609375, 2.169891357421875, 2.29248046875, 2.415069580078125, 2.53765869140625, 2.660247802734375, 2.7828369140625, 2.905426025390625, 3.02801513671875, 3.150604248046875, 3.273193359375, 3.395782470703125, 3.51837158203125, 3.640960693359375, 3.7635498046875, 3.886138916015625, 4.00872802734375, 4.131317138671875, 4.25390625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 2.0, 7.0, 9.0, 6.0, 14.0, 25.0, 25.0, 33.0, 53.0, 90.0, 140.0, 160.0, 126.0, 104.0, 57.0, 39.0, 37.0, 25.0, 12.0, 11.0, 3.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006809234619140625, -0.0006562992930412292, -0.000631675124168396, -0.0006070509552955627, -0.0005824267864227295, -0.0005578026175498962, -0.000533178448677063, -0.0005085542798042297, -0.0004839301109313965, -0.00045930594205856323, -0.00043468177318573, -0.00041005760431289673, -0.0003854334354400635, -0.0003608092665672302, -0.00033618509769439697, -0.0003115609288215637, -0.00028693675994873047, -0.0002623125910758972, -0.00023768842220306396, -0.0002130642533302307, -0.00018844008445739746, -0.0001638159155845642, -0.00013919174671173096, -0.0001145675778388977, -8.994340896606445e-05, -6.53192400932312e-05, -4.069507122039795e-05, -1.6070902347564697e-05, 8.553266525268555e-06, 3.317743539810181e-05, 5.780160427093506e-05, 8.242577314376831e-05, 0.00010704994201660156, 0.00013167411088943481, 0.00015629827976226807, 0.00018092244863510132, 0.00020554661750793457, 0.00023017078638076782, 0.0002547949552536011, 0.0002794191241264343, 0.0003040432929992676, 0.00032866746187210083, 0.0003532916307449341, 0.00037791579961776733, 0.0004025399684906006, 0.00042716413736343384, 0.0004517883062362671, 0.00047641247510910034, 0.0005010366439819336, 0.0005256608128547668, 0.0005502849817276001, 0.0005749091506004333, 0.0005995333194732666, 0.0006241574883460999, 0.0006487816572189331, 0.0006734058260917664, 0.0006980299949645996, 0.0007226541638374329, 0.0007472783327102661, 0.0007719025015830994, 0.0007965266704559326, 0.0008211508393287659, 0.0008457750082015991, 0.0008703991770744324, 0.0008950233459472656]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 10.0, 7.0, 10.0, 17.0, 20.0, 38.0, 63.0, 77.0, 135.0, 218.0, 451.0, 787.0, 2104.0, 6673.0, 29826.0, 263574.0, 652906.0, 73096.0, 12510.0, 3459.0, 1271.0, 551.0, 277.0, 181.0, 105.0, 47.0, 44.0, 21.0, 24.0, 17.0, 11.0, 10.0, 4.0, 1.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.21875, -4.1112060546875, -4.003662109375, -3.8961181640625, -3.78857421875, -3.6810302734375, -3.573486328125, -3.4659423828125, -3.3583984375, -3.2508544921875, -3.143310546875, -3.0357666015625, -2.92822265625, -2.8206787109375, -2.713134765625, -2.6055908203125, -2.498046875, -2.3905029296875, -2.282958984375, -2.1754150390625, -2.06787109375, -1.9603271484375, -1.852783203125, -1.7452392578125, -1.6376953125, -1.5301513671875, -1.422607421875, -1.3150634765625, -1.20751953125, -1.0999755859375, -0.992431640625, -0.8848876953125, -0.77734375, -0.6697998046875, -0.562255859375, -0.4547119140625, -0.34716796875, -0.2396240234375, -0.132080078125, -0.0245361328125, 0.0830078125, 0.1905517578125, 0.298095703125, 0.4056396484375, 0.51318359375, 0.6207275390625, 0.728271484375, 0.8358154296875, 0.943359375, 1.0509033203125, 1.158447265625, 1.2659912109375, 1.37353515625, 1.4810791015625, 1.588623046875, 1.6961669921875, 1.8037109375, 1.9112548828125, 2.018798828125, 2.1263427734375, 2.23388671875, 2.3414306640625, 2.448974609375, 2.5565185546875, 2.6640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 5.0, 8.0, 13.0, 20.0, 27.0, 26.0, 32.0, 50.0, 55.0, 55.0, 83.0, 73.0, 84.0, 72.0, 79.0, 56.0, 48.0, 34.0, 35.0, 37.0, 21.0, 20.0, 11.0, 16.0, 5.0, 8.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.8328857421875, -2.739990234375, -2.6470947265625, -2.55419921875, -2.4613037109375, -2.368408203125, -2.2755126953125, -2.1826171875, -2.0897216796875, -1.996826171875, -1.9039306640625, -1.81103515625, -1.7181396484375, -1.625244140625, -1.5323486328125, -1.439453125, -1.3465576171875, -1.253662109375, -1.1607666015625, -1.06787109375, -0.9749755859375, -0.882080078125, -0.7891845703125, -0.6962890625, -0.6033935546875, -0.510498046875, -0.4176025390625, -0.32470703125, -0.2318115234375, -0.138916015625, -0.0460205078125, 0.046875, 0.1397705078125, 0.232666015625, 0.3255615234375, 0.41845703125, 0.5113525390625, 0.604248046875, 0.6971435546875, 0.7900390625, 0.8829345703125, 0.975830078125, 1.0687255859375, 1.16162109375, 1.2545166015625, 1.347412109375, 1.4403076171875, 1.533203125, 1.6260986328125, 1.718994140625, 1.8118896484375, 1.90478515625, 1.9976806640625, 2.090576171875, 2.1834716796875, 2.2763671875, 2.3692626953125, 2.462158203125, 2.5550537109375, 2.64794921875, 2.7408447265625, 2.833740234375, 2.9266357421875, 3.01953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 12.0, 19.0, 23.0, 37.0, 54.0, 77.0, 111.0, 119.0, 123.0, 98.0, 104.0, 64.0, 44.0, 29.0, 21.0, 13.0, 13.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.66254425048828, -61.568138122558594, -59.473731994628906, -57.37932586669922, -55.28491973876953, -53.190513610839844, -51.09611129760742, -49.001705169677734, -46.90729904174805, -44.81289291381836, -42.71848678588867, -40.624080657958984, -38.52967834472656, -36.435272216796875, -34.34086608886719, -32.2464599609375, -30.152053833007812, -28.057647705078125, -25.963241577148438, -23.868837356567383, -21.774431228637695, -19.680025100708008, -17.585620880126953, -15.491214752197266, -13.396808624267578, -11.30240249633789, -9.20799732208252, -7.11359167098999, -5.019186019897461, -2.9247798919677734, -0.8303747177124023, 1.2640304565429688, 3.3584442138671875, 5.452849864959717, 7.547255516052246, 9.641660690307617, 11.736066818237305, 13.830472946166992, 15.924878120422363, 18.019283294677734, 20.113689422607422, 22.20809555053711, 24.302501678466797, 26.39690589904785, 28.49131202697754, 30.585718154907227, 32.68012237548828, 34.77452850341797, 36.868934631347656, 38.963340759277344, 41.05774688720703, 43.15215301513672, 45.246559143066406, 47.340965270996094, 49.435367584228516, 51.5297737121582, 53.62417984008789, 55.71858596801758, 57.812992095947266, 59.90739822387695, 62.001800537109375, 64.09620666503906, 66.19061279296875, 68.28501892089844, 70.37942504882812]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 12.0, 12.0, 12.0, 18.0, 11.0, 15.0, 18.0, 21.0, 21.0, 28.0, 38.0, 25.0, 35.0, 46.0, 49.0, 57.0, 49.0, 56.0, 48.0, 43.0, 47.0, 45.0, 43.0, 42.0, 21.0, 25.0, 27.0, 29.0, 16.0, 19.0, 14.0, 10.0, 11.0, 5.0, 8.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.69361114501953, -59.840736389160156, -57.98786163330078, -56.134986877441406, -54.282108306884766, -52.42923355102539, -50.576358795166016, -48.72348403930664, -46.87060546875, -45.017730712890625, -43.16485595703125, -41.311981201171875, -39.459102630615234, -37.60622787475586, -35.753353118896484, -33.90047836303711, -32.047603607177734, -30.19472885131836, -28.34185218811035, -26.488977432250977, -24.63610076904297, -22.783226013183594, -20.93035125732422, -19.077476501464844, -17.224599838256836, -15.371724128723145, -13.518848419189453, -11.665973663330078, -9.813097953796387, -7.960222244262695, -6.10734748840332, -4.254471778869629, -2.4015960693359375, -0.5487205982208252, 1.304154872894287, 3.1570301055908203, 5.009905815124512, 6.862781524658203, 8.715656280517578, 10.56853199005127, 12.421407699584961, 14.274283409118652, 16.127159118652344, 17.98003387451172, 19.832908630371094, 21.6857852935791, 23.538660049438477, 25.391536712646484, 27.24441146850586, 29.097286224365234, 30.950162887573242, 32.80303955078125, 34.655914306640625, 36.5087890625, 38.361663818359375, 40.21453857421875, 42.067413330078125, 43.9202880859375, 45.773162841796875, 47.62603759765625, 49.47891616821289, 51.331790924072266, 53.18466567993164, 55.037540435791016, 56.890419006347656]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 14.0, 9.0, 23.0, 25.0, 35.0, 37.0, 79.0, 141.0, 285.0, 631.0, 1663.0, 5177.0, 23568.0, 350871.0, 3745020.0, 52511.0, 9500.0, 2728.0, 1002.0, 432.0, 220.0, 109.0, 81.0, 45.0, 25.0, 19.0, 11.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1015625, -10.777099609375, -10.45263671875, -10.128173828125, -9.8037109375, -9.479248046875, -9.15478515625, -8.830322265625, -8.505859375, -8.181396484375, -7.85693359375, -7.532470703125, -7.2080078125, -6.883544921875, -6.55908203125, -6.234619140625, -5.91015625, -5.585693359375, -5.26123046875, -4.936767578125, -4.6123046875, -4.287841796875, -3.96337890625, -3.638916015625, -3.314453125, -2.989990234375, -2.66552734375, -2.341064453125, -2.0166015625, -1.692138671875, -1.36767578125, -1.043212890625, -0.71875, -0.394287109375, -0.06982421875, 0.254638671875, 0.5791015625, 0.903564453125, 1.22802734375, 1.552490234375, 1.876953125, 2.201416015625, 2.52587890625, 2.850341796875, 3.1748046875, 3.499267578125, 3.82373046875, 4.148193359375, 4.47265625, 4.797119140625, 5.12158203125, 5.446044921875, 5.7705078125, 6.094970703125, 6.41943359375, 6.743896484375, 7.068359375, 7.392822265625, 7.71728515625, 8.041748046875, 8.3662109375, 8.690673828125, 9.01513671875, 9.339599609375, 9.6640625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 13.0, 14.0, 11.0, 21.0, 19.0, 31.0, 40.0, 41.0, 71.0, 73.0, 75.0, 67.0, 72.0, 54.0, 61.0, 44.0, 59.0, 40.0, 36.0, 29.0, 31.0, 9.0, 20.0, 8.0, 6.0, 10.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.82659912109375, -1.7410888671875, -1.65557861328125, -1.570068359375, -1.48455810546875, -1.3990478515625, -1.31353759765625, -1.22802734375, -1.14251708984375, -1.0570068359375, -0.97149658203125, -0.885986328125, -0.80047607421875, -0.7149658203125, -0.62945556640625, -0.5439453125, -0.45843505859375, -0.3729248046875, -0.28741455078125, -0.201904296875, -0.11639404296875, -0.0308837890625, 0.05462646484375, 0.14013671875, 0.22564697265625, 0.3111572265625, 0.39666748046875, 0.482177734375, 0.56768798828125, 0.6531982421875, 0.73870849609375, 0.82421875, 0.90972900390625, 0.9952392578125, 1.08074951171875, 1.166259765625, 1.25177001953125, 1.3372802734375, 1.42279052734375, 1.50830078125, 1.59381103515625, 1.6793212890625, 1.76483154296875, 1.850341796875, 1.93585205078125, 2.0213623046875, 2.10687255859375, 2.1923828125, 2.27789306640625, 2.3634033203125, 2.44891357421875, 2.534423828125, 2.61993408203125, 2.7054443359375, 2.79095458984375, 2.87646484375, 2.96197509765625, 3.0474853515625, 3.13299560546875, 3.218505859375, 3.30401611328125, 3.3895263671875, 3.47503662109375, 3.560546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 16.0, 12.0, 39.0, 47.0, 92.0, 187.0, 352.0, 822.0, 2071.0, 6299.0, 27731.0, 290372.0, 3758649.0, 87092.0, 14182.0, 3829.0, 1319.0, 568.0, 251.0, 142.0, 73.0, 44.0, 22.0, 21.0, 7.0, 10.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.775634765625, -10.44189453125, -10.108154296875, -9.7744140625, -9.440673828125, -9.10693359375, -8.773193359375, -8.439453125, -8.105712890625, -7.77197265625, -7.438232421875, -7.1044921875, -6.770751953125, -6.43701171875, -6.103271484375, -5.76953125, -5.435791015625, -5.10205078125, -4.768310546875, -4.4345703125, -4.100830078125, -3.76708984375, -3.433349609375, -3.099609375, -2.765869140625, -2.43212890625, -2.098388671875, -1.7646484375, -1.430908203125, -1.09716796875, -0.763427734375, -0.4296875, -0.095947265625, 0.23779296875, 0.571533203125, 0.9052734375, 1.239013671875, 1.57275390625, 1.906494140625, 2.240234375, 2.573974609375, 2.90771484375, 3.241455078125, 3.5751953125, 3.908935546875, 4.24267578125, 4.576416015625, 4.91015625, 5.243896484375, 5.57763671875, 5.911376953125, 6.2451171875, 6.578857421875, 6.91259765625, 7.246337890625, 7.580078125, 7.913818359375, 8.24755859375, 8.581298828125, 8.9150390625, 9.248779296875, 9.58251953125, 9.916259765625, 10.25]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 8.0, 9.0, 8.0, 5.0, 15.0, 16.0, 26.0, 32.0, 40.0, 73.0, 181.0, 637.0, 1777.0, 698.0, 222.0, 102.0, 79.0, 35.0, 30.0, 22.0, 13.0, 10.0, 4.0, 9.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.8203125, -11.49755859375, -11.1748046875, -10.85205078125, -10.529296875, -10.20654296875, -9.8837890625, -9.56103515625, -9.23828125, -8.91552734375, -8.5927734375, -8.27001953125, -7.947265625, -7.62451171875, -7.3017578125, -6.97900390625, -6.65625, -6.33349609375, -6.0107421875, -5.68798828125, -5.365234375, -5.04248046875, -4.7197265625, -4.39697265625, -4.07421875, -3.75146484375, -3.4287109375, -3.10595703125, -2.783203125, -2.46044921875, -2.1376953125, -1.81494140625, -1.4921875, -1.16943359375, -0.8466796875, -0.52392578125, -0.201171875, 0.12158203125, 0.4443359375, 0.76708984375, 1.08984375, 1.41259765625, 1.7353515625, 2.05810546875, 2.380859375, 2.70361328125, 3.0263671875, 3.34912109375, 3.671875, 3.99462890625, 4.3173828125, 4.64013671875, 4.962890625, 5.28564453125, 5.6083984375, 5.93115234375, 6.25390625, 6.57666015625, 6.8994140625, 7.22216796875, 7.544921875, 7.86767578125, 8.1904296875, 8.51318359375, 8.8359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 30.0, 81.0, 197.0, 300.0, 212.0, 96.0, 32.0, 21.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-95.21401977539062, -91.74302673339844, -88.27204132080078, -84.8010482788086, -81.33006286621094, -77.85906982421875, -74.38807678222656, -70.9170913696289, -67.44610595703125, -63.97511672973633, -60.504127502441406, -57.03313446044922, -53.56214904785156, -50.091156005859375, -46.62016677856445, -43.14917755126953, -39.678184509277344, -36.20719528198242, -32.7362060546875, -29.265214920043945, -25.794225692749023, -22.3232364654541, -18.852245330810547, -15.381256103515625, -11.910266876220703, -8.439277648925781, -4.968287467956543, -1.4972972869873047, 1.9736919403076172, 5.444681167602539, 8.915672302246094, 12.386661529541016, 15.857650756835938, 19.32863998413086, 22.79962921142578, 26.270620346069336, 29.741609573364258, 33.21260070800781, 36.683589935302734, 40.154579162597656, 43.62556838989258, 47.0965576171875, 50.56754684448242, 54.038536071777344, 57.50952911376953, 60.98051452636719, 64.45150756835938, 67.92250061035156, 71.39348602294922, 74.8644790649414, 78.33546447753906, 81.80645751953125, 85.2774429321289, 88.7484359741211, 92.21942138671875, 95.69041442871094, 99.16140747070312, 102.63240051269531, 106.10338592529297, 109.57437896728516, 113.04536437988281, 116.516357421875, 119.98735046386719, 123.45833587646484, 126.9293212890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 10.0, 11.0, 16.0, 19.0, 30.0, 23.0, 30.0, 41.0, 41.0, 58.0, 57.0, 61.0, 58.0, 63.0, 59.0, 69.0, 58.0, 44.0, 64.0, 43.0, 36.0, 28.0, 19.0, 18.0, 9.0, 6.0, 7.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-61.09820556640625, -59.50714874267578, -57.91608810424805, -56.32503128051758, -54.733970642089844, -53.142913818359375, -51.551856994628906, -49.96080017089844, -48.3697395324707, -46.778682708740234, -45.1876220703125, -43.59656524658203, -42.00550842285156, -40.41444778442383, -38.82339096069336, -37.232330322265625, -35.641273498535156, -34.05021667480469, -32.45915603637695, -30.868099212646484, -29.277040481567383, -27.68598175048828, -26.094924926757812, -24.50386619567871, -22.91280746459961, -21.321748733520508, -19.730690002441406, -18.139633178710938, -16.548574447631836, -14.957515716552734, -13.36645793914795, -11.775400161743164, -10.184341430664062, -8.593282699584961, -7.002224922180176, -5.411166667938232, -3.820108413696289, -2.2290501594543457, -0.6379919052124023, 0.9530658721923828, 2.5441246032714844, 4.135182857513428, 5.726241111755371, 7.3172993659973145, 8.908357620239258, 10.49941635131836, 12.090474128723145, 13.68153190612793, 15.272590637207031, 16.863649368286133, 18.454708099365234, 20.045764923095703, 21.636823654174805, 23.227882385253906, 24.818939208984375, 26.409997940063477, 28.001056671142578, 29.59211540222168, 31.18317413330078, 32.77423095703125, 34.36528778076172, 35.95634841918945, 37.54740524291992, 39.138465881347656, 40.729522705078125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 10.0, 22.0, 20.0, 42.0, 67.0, 120.0, 231.0, 444.0, 886.0, 1977.0, 4788.0, 13314.0, 41276.0, 140151.0, 405813.0, 304824.0, 91087.0, 27507.0, 9486.0, 3560.0, 1479.0, 667.0, 322.0, 188.0, 107.0, 60.0, 35.0, 28.0, 7.0, 12.0, 6.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.71649169921875, -5.5423583984375, -5.36822509765625, -5.194091796875, -5.01995849609375, -4.8458251953125, -4.67169189453125, -4.49755859375, -4.32342529296875, -4.1492919921875, -3.97515869140625, -3.801025390625, -3.62689208984375, -3.4527587890625, -3.27862548828125, -3.1044921875, -2.93035888671875, -2.7562255859375, -2.58209228515625, -2.407958984375, -2.23382568359375, -2.0596923828125, -1.88555908203125, -1.71142578125, -1.53729248046875, -1.3631591796875, -1.18902587890625, -1.014892578125, -0.84075927734375, -0.6666259765625, -0.49249267578125, -0.318359375, -0.14422607421875, 0.0299072265625, 0.20404052734375, 0.378173828125, 0.55230712890625, 0.7264404296875, 0.90057373046875, 1.07470703125, 1.24884033203125, 1.4229736328125, 1.59710693359375, 1.771240234375, 1.94537353515625, 2.1195068359375, 2.29364013671875, 2.4677734375, 2.64190673828125, 2.8160400390625, 2.99017333984375, 3.164306640625, 3.33843994140625, 3.5125732421875, 3.68670654296875, 3.86083984375, 4.03497314453125, 4.2091064453125, 4.38323974609375, 4.557373046875, 4.73150634765625, 4.9056396484375, 5.07977294921875, 5.25390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 11.0, 9.0, 19.0, 17.0, 22.0, 45.0, 35.0, 30.0, 41.0, 43.0, 54.0, 53.0, 58.0, 57.0, 67.0, 63.0, 48.0, 51.0, 38.0, 35.0, 30.0, 29.0, 35.0, 26.0, 7.0, 9.0, 10.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8853912353515625, -1.808868408203125, -1.7323455810546875, -1.65582275390625, -1.5792999267578125, -1.502777099609375, -1.4262542724609375, -1.3497314453125, -1.2732086181640625, -1.196685791015625, -1.1201629638671875, -1.04364013671875, -0.9671173095703125, -0.890594482421875, -0.8140716552734375, -0.737548828125, -0.6610260009765625, -0.584503173828125, -0.5079803466796875, -0.43145751953125, -0.3549346923828125, -0.278411865234375, -0.2018890380859375, -0.1253662109375, -0.0488433837890625, 0.027679443359375, 0.1042022705078125, 0.18072509765625, 0.2572479248046875, 0.333770751953125, 0.4102935791015625, 0.48681640625, 0.5633392333984375, 0.639862060546875, 0.7163848876953125, 0.79290771484375, 0.8694305419921875, 0.945953369140625, 1.0224761962890625, 1.0989990234375, 1.1755218505859375, 1.252044677734375, 1.3285675048828125, 1.40509033203125, 1.4816131591796875, 1.558135986328125, 1.6346588134765625, 1.711181640625, 1.7877044677734375, 1.864227294921875, 1.9407501220703125, 2.01727294921875, 2.0937957763671875, 2.170318603515625, 2.2468414306640625, 2.3233642578125, 2.3998870849609375, 2.476409912109375, 2.5529327392578125, 2.62945556640625, 2.7059783935546875, 2.782501220703125, 2.8590240478515625, 2.935546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 8.0, 11.0, 12.0, 14.0, 26.0, 20.0, 34.0, 59.0, 86.0, 153.0, 246.0, 389.0, 767.0, 1541.0, 3799.0, 12757.0, 75978.0, 643619.0, 265829.0, 31230.0, 6957.0, 2496.0, 1107.0, 576.0, 339.0, 195.0, 104.0, 77.0, 40.0, 28.0, 23.0, 11.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.3304443359375, -12.012451171875, -11.6944580078125, -11.37646484375, -11.0584716796875, -10.740478515625, -10.4224853515625, -10.1044921875, -9.7864990234375, -9.468505859375, -9.1505126953125, -8.83251953125, -8.5145263671875, -8.196533203125, -7.8785400390625, -7.560546875, -7.2425537109375, -6.924560546875, -6.6065673828125, -6.28857421875, -5.9705810546875, -5.652587890625, -5.3345947265625, -5.0166015625, -4.6986083984375, -4.380615234375, -4.0626220703125, -3.74462890625, -3.4266357421875, -3.108642578125, -2.7906494140625, -2.47265625, -2.1546630859375, -1.836669921875, -1.5186767578125, -1.20068359375, -0.8826904296875, -0.564697265625, -0.2467041015625, 0.0712890625, 0.3892822265625, 0.707275390625, 1.0252685546875, 1.34326171875, 1.6612548828125, 1.979248046875, 2.2972412109375, 2.615234375, 2.9332275390625, 3.251220703125, 3.5692138671875, 3.88720703125, 4.2052001953125, 4.523193359375, 4.8411865234375, 5.1591796875, 5.4771728515625, 5.795166015625, 6.1131591796875, 6.43115234375, 6.7491455078125, 7.067138671875, 7.3851318359375, 7.703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 8.0, 6.0, 11.0, 11.0, 23.0, 25.0, 21.0, 28.0, 30.0, 35.0, 47.0, 44.0, 61.0, 57.0, 44.0, 45.0, 46.0, 58.0, 49.0, 53.0, 39.0, 37.0, 29.0, 39.0, 30.0, 24.0, 22.0, 15.0, 10.0, 8.0, 7.0, 10.0, 3.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.6724853515625, -13.290283203125, -12.9080810546875, -12.52587890625, -12.1436767578125, -11.761474609375, -11.3792724609375, -10.9970703125, -10.6148681640625, -10.232666015625, -9.8504638671875, -9.46826171875, -9.0860595703125, -8.703857421875, -8.3216552734375, -7.939453125, -7.5572509765625, -7.175048828125, -6.7928466796875, -6.41064453125, -6.0284423828125, -5.646240234375, -5.2640380859375, -4.8818359375, -4.4996337890625, -4.117431640625, -3.7352294921875, -3.35302734375, -2.9708251953125, -2.588623046875, -2.2064208984375, -1.82421875, -1.4420166015625, -1.059814453125, -0.6776123046875, -0.29541015625, 0.0867919921875, 0.468994140625, 0.8511962890625, 1.2333984375, 1.6156005859375, 1.997802734375, 2.3800048828125, 2.76220703125, 3.1444091796875, 3.526611328125, 3.9088134765625, 4.291015625, 4.6732177734375, 5.055419921875, 5.4376220703125, 5.81982421875, 6.2020263671875, 6.584228515625, 6.9664306640625, 7.3486328125, 7.7308349609375, 8.113037109375, 8.4952392578125, 8.87744140625, 9.2596435546875, 9.641845703125, 10.0240478515625, 10.40625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 4.0, 11.0, 17.0, 25.0, 42.0, 82.0, 141.0, 280.0, 741.0, 2503.0, 17173.0, 877408.0, 141491.0, 6318.0, 1362.0, 512.0, 202.0, 102.0, 57.0, 17.0, 19.0, 11.0, 5.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2578125, -9.9788818359375, -9.699951171875, -9.4210205078125, -9.14208984375, -8.8631591796875, -8.584228515625, -8.3052978515625, -8.0263671875, -7.7474365234375, -7.468505859375, -7.1895751953125, -6.91064453125, -6.6317138671875, -6.352783203125, -6.0738525390625, -5.794921875, -5.5159912109375, -5.237060546875, -4.9581298828125, -4.67919921875, -4.4002685546875, -4.121337890625, -3.8424072265625, -3.5634765625, -3.2845458984375, -3.005615234375, -2.7266845703125, -2.44775390625, -2.1688232421875, -1.889892578125, -1.6109619140625, -1.33203125, -1.0531005859375, -0.774169921875, -0.4952392578125, -0.21630859375, 0.0626220703125, 0.341552734375, 0.6204833984375, 0.8994140625, 1.1783447265625, 1.457275390625, 1.7362060546875, 2.01513671875, 2.2940673828125, 2.572998046875, 2.8519287109375, 3.130859375, 3.4097900390625, 3.688720703125, 3.9676513671875, 4.24658203125, 4.5255126953125, 4.804443359375, 5.0833740234375, 5.3623046875, 5.6412353515625, 5.920166015625, 6.1990966796875, 6.47802734375, 6.7569580078125, 7.035888671875, 7.3148193359375, 7.59375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 7.0, 11.0, 11.0, 24.0, 49.0, 80.0, 104.0, 134.0, 170.0, 111.0, 95.0, 76.0, 32.0, 33.0, 18.0, 9.0, 9.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013856887817382812, -0.0013529956340789795, -0.0013203024864196777, -0.001287609338760376, -0.0012549161911010742, -0.0012222230434417725, -0.0011895298957824707, -0.001156836748123169, -0.0011241436004638672, -0.0010914504528045654, -0.0010587573051452637, -0.001026064157485962, -0.0009933710098266602, -0.0009606778621673584, -0.0009279847145080566, -0.0008952915668487549, -0.0008625984191894531, -0.0008299052715301514, -0.0007972121238708496, -0.0007645189762115479, -0.0007318258285522461, -0.0006991326808929443, -0.0006664395332336426, -0.0006337463855743408, -0.0006010532379150391, -0.0005683600902557373, -0.0005356669425964355, -0.0005029737949371338, -0.00047028064727783203, -0.0004375874996185303, -0.0004048943519592285, -0.00037220120429992676, -0.000339508056640625, -0.00030681490898132324, -0.0002741217613220215, -0.00024142861366271973, -0.00020873546600341797, -0.0001760423183441162, -0.00014334917068481445, -0.0001106560230255127, -7.796287536621094e-05, -4.526972770690918e-05, -1.2576580047607422e-05, 2.0116567611694336e-05, 5.2809715270996094e-05, 8.550286293029785e-05, 0.00011819601058959961, 0.00015088915824890137, 0.00018358230590820312, 0.00021627545356750488, 0.00024896860122680664, 0.0002816617488861084, 0.00031435489654541016, 0.0003470480442047119, 0.00037974119186401367, 0.00041243433952331543, 0.0004451274871826172, 0.00047782063484191895, 0.0005105137825012207, 0.0005432069301605225, 0.0005759000778198242, 0.000608593225479126, 0.0006412863731384277, 0.0006739795207977295, 0.0007066726684570312]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 11.0, 5.0, 11.0, 23.0, 23.0, 49.0, 71.0, 140.0, 312.0, 724.0, 2030.0, 8497.0, 87483.0, 857080.0, 80792.0, 8088.0, 1924.0, 676.0, 268.0, 140.0, 91.0, 43.0, 19.0, 17.0, 10.0, 6.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.7265625, -6.55621337890625, -6.3858642578125, -6.21551513671875, -6.045166015625, -5.87481689453125, -5.7044677734375, -5.53411865234375, -5.36376953125, -5.19342041015625, -5.0230712890625, -4.85272216796875, -4.682373046875, -4.51202392578125, -4.3416748046875, -4.17132568359375, -4.0009765625, -3.83062744140625, -3.6602783203125, -3.48992919921875, -3.319580078125, -3.14923095703125, -2.9788818359375, -2.80853271484375, -2.63818359375, -2.46783447265625, -2.2974853515625, -2.12713623046875, -1.956787109375, -1.78643798828125, -1.6160888671875, -1.44573974609375, -1.275390625, -1.10504150390625, -0.9346923828125, -0.76434326171875, -0.593994140625, -0.42364501953125, -0.2532958984375, -0.08294677734375, 0.08740234375, 0.25775146484375, 0.4281005859375, 0.59844970703125, 0.768798828125, 0.93914794921875, 1.1094970703125, 1.27984619140625, 1.4501953125, 1.62054443359375, 1.7908935546875, 1.96124267578125, 2.131591796875, 2.30194091796875, 2.4722900390625, 2.64263916015625, 2.81298828125, 2.98333740234375, 3.1536865234375, 3.32403564453125, 3.494384765625, 3.66473388671875, 3.8350830078125, 4.00543212890625, 4.17578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 5.0, 6.0, 9.0, 17.0, 21.0, 21.0, 35.0, 65.0, 65.0, 97.0, 100.0, 101.0, 99.0, 88.0, 74.0, 47.0, 39.0, 23.0, 25.0, 16.0, 15.0, 10.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-6.48046875, -6.3350830078125, -6.189697265625, -6.0443115234375, -5.89892578125, -5.7535400390625, -5.608154296875, -5.4627685546875, -5.3173828125, -5.1719970703125, -5.026611328125, -4.8812255859375, -4.73583984375, -4.5904541015625, -4.445068359375, -4.2996826171875, -4.154296875, -4.0089111328125, -3.863525390625, -3.7181396484375, -3.57275390625, -3.4273681640625, -3.281982421875, -3.1365966796875, -2.9912109375, -2.8458251953125, -2.700439453125, -2.5550537109375, -2.40966796875, -2.2642822265625, -2.118896484375, -1.9735107421875, -1.828125, -1.6827392578125, -1.537353515625, -1.3919677734375, -1.24658203125, -1.1011962890625, -0.955810546875, -0.8104248046875, -0.6650390625, -0.5196533203125, -0.374267578125, -0.2288818359375, -0.08349609375, 0.0618896484375, 0.207275390625, 0.3526611328125, 0.498046875, 0.6434326171875, 0.788818359375, 0.9342041015625, 1.07958984375, 1.2249755859375, 1.370361328125, 1.5157470703125, 1.6611328125, 1.8065185546875, 1.951904296875, 2.0972900390625, 2.24267578125, 2.3880615234375, 2.533447265625, 2.6788330078125, 2.82421875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 18.0, 53.0, 80.0, 163.0, 219.0, 203.0, 99.0, 63.0, 36.0, 15.0, 8.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.42872619628906, -96.5566635131836, -93.68460083007812, -90.81254577636719, -87.94048309326172, -85.06842041015625, -82.19635772705078, -79.32429504394531, -76.45223999023438, -73.5801773071289, -70.70811462402344, -67.8360595703125, -64.96399688720703, -62.09193420410156, -59.219871520996094, -56.347808837890625, -53.475746154785156, -50.60368347167969, -47.731624603271484, -44.859561920166016, -41.98750305175781, -39.115440368652344, -36.243377685546875, -33.371315002441406, -30.499256134033203, -27.627195358276367, -24.75513458251953, -21.883071899414062, -19.011011123657227, -16.13895034790039, -13.266887664794922, -10.394826889038086, -7.522773742675781, -4.650712490081787, -1.778651237487793, 1.0934104919433594, 3.9654712677001953, 6.837532043457031, 9.7095947265625, 12.581655502319336, 15.453716278076172, 18.325777053833008, 21.197837829589844, 24.069900512695312, 26.94196128845215, 29.814022064208984, 32.68608474731445, 35.558143615722656, 38.430206298828125, 41.302268981933594, 44.1743278503418, 47.046390533447266, 49.91844940185547, 52.79051208496094, 55.662574768066406, 58.534637451171875, 61.40669631958008, 64.27875518798828, 67.15081787109375, 70.02288055419922, 72.89494323730469, 75.76699829101562, 78.63906860351562, 81.51112365722656, 84.38318634033203]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 8.0, 20.0, 24.0, 13.0, 23.0, 35.0, 35.0, 37.0, 38.0, 40.0, 51.0, 66.0, 56.0, 83.0, 62.0, 66.0, 42.0, 42.0, 39.0, 36.0, 42.0, 28.0, 23.0, 27.0, 12.0, 8.0, 4.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.788604736328125, -62.07896423339844, -60.36932373046875, -58.6596794128418, -56.95003890991211, -55.24039840698242, -53.530757904052734, -51.82111358642578, -50.111473083496094, -48.401832580566406, -46.69219207763672, -44.982547760009766, -43.27290725708008, -41.56326675415039, -39.8536262512207, -38.14398193359375, -36.43434143066406, -34.724700927734375, -33.01506042480469, -31.305418014526367, -29.595775604248047, -27.88613510131836, -26.176494598388672, -24.46685218811035, -22.757213592529297, -21.04757308959961, -19.33793067932129, -17.6282901763916, -15.918647766113281, -14.209007263183594, -12.49936580657959, -10.789724349975586, -9.080081939697266, -7.370440483093262, -5.660799026489258, -3.951158046722412, -2.241516590118408, -0.5318756103515625, 1.1777658462524414, 2.8874073028564453, 4.597048759460449, 6.306690216064453, 8.016331672668457, 9.725973129272461, 11.435613632202148, 13.145255088806152, 14.854896545410156, 16.564537048339844, 18.274179458618164, 19.98381996154785, 21.693462371826172, 23.40310287475586, 25.11274528503418, 26.822385787963867, 28.532028198242188, 30.241668701171875, 31.951309204101562, 33.66094970703125, 35.37059020996094, 37.08023452758789, 38.78987503051758, 40.499515533447266, 42.20915603637695, 43.918800354003906, 45.628440856933594]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 8.0, 8.0, 11.0, 9.0, 19.0, 19.0, 28.0, 33.0, 75.0, 113.0, 274.0, 710.0, 2794.0, 14757.0, 318398.0, 3810465.0, 38923.0, 5519.0, 1255.0, 402.0, 196.0, 98.0, 55.0, 37.0, 25.0, 15.0, 13.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.421875, -11.0673828125, -10.712890625, -10.3583984375, -10.00390625, -9.6494140625, -9.294921875, -8.9404296875, -8.5859375, -8.2314453125, -7.876953125, -7.5224609375, -7.16796875, -6.8134765625, -6.458984375, -6.1044921875, -5.75, -5.3955078125, -5.041015625, -4.6865234375, -4.33203125, -3.9775390625, -3.623046875, -3.2685546875, -2.9140625, -2.5595703125, -2.205078125, -1.8505859375, -1.49609375, -1.1416015625, -0.787109375, -0.4326171875, -0.078125, 0.2763671875, 0.630859375, 0.9853515625, 1.33984375, 1.6943359375, 2.048828125, 2.4033203125, 2.7578125, 3.1123046875, 3.466796875, 3.8212890625, 4.17578125, 4.5302734375, 4.884765625, 5.2392578125, 5.59375, 5.9482421875, 6.302734375, 6.6572265625, 7.01171875, 7.3662109375, 7.720703125, 8.0751953125, 8.4296875, 8.7841796875, 9.138671875, 9.4931640625, 9.84765625, 10.2021484375, 10.556640625, 10.9111328125, 11.265625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 5.0, 9.0, 19.0, 27.0, 27.0, 43.0, 53.0, 75.0, 98.0, 108.0, 77.0, 106.0, 84.0, 67.0, 58.0, 44.0, 31.0, 17.0, 16.0, 10.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.498992919921875, -3.37103271484375, -3.243072509765625, -3.1151123046875, -2.987152099609375, -2.85919189453125, -2.731231689453125, -2.603271484375, -2.475311279296875, -2.34735107421875, -2.219390869140625, -2.0914306640625, -1.963470458984375, -1.83551025390625, -1.707550048828125, -1.57958984375, -1.451629638671875, -1.32366943359375, -1.195709228515625, -1.0677490234375, -0.939788818359375, -0.81182861328125, -0.683868408203125, -0.555908203125, -0.427947998046875, -0.29998779296875, -0.172027587890625, -0.0440673828125, 0.083892822265625, 0.21185302734375, 0.339813232421875, 0.4677734375, 0.595733642578125, 0.72369384765625, 0.851654052734375, 0.9796142578125, 1.107574462890625, 1.23553466796875, 1.363494873046875, 1.491455078125, 1.619415283203125, 1.74737548828125, 1.875335693359375, 2.0032958984375, 2.131256103515625, 2.25921630859375, 2.387176513671875, 2.51513671875, 2.643096923828125, 2.77105712890625, 2.899017333984375, 3.0269775390625, 3.154937744140625, 3.28289794921875, 3.410858154296875, 3.538818359375, 3.666778564453125, 3.79473876953125, 3.922698974609375, 4.0506591796875, 4.178619384765625, 4.30657958984375, 4.434539794921875, 4.5625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 7.0, 8.0, 10.0, 8.0, 12.0, 21.0, 32.0, 48.0, 67.0, 116.0, 186.0, 402.0, 856.0, 1786.0, 4993.0, 17614.0, 99467.0, 3604564.0, 415762.0, 34951.0, 8239.0, 2732.0, 1081.0, 543.0, 259.0, 146.0, 118.0, 63.0, 45.0, 36.0, 25.0, 13.0, 17.0, 14.0, 6.0, 12.0, 6.0, 3.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.82568359375, -8.5185546875, -8.21142578125, -7.904296875, -7.59716796875, -7.2900390625, -6.98291015625, -6.67578125, -6.36865234375, -6.0615234375, -5.75439453125, -5.447265625, -5.14013671875, -4.8330078125, -4.52587890625, -4.21875, -3.91162109375, -3.6044921875, -3.29736328125, -2.990234375, -2.68310546875, -2.3759765625, -2.06884765625, -1.76171875, -1.45458984375, -1.1474609375, -0.84033203125, -0.533203125, -0.22607421875, 0.0810546875, 0.38818359375, 0.6953125, 1.00244140625, 1.3095703125, 1.61669921875, 1.923828125, 2.23095703125, 2.5380859375, 2.84521484375, 3.15234375, 3.45947265625, 3.7666015625, 4.07373046875, 4.380859375, 4.68798828125, 4.9951171875, 5.30224609375, 5.609375, 5.91650390625, 6.2236328125, 6.53076171875, 6.837890625, 7.14501953125, 7.4521484375, 7.75927734375, 8.06640625, 8.37353515625, 8.6806640625, 8.98779296875, 9.294921875, 9.60205078125, 9.9091796875, 10.21630859375, 10.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 7.0, 13.0, 14.0, 31.0, 36.0, 60.0, 149.0, 435.0, 1861.0, 1003.0, 238.0, 107.0, 39.0, 33.0, 19.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.609375, -7.181396484375, -6.75341796875, -6.325439453125, -5.8974609375, -5.469482421875, -5.04150390625, -4.613525390625, -4.185546875, -3.757568359375, -3.32958984375, -2.901611328125, -2.4736328125, -2.045654296875, -1.61767578125, -1.189697265625, -0.76171875, -0.333740234375, 0.09423828125, 0.522216796875, 0.9501953125, 1.378173828125, 1.80615234375, 2.234130859375, 2.662109375, 3.090087890625, 3.51806640625, 3.946044921875, 4.3740234375, 4.802001953125, 5.22998046875, 5.657958984375, 6.0859375, 6.513916015625, 6.94189453125, 7.369873046875, 7.7978515625, 8.225830078125, 8.65380859375, 9.081787109375, 9.509765625, 9.937744140625, 10.36572265625, 10.793701171875, 11.2216796875, 11.649658203125, 12.07763671875, 12.505615234375, 12.93359375, 13.361572265625, 13.78955078125, 14.217529296875, 14.6455078125, 15.073486328125, 15.50146484375, 15.929443359375, 16.357421875, 16.785400390625, 17.21337890625, 17.641357421875, 18.0693359375, 18.497314453125, 18.92529296875, 19.353271484375, 19.78125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 13.0, 35.0, 74.0, 162.0, 249.0, 246.0, 115.0, 42.0, 23.0, 15.0, 8.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.06118774414062, -95.5317153930664, -93.00223541259766, -90.47276306152344, -87.94329071044922, -85.413818359375, -82.88433837890625, -80.35486602783203, -77.82539367675781, -75.2959213256836, -72.76644134521484, -70.23696899414062, -67.7074966430664, -65.17802429199219, -62.64854431152344, -60.11907196044922, -57.58959197998047, -55.060115814208984, -52.530643463134766, -50.00116729736328, -47.47169494628906, -44.94221878051758, -42.412742614746094, -39.883270263671875, -37.35379409790039, -34.824317932128906, -32.29484558105469, -29.765369415283203, -27.23589515686035, -24.7064208984375, -22.176944732666016, -19.647470474243164, -17.117996215820312, -14.588521957397461, -12.059046745300293, -9.529571533203125, -7.000097274780273, -4.470623016357422, -1.941147804260254, 0.5883274078369141, 3.1178016662597656, 5.647276401519775, 8.176751136779785, 10.706226348876953, 13.235700607299805, 15.765174865722656, 18.29465103149414, 20.824125289916992, 23.353599548339844, 25.883073806762695, 28.412548065185547, 30.94202423095703, 33.47149658203125, 36.000972747802734, 38.53044891357422, 41.05992126464844, 43.58939743041992, 46.118873596191406, 48.648345947265625, 51.17782211303711, 53.707298278808594, 56.23677062988281, 58.7662467956543, 61.29572296142578, 63.8251953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 11.0, 12.0, 14.0, 13.0, 16.0, 19.0, 25.0, 25.0, 27.0, 27.0, 44.0, 51.0, 52.0, 47.0, 45.0, 51.0, 47.0, 45.0, 65.0, 47.0, 36.0, 31.0, 36.0, 25.0, 27.0, 25.0, 22.0, 22.0, 17.0, 15.0, 15.0, 10.0, 8.0, 3.0, 5.0, 8.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.665313720703125, -30.710559844970703, -29.75580406188965, -28.801048278808594, -27.846294403076172, -26.89154052734375, -25.936784744262695, -24.98202896118164, -24.02727508544922, -23.072521209716797, -22.117765426635742, -21.163009643554688, -20.208255767822266, -19.253501892089844, -18.29874610900879, -17.343990325927734, -16.389236450195312, -15.434481620788574, -14.479726791381836, -13.524971961975098, -12.57021713256836, -11.615462303161621, -10.660707473754883, -9.705952644348145, -8.751197814941406, -7.796442985534668, -6.84168815612793, -5.886933326721191, -4.932178497314453, -3.977423667907715, -3.0226688385009766, -2.0679140090942383, -1.1131591796875, -0.15840435028076172, 0.7963504791259766, 1.7511053085327148, 2.705860137939453, 3.6606149673461914, 4.61536979675293, 5.570124626159668, 6.524879455566406, 7.4796342849731445, 8.434389114379883, 9.389143943786621, 10.34389877319336, 11.298653602600098, 12.253408432006836, 13.208163261413574, 14.162918090820312, 15.11767292022705, 16.07242774963379, 17.027183532714844, 17.981937408447266, 18.936691284179688, 19.891447067260742, 20.846202850341797, 21.80095672607422, 22.75571060180664, 23.710466384887695, 24.66522216796875, 25.619976043701172, 26.574729919433594, 27.52948570251465, 28.484241485595703, 29.438995361328125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 10.0, 17.0, 19.0, 23.0, 36.0, 80.0, 74.0, 122.0, 191.0, 327.0, 474.0, 793.0, 1232.0, 2173.0, 3746.0, 6908.0, 12439.0, 24460.0, 48435.0, 99127.0, 203729.0, 292361.0, 177847.0, 85469.0, 41327.0, 21264.0, 11109.0, 6151.0, 3470.0, 1938.0, 1170.0, 681.0, 451.0, 303.0, 202.0, 124.0, 82.0, 64.0, 43.0, 23.0, 9.0, 14.0, 10.0, 3.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.80078125, -3.6834716796875, -3.566162109375, -3.4488525390625, -3.33154296875, -3.2142333984375, -3.096923828125, -2.9796142578125, -2.8623046875, -2.7449951171875, -2.627685546875, -2.5103759765625, -2.39306640625, -2.2757568359375, -2.158447265625, -2.0411376953125, -1.923828125, -1.8065185546875, -1.689208984375, -1.5718994140625, -1.45458984375, -1.3372802734375, -1.219970703125, -1.1026611328125, -0.9853515625, -0.8680419921875, -0.750732421875, -0.6334228515625, -0.51611328125, -0.3988037109375, -0.281494140625, -0.1641845703125, -0.046875, 0.0704345703125, 0.187744140625, 0.3050537109375, 0.42236328125, 0.5396728515625, 0.656982421875, 0.7742919921875, 0.8916015625, 1.0089111328125, 1.126220703125, 1.2435302734375, 1.36083984375, 1.4781494140625, 1.595458984375, 1.7127685546875, 1.830078125, 1.9473876953125, 2.064697265625, 2.1820068359375, 2.29931640625, 2.4166259765625, 2.533935546875, 2.6512451171875, 2.7685546875, 2.8858642578125, 3.003173828125, 3.1204833984375, 3.23779296875, 3.3551025390625, 3.472412109375, 3.5897216796875, 3.70703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 9.0, 10.0, 16.0, 17.0, 29.0, 24.0, 22.0, 22.0, 34.0, 38.0, 50.0, 32.0, 31.0, 50.0, 53.0, 43.0, 40.0, 55.0, 50.0, 35.0, 31.0, 48.0, 34.0, 28.0, 26.0, 22.0, 19.0, 20.0, 12.0, 10.0, 8.0, 8.0, 9.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.3125, -2.24298095703125, -2.1734619140625, -2.10394287109375, -2.034423828125, -1.96490478515625, -1.8953857421875, -1.82586669921875, -1.75634765625, -1.68682861328125, -1.6173095703125, -1.54779052734375, -1.478271484375, -1.40875244140625, -1.3392333984375, -1.26971435546875, -1.2001953125, -1.13067626953125, -1.0611572265625, -0.99163818359375, -0.922119140625, -0.85260009765625, -0.7830810546875, -0.71356201171875, -0.64404296875, -0.57452392578125, -0.5050048828125, -0.43548583984375, -0.365966796875, -0.29644775390625, -0.2269287109375, -0.15740966796875, -0.087890625, -0.01837158203125, 0.0511474609375, 0.12066650390625, 0.190185546875, 0.25970458984375, 0.3292236328125, 0.39874267578125, 0.46826171875, 0.53778076171875, 0.6072998046875, 0.67681884765625, 0.746337890625, 0.81585693359375, 0.8853759765625, 0.95489501953125, 1.0244140625, 1.09393310546875, 1.1634521484375, 1.23297119140625, 1.302490234375, 1.37200927734375, 1.4415283203125, 1.51104736328125, 1.58056640625, 1.65008544921875, 1.7196044921875, 1.78912353515625, 1.858642578125, 1.92816162109375, 1.9976806640625, 2.06719970703125, 2.13671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 16.0, 27.0, 26.0, 39.0, 50.0, 79.0, 106.0, 165.0, 259.0, 476.0, 843.0, 1832.0, 4579.0, 15859.0, 77060.0, 524742.0, 345651.0, 57077.0, 12561.0, 3754.0, 1514.0, 716.0, 372.0, 249.0, 135.0, 99.0, 65.0, 45.0, 44.0, 27.0, 13.0, 19.0, 4.0, 6.0, 7.0, 6.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0], "bins": [-11.375, -11.074951171875, -10.77490234375, -10.474853515625, -10.1748046875, -9.874755859375, -9.57470703125, -9.274658203125, -8.974609375, -8.674560546875, -8.37451171875, -8.074462890625, -7.7744140625, -7.474365234375, -7.17431640625, -6.874267578125, -6.57421875, -6.274169921875, -5.97412109375, -5.674072265625, -5.3740234375, -5.073974609375, -4.77392578125, -4.473876953125, -4.173828125, -3.873779296875, -3.57373046875, -3.273681640625, -2.9736328125, -2.673583984375, -2.37353515625, -2.073486328125, -1.7734375, -1.473388671875, -1.17333984375, -0.873291015625, -0.5732421875, -0.273193359375, 0.02685546875, 0.326904296875, 0.626953125, 0.927001953125, 1.22705078125, 1.527099609375, 1.8271484375, 2.127197265625, 2.42724609375, 2.727294921875, 3.02734375, 3.327392578125, 3.62744140625, 3.927490234375, 4.2275390625, 4.527587890625, 4.82763671875, 5.127685546875, 5.427734375, 5.727783203125, 6.02783203125, 6.327880859375, 6.6279296875, 6.927978515625, 7.22802734375, 7.528076171875, 7.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 8.0, 15.0, 11.0, 13.0, 19.0, 32.0, 24.0, 33.0, 41.0, 35.0, 53.0, 51.0, 55.0, 52.0, 78.0, 37.0, 49.0, 50.0, 33.0, 45.0, 54.0, 29.0, 29.0, 23.0, 23.0, 17.0, 9.0, 14.0, 7.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-13.796875, -13.4326171875, -13.068359375, -12.7041015625, -12.33984375, -11.9755859375, -11.611328125, -11.2470703125, -10.8828125, -10.5185546875, -10.154296875, -9.7900390625, -9.42578125, -9.0615234375, -8.697265625, -8.3330078125, -7.96875, -7.6044921875, -7.240234375, -6.8759765625, -6.51171875, -6.1474609375, -5.783203125, -5.4189453125, -5.0546875, -4.6904296875, -4.326171875, -3.9619140625, -3.59765625, -3.2333984375, -2.869140625, -2.5048828125, -2.140625, -1.7763671875, -1.412109375, -1.0478515625, -0.68359375, -0.3193359375, 0.044921875, 0.4091796875, 0.7734375, 1.1376953125, 1.501953125, 1.8662109375, 2.23046875, 2.5947265625, 2.958984375, 3.3232421875, 3.6875, 4.0517578125, 4.416015625, 4.7802734375, 5.14453125, 5.5087890625, 5.873046875, 6.2373046875, 6.6015625, 6.9658203125, 7.330078125, 7.6943359375, 8.05859375, 8.4228515625, 8.787109375, 9.1513671875, 9.515625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 11.0, 20.0, 20.0, 38.0, 47.0, 83.0, 155.0, 275.0, 556.0, 1418.0, 5189.0, 37326.0, 647456.0, 328863.0, 21122.0, 3785.0, 1109.0, 465.0, 222.0, 128.0, 72.0, 52.0, 27.0, 18.0, 15.0, 12.0, 15.0, 5.0, 6.0, 0.0, 5.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-6.0078125, -5.857177734375, -5.70654296875, -5.555908203125, -5.4052734375, -5.254638671875, -5.10400390625, -4.953369140625, -4.802734375, -4.652099609375, -4.50146484375, -4.350830078125, -4.2001953125, -4.049560546875, -3.89892578125, -3.748291015625, -3.59765625, -3.447021484375, -3.29638671875, -3.145751953125, -2.9951171875, -2.844482421875, -2.69384765625, -2.543212890625, -2.392578125, -2.241943359375, -2.09130859375, -1.940673828125, -1.7900390625, -1.639404296875, -1.48876953125, -1.338134765625, -1.1875, -1.036865234375, -0.88623046875, -0.735595703125, -0.5849609375, -0.434326171875, -0.28369140625, -0.133056640625, 0.017578125, 0.168212890625, 0.31884765625, 0.469482421875, 0.6201171875, 0.770751953125, 0.92138671875, 1.072021484375, 1.22265625, 1.373291015625, 1.52392578125, 1.674560546875, 1.8251953125, 1.975830078125, 2.12646484375, 2.277099609375, 2.427734375, 2.578369140625, 2.72900390625, 2.879638671875, 3.0302734375, 3.180908203125, 3.33154296875, 3.482177734375, 3.6328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 13.0, 18.0, 15.0, 24.0, 30.0, 40.0, 26.0, 44.0, 48.0, 64.0, 62.0, 82.0, 66.0, 62.0, 52.0, 43.0, 55.0, 34.0, 38.0, 34.0, 24.0, 17.0, 18.0, 10.0, 15.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0005655288696289062, -0.0005498901009559631, -0.00053425133228302, -0.0005186125636100769, -0.0005029737949371338, -0.0004873350262641907, -0.00047169625759124756, -0.00045605748891830444, -0.00044041872024536133, -0.0004247799515724182, -0.0004091411828994751, -0.000393502414226532, -0.00037786364555358887, -0.00036222487688064575, -0.00034658610820770264, -0.0003309473395347595, -0.0003153085708618164, -0.0002996698021888733, -0.0002840310335159302, -0.00026839226484298706, -0.00025275349617004395, -0.00023711472749710083, -0.00022147595882415771, -0.0002058371901512146, -0.00019019842147827148, -0.00017455965280532837, -0.00015892088413238525, -0.00014328211545944214, -0.00012764334678649902, -0.00011200457811355591, -9.636580944061279e-05, -8.072704076766968e-05, -6.508827209472656e-05, -4.944950342178345e-05, -3.381073474884033e-05, -1.8171966075897217e-05, -2.5331974029541016e-06, 1.3105571269989014e-05, 2.874433994293213e-05, 4.4383108615875244e-05, 6.002187728881836e-05, 7.566064596176147e-05, 9.129941463470459e-05, 0.0001069381833076477, 0.00012257695198059082, 0.00013821572065353394, 0.00015385448932647705, 0.00016949325799942017, 0.00018513202667236328, 0.0002007707953453064, 0.0002164095640182495, 0.00023204833269119263, 0.00024768710136413574, 0.00026332587003707886, 0.00027896463871002197, 0.0002946034073829651, 0.0003102421760559082, 0.0003258809447288513, 0.00034151971340179443, 0.00035715848207473755, 0.00037279725074768066, 0.0003884360194206238, 0.0004040747880935669, 0.00041971355676651, 0.0004353523254394531]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 6.0, 3.0, 5.0, 8.0, 14.0, 10.0, 28.0, 39.0, 59.0, 104.0, 230.0, 464.0, 1294.0, 4355.0, 26271.0, 399355.0, 575381.0, 33314.0, 5115.0, 1422.0, 520.0, 238.0, 119.0, 62.0, 42.0, 32.0, 20.0, 9.0, 11.0, 6.0, 7.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.1015625, -4.960052490234375, -4.81854248046875, -4.677032470703125, -4.5355224609375, -4.394012451171875, -4.25250244140625, -4.110992431640625, -3.969482421875, -3.827972412109375, -3.68646240234375, -3.544952392578125, -3.4034423828125, -3.261932373046875, -3.12042236328125, -2.978912353515625, -2.83740234375, -2.695892333984375, -2.55438232421875, -2.412872314453125, -2.2713623046875, -2.129852294921875, -1.98834228515625, -1.846832275390625, -1.705322265625, -1.563812255859375, -1.42230224609375, -1.280792236328125, -1.1392822265625, -0.997772216796875, -0.85626220703125, -0.714752197265625, -0.5732421875, -0.431732177734375, -0.29022216796875, -0.148712158203125, -0.0072021484375, 0.134307861328125, 0.27581787109375, 0.417327880859375, 0.558837890625, 0.700347900390625, 0.84185791015625, 0.983367919921875, 1.1248779296875, 1.266387939453125, 1.40789794921875, 1.549407958984375, 1.69091796875, 1.832427978515625, 1.97393798828125, 2.115447998046875, 2.2569580078125, 2.398468017578125, 2.53997802734375, 2.681488037109375, 2.822998046875, 2.964508056640625, 3.10601806640625, 3.247528076171875, 3.3890380859375, 3.530548095703125, 3.67205810546875, 3.813568115234375, 3.955078125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 17.0, 35.0, 28.0, 45.0, 56.0, 62.0, 73.0, 100.0, 99.0, 113.0, 84.0, 71.0, 45.0, 47.0, 35.0, 21.0, 22.0, 8.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.15277099609375, -3.0242919921875, -2.89581298828125, -2.767333984375, -2.63885498046875, -2.5103759765625, -2.38189697265625, -2.25341796875, -2.12493896484375, -1.9964599609375, -1.86798095703125, -1.739501953125, -1.61102294921875, -1.4825439453125, -1.35406494140625, -1.2255859375, -1.09710693359375, -0.9686279296875, -0.84014892578125, -0.711669921875, -0.58319091796875, -0.4547119140625, -0.32623291015625, -0.19775390625, -0.06927490234375, 0.0592041015625, 0.18768310546875, 0.316162109375, 0.44464111328125, 0.5731201171875, 0.70159912109375, 0.830078125, 0.95855712890625, 1.0870361328125, 1.21551513671875, 1.343994140625, 1.47247314453125, 1.6009521484375, 1.72943115234375, 1.85791015625, 1.98638916015625, 2.1148681640625, 2.24334716796875, 2.371826171875, 2.50030517578125, 2.6287841796875, 2.75726318359375, 2.8857421875, 3.01422119140625, 3.1427001953125, 3.27117919921875, 3.399658203125, 3.52813720703125, 3.6566162109375, 3.78509521484375, 3.91357421875, 4.04205322265625, 4.1705322265625, 4.29901123046875, 4.427490234375, 4.55596923828125, 4.6844482421875, 4.81292724609375, 4.94140625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 12.0, 16.0, 54.0, 101.0, 148.0, 221.0, 187.0, 120.0, 58.0, 28.0, 17.0, 12.0, 7.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.37223815917969, -67.91392517089844, -65.45560455322266, -62.997291564941406, -60.53897476196289, -58.080657958984375, -55.622344970703125, -53.16402816772461, -50.705711364746094, -48.24739456176758, -45.78908157348633, -43.33076477050781, -40.8724479675293, -38.41413116455078, -35.95581817626953, -33.497501373291016, -31.039188385009766, -28.580873489379883, -26.122556686401367, -23.664241790771484, -21.20592498779297, -18.747610092163086, -16.289295196533203, -13.830978393554688, -11.372663497924805, -8.914347648620605, -6.4560322761535645, -3.9977169036865234, -1.5394010543823242, 0.918914794921875, 3.377229690551758, 5.835546493530273, 8.293861389160156, 10.752177238464355, 13.210493087768555, 15.668807983398438, 18.127124786376953, 20.585439682006836, 23.04375457763672, 25.502071380615234, 27.960386276245117, 30.418701171875, 32.877017974853516, 35.33533477783203, 37.79364776611328, 40.2519645690918, 42.71028137207031, 45.16859436035156, 47.62691116333008, 50.085227966308594, 52.543540954589844, 55.00185775756836, 57.460174560546875, 59.918487548828125, 62.37680435180664, 64.83512115478516, 67.2934341430664, 69.75174713134766, 72.21006774902344, 74.66838073730469, 77.12669372558594, 79.58501434326172, 82.04332733154297, 84.50164794921875, 86.9599609375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 4.0, 8.0, 2.0, 8.0, 13.0, 18.0, 14.0, 8.0, 26.0, 25.0, 27.0, 26.0, 33.0, 42.0, 30.0, 44.0, 36.0, 43.0, 54.0, 46.0, 54.0, 47.0, 53.0, 36.0, 35.0, 36.0, 29.0, 27.0, 30.0, 13.0, 21.0, 14.0, 19.0, 11.0, 12.0, 9.0, 6.0, 10.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-38.6396369934082, -37.434715270996094, -36.22979736328125, -35.02487564086914, -33.81995391845703, -32.61503219604492, -31.410112380981445, -30.20519256591797, -29.00027084350586, -27.79534912109375, -26.590429306030273, -25.385509490966797, -24.180587768554688, -22.975666046142578, -21.7707462310791, -20.565826416015625, -19.360904693603516, -18.155982971191406, -16.95106315612793, -15.746142387390137, -14.541221618652344, -13.33630084991455, -12.131380081176758, -10.926459312438965, -9.721538543701172, -8.516617774963379, -7.311697006225586, -6.106776237487793, -4.90185546875, -3.696934700012207, -2.492013931274414, -1.287093162536621, -0.08217620849609375, 1.1227445602416992, 2.327665328979492, 3.532586097717285, 4.737506866455078, 5.942427635192871, 7.147348403930664, 8.352269172668457, 9.55718994140625, 10.762110710144043, 11.967031478881836, 13.171952247619629, 14.376873016357422, 15.581793785095215, 16.786714553833008, 17.991634368896484, 19.196556091308594, 20.401477813720703, 21.60639762878418, 22.811317443847656, 24.016239166259766, 25.221160888671875, 26.42608070373535, 27.631000518798828, 28.835922241210938, 30.040843963623047, 31.245763778686523, 32.45068359375, 33.65560531616211, 34.86052703857422, 36.06544494628906, 37.27036666870117, 38.47528839111328]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 4.0, 6.0, 3.0, 12.0, 10.0, 14.0, 28.0, 27.0, 57.0, 88.0, 127.0, 227.0, 347.0, 639.0, 1210.0, 2231.0, 4367.0, 9172.0, 21649.0, 63123.0, 280219.0, 1704031.0, 1703465.0, 297035.0, 65839.0, 21883.0, 9246.0, 4316.0, 2223.0, 1132.0, 617.0, 372.0, 216.0, 110.0, 89.0, 51.0, 28.0, 26.0, 17.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0], "bins": [-3.310546875, -3.225677490234375, -3.14080810546875, -3.055938720703125, -2.9710693359375, -2.886199951171875, -2.80133056640625, -2.716461181640625, -2.631591796875, -2.546722412109375, -2.46185302734375, -2.376983642578125, -2.2921142578125, -2.207244873046875, -2.12237548828125, -2.037506103515625, -1.95263671875, -1.867767333984375, -1.78289794921875, -1.698028564453125, -1.6131591796875, -1.528289794921875, -1.44342041015625, -1.358551025390625, -1.273681640625, -1.188812255859375, -1.10394287109375, -1.019073486328125, -0.9342041015625, -0.849334716796875, -0.76446533203125, -0.679595947265625, -0.5947265625, -0.509857177734375, -0.42498779296875, -0.340118408203125, -0.2552490234375, -0.170379638671875, -0.08551025390625, -0.000640869140625, 0.084228515625, 0.169097900390625, 0.25396728515625, 0.338836669921875, 0.4237060546875, 0.508575439453125, 0.59344482421875, 0.678314208984375, 0.76318359375, 0.848052978515625, 0.93292236328125, 1.017791748046875, 1.1026611328125, 1.187530517578125, 1.27239990234375, 1.357269287109375, 1.442138671875, 1.527008056640625, 1.61187744140625, 1.696746826171875, 1.7816162109375, 1.866485595703125, 1.95135498046875, 2.036224365234375, 2.12109375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 10.0, 4.0, 16.0, 12.0, 16.0, 17.0, 19.0, 14.0, 32.0, 26.0, 21.0, 35.0, 32.0, 44.0, 46.0, 44.0, 35.0, 49.0, 58.0, 47.0, 49.0, 50.0, 37.0, 45.0, 34.0, 27.0, 29.0, 19.0, 28.0, 19.0, 12.0, 16.0, 9.0, 11.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.708984375, -1.642852783203125, -1.57672119140625, -1.510589599609375, -1.4444580078125, -1.378326416015625, -1.31219482421875, -1.246063232421875, -1.179931640625, -1.113800048828125, -1.04766845703125, -0.981536865234375, -0.9154052734375, -0.849273681640625, -0.78314208984375, -0.717010498046875, -0.65087890625, -0.584747314453125, -0.51861572265625, -0.452484130859375, -0.3863525390625, -0.320220947265625, -0.25408935546875, -0.187957763671875, -0.121826171875, -0.055694580078125, 0.01043701171875, 0.076568603515625, 0.1427001953125, 0.208831787109375, 0.27496337890625, 0.341094970703125, 0.4072265625, 0.473358154296875, 0.53948974609375, 0.605621337890625, 0.6717529296875, 0.737884521484375, 0.80401611328125, 0.870147705078125, 0.936279296875, 1.002410888671875, 1.06854248046875, 1.134674072265625, 1.2008056640625, 1.266937255859375, 1.33306884765625, 1.399200439453125, 1.46533203125, 1.531463623046875, 1.59759521484375, 1.663726806640625, 1.7298583984375, 1.795989990234375, 1.86212158203125, 1.928253173828125, 1.994384765625, 2.060516357421875, 2.12664794921875, 2.192779541015625, 2.2589111328125, 2.325042724609375, 2.39117431640625, 2.457305908203125, 2.5234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 14.0, 13.0, 19.0, 33.0, 28.0, 55.0, 85.0, 126.0, 193.0, 375.0, 728.0, 1579.0, 3799.0, 10193.0, 35871.0, 187886.0, 3011319.0, 832088.0, 79997.0, 18960.0, 6155.0, 2373.0, 1042.0, 527.0, 298.0, 182.0, 91.0, 64.0, 51.0, 28.0, 21.0, 22.0, 13.0, 12.0, 6.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.91796875, -5.7374267578125, -5.556884765625, -5.3763427734375, -5.19580078125, -5.0152587890625, -4.834716796875, -4.6541748046875, -4.4736328125, -4.2930908203125, -4.112548828125, -3.9320068359375, -3.75146484375, -3.5709228515625, -3.390380859375, -3.2098388671875, -3.029296875, -2.8487548828125, -2.668212890625, -2.4876708984375, -2.30712890625, -2.1265869140625, -1.946044921875, -1.7655029296875, -1.5849609375, -1.4044189453125, -1.223876953125, -1.0433349609375, -0.86279296875, -0.6822509765625, -0.501708984375, -0.3211669921875, -0.140625, 0.0399169921875, 0.220458984375, 0.4010009765625, 0.58154296875, 0.7620849609375, 0.942626953125, 1.1231689453125, 1.3037109375, 1.4842529296875, 1.664794921875, 1.8453369140625, 2.02587890625, 2.2064208984375, 2.386962890625, 2.5675048828125, 2.748046875, 2.9285888671875, 3.109130859375, 3.2896728515625, 3.47021484375, 3.6507568359375, 3.831298828125, 4.0118408203125, 4.1923828125, 4.3729248046875, 4.553466796875, 4.7340087890625, 4.91455078125, 5.0950927734375, 5.275634765625, 5.4561767578125, 5.63671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 5.0, 7.0, 8.0, 9.0, 15.0, 13.0, 21.0, 23.0, 36.0, 56.0, 70.0, 106.0, 165.0, 276.0, 460.0, 716.0, 780.0, 503.0, 282.0, 151.0, 95.0, 81.0, 52.0, 44.0, 20.0, 20.0, 6.0, 12.0, 8.0, 6.0, 3.0, 10.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9375, -5.740234375, -5.54296875, -5.345703125, -5.1484375, -4.951171875, -4.75390625, -4.556640625, -4.359375, -4.162109375, -3.96484375, -3.767578125, -3.5703125, -3.373046875, -3.17578125, -2.978515625, -2.78125, -2.583984375, -2.38671875, -2.189453125, -1.9921875, -1.794921875, -1.59765625, -1.400390625, -1.203125, -1.005859375, -0.80859375, -0.611328125, -0.4140625, -0.216796875, -0.01953125, 0.177734375, 0.375, 0.572265625, 0.76953125, 0.966796875, 1.1640625, 1.361328125, 1.55859375, 1.755859375, 1.953125, 2.150390625, 2.34765625, 2.544921875, 2.7421875, 2.939453125, 3.13671875, 3.333984375, 3.53125, 3.728515625, 3.92578125, 4.123046875, 4.3203125, 4.517578125, 4.71484375, 4.912109375, 5.109375, 5.306640625, 5.50390625, 5.701171875, 5.8984375, 6.095703125, 6.29296875, 6.490234375, 6.6875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 8.0, 12.0, 20.0, 88.0, 193.0, 289.0, 246.0, 88.0, 32.0, 11.0, 8.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.10240936279297, -63.84999465942383, -60.59757995605469, -57.34516143798828, -54.092750549316406, -50.84033203125, -47.58791732788086, -44.33550262451172, -41.08308792114258, -37.83067321777344, -34.5782585144043, -31.325841903686523, -28.073427200317383, -24.821012496948242, -21.56859588623047, -18.316181182861328, -15.063766479492188, -11.811351776123047, -8.55893611907959, -5.306520462036133, -2.054105758666992, 1.1983089447021484, 4.450725555419922, 7.7031402587890625, 10.955554962158203, 14.207969665527344, 17.460384368896484, 20.712800979614258, 23.9652156829834, 27.21763038635254, 30.470046997070312, 33.72246170043945, 36.97486877441406, 40.2272834777832, 43.479698181152344, 46.73211669921875, 49.984527587890625, 53.23694610595703, 56.48936080932617, 59.74177551269531, 62.99419021606445, 66.2466049194336, 69.4990234375, 72.75143432617188, 76.00385284423828, 79.25626373291016, 82.50868225097656, 85.76109313964844, 89.01351165771484, 92.26593017578125, 95.51834106445312, 98.77075958251953, 102.0231704711914, 105.27558898925781, 108.52799987792969, 111.7804183959961, 115.0328369140625, 118.2852554321289, 121.53766632080078, 124.79008483886719, 128.04249572753906, 131.29490661621094, 134.54733276367188, 137.79974365234375, 141.05215454101562]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 3.0, 3.0, 6.0, 8.0, 14.0, 9.0, 13.0, 26.0, 31.0, 38.0, 43.0, 41.0, 38.0, 45.0, 67.0, 62.0, 68.0, 58.0, 55.0, 48.0, 59.0, 40.0, 55.0, 37.0, 28.0, 23.0, 25.0, 20.0, 15.0, 7.0, 6.0, 7.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.968656539916992, -25.84511375427246, -24.72157096862793, -23.59803009033203, -22.4744873046875, -21.35094451904297, -20.227401733398438, -19.103858947753906, -17.980316162109375, -16.856773376464844, -15.733231544494629, -14.609688758850098, -13.486146926879883, -12.362604141235352, -11.23906135559082, -10.115518569946289, -8.99197769165039, -7.868435382843018, -6.7448930740356445, -5.621350288391113, -4.49780797958374, -3.374265670776367, -2.250722885131836, -1.127180576324463, -0.0036382675170898438, 1.1199041604995728, 2.2434465885162354, 3.3669891357421875, 4.4905314445495605, 5.614073753356934, 6.737616539001465, 7.861158847808838, 8.984699249267578, 10.10824203491211, 11.231783866882324, 12.355326652526855, 13.47886848449707, 14.602411270141602, 15.725954055786133, 16.849496841430664, 17.973037719726562, 19.096580505371094, 20.220123291015625, 21.343666076660156, 22.467206954956055, 23.590749740600586, 24.714292526245117, 25.83783531188965, 26.96137809753418, 28.08492088317871, 29.208463668823242, 30.33200454711914, 31.455547332763672, 32.5790901184082, 33.702632904052734, 34.826175689697266, 35.9497184753418, 37.07326126098633, 38.19680404663086, 39.32034683227539, 40.44388961791992, 41.56742858886719, 42.69097137451172, 43.81451416015625, 44.93805694580078]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 9.0, 8.0, 30.0, 46.0, 64.0, 98.0, 122.0, 194.0, 366.0, 505.0, 840.0, 1494.0, 2527.0, 4274.0, 7604.0, 13225.0, 23319.0, 40756.0, 70203.0, 116426.0, 179661.0, 206315.0, 153024.0, 94577.0, 56564.0, 32489.0, 18455.0, 10796.0, 6017.0, 3516.0, 2028.0, 1175.0, 667.0, 424.0, 262.0, 166.0, 105.0, 69.0, 46.0, 33.0, 22.0, 13.0, 8.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.31640625, -2.237335205078125, -2.15826416015625, -2.079193115234375, -2.0001220703125, -1.921051025390625, -1.84197998046875, -1.762908935546875, -1.683837890625, -1.604766845703125, -1.52569580078125, -1.446624755859375, -1.3675537109375, -1.288482666015625, -1.20941162109375, -1.130340576171875, -1.05126953125, -0.972198486328125, -0.89312744140625, -0.814056396484375, -0.7349853515625, -0.655914306640625, -0.57684326171875, -0.497772216796875, -0.418701171875, -0.339630126953125, -0.26055908203125, -0.181488037109375, -0.1024169921875, -0.023345947265625, 0.05572509765625, 0.134796142578125, 0.2138671875, 0.292938232421875, 0.37200927734375, 0.451080322265625, 0.5301513671875, 0.609222412109375, 0.68829345703125, 0.767364501953125, 0.846435546875, 0.925506591796875, 1.00457763671875, 1.083648681640625, 1.1627197265625, 1.241790771484375, 1.32086181640625, 1.399932861328125, 1.47900390625, 1.558074951171875, 1.63714599609375, 1.716217041015625, 1.7952880859375, 1.874359130859375, 1.95343017578125, 2.032501220703125, 2.111572265625, 2.190643310546875, 2.26971435546875, 2.348785400390625, 2.4278564453125, 2.506927490234375, 2.58599853515625, 2.665069580078125, 2.744140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 10.0, 10.0, 12.0, 12.0, 18.0, 26.0, 20.0, 28.0, 25.0, 31.0, 36.0, 28.0, 32.0, 39.0, 39.0, 41.0, 69.0, 50.0, 45.0, 57.0, 33.0, 41.0, 37.0, 35.0, 26.0, 33.0, 22.0, 31.0, 20.0, 15.0, 11.0, 14.0, 9.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.7544097900390625, -1.689483642578125, -1.6245574951171875, -1.55963134765625, -1.4947052001953125, -1.429779052734375, -1.3648529052734375, -1.2999267578125, -1.2350006103515625, -1.170074462890625, -1.1051483154296875, -1.04022216796875, -0.9752960205078125, -0.910369873046875, -0.8454437255859375, -0.780517578125, -0.7155914306640625, -0.650665283203125, -0.5857391357421875, -0.52081298828125, -0.4558868408203125, -0.390960693359375, -0.3260345458984375, -0.2611083984375, -0.1961822509765625, -0.131256103515625, -0.0663299560546875, -0.00140380859375, 0.0635223388671875, 0.128448486328125, 0.1933746337890625, 0.25830078125, 0.3232269287109375, 0.388153076171875, 0.4530792236328125, 0.51800537109375, 0.5829315185546875, 0.647857666015625, 0.7127838134765625, 0.7777099609375, 0.8426361083984375, 0.907562255859375, 0.9724884033203125, 1.03741455078125, 1.1023406982421875, 1.167266845703125, 1.2321929931640625, 1.297119140625, 1.3620452880859375, 1.426971435546875, 1.4918975830078125, 1.55682373046875, 1.6217498779296875, 1.686676025390625, 1.7516021728515625, 1.8165283203125, 1.8814544677734375, 1.946380615234375, 2.0113067626953125, 2.07623291015625, 2.1411590576171875, 2.206085205078125, 2.2710113525390625, 2.3359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 6.0, 4.0, 13.0, 17.0, 28.0, 35.0, 27.0, 51.0, 87.0, 106.0, 136.0, 206.0, 278.0, 466.0, 697.0, 1061.0, 1975.0, 4467.0, 14969.0, 70633.0, 452920.0, 407743.0, 68157.0, 14622.0, 4571.0, 1995.0, 1133.0, 690.0, 433.0, 280.0, 222.0, 151.0, 106.0, 76.0, 46.0, 41.0, 27.0, 27.0, 12.0, 11.0, 6.0, 6.0, 7.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-8.0390625, -7.809326171875, -7.57958984375, -7.349853515625, -7.1201171875, -6.890380859375, -6.66064453125, -6.430908203125, -6.201171875, -5.971435546875, -5.74169921875, -5.511962890625, -5.2822265625, -5.052490234375, -4.82275390625, -4.593017578125, -4.36328125, -4.133544921875, -3.90380859375, -3.674072265625, -3.4443359375, -3.214599609375, -2.98486328125, -2.755126953125, -2.525390625, -2.295654296875, -2.06591796875, -1.836181640625, -1.6064453125, -1.376708984375, -1.14697265625, -0.917236328125, -0.6875, -0.457763671875, -0.22802734375, 0.001708984375, 0.2314453125, 0.461181640625, 0.69091796875, 0.920654296875, 1.150390625, 1.380126953125, 1.60986328125, 1.839599609375, 2.0693359375, 2.299072265625, 2.52880859375, 2.758544921875, 2.98828125, 3.218017578125, 3.44775390625, 3.677490234375, 3.9072265625, 4.136962890625, 4.36669921875, 4.596435546875, 4.826171875, 5.055908203125, 5.28564453125, 5.515380859375, 5.7451171875, 5.974853515625, 6.20458984375, 6.434326171875, 6.6640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 3.0, 8.0, 6.0, 9.0, 6.0, 7.0, 10.0, 11.0, 22.0, 30.0, 20.0, 38.0, 27.0, 37.0, 42.0, 49.0, 61.0, 44.0, 47.0, 32.0, 35.0, 47.0, 59.0, 54.0, 38.0, 41.0, 32.0, 36.0, 26.0, 22.0, 20.0, 19.0, 6.0, 7.0, 12.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3209228515625, -9.032470703125, -8.7440185546875, -8.45556640625, -8.1671142578125, -7.878662109375, -7.5902099609375, -7.3017578125, -7.0133056640625, -6.724853515625, -6.4364013671875, -6.14794921875, -5.8594970703125, -5.571044921875, -5.2825927734375, -4.994140625, -4.7056884765625, -4.417236328125, -4.1287841796875, -3.84033203125, -3.5518798828125, -3.263427734375, -2.9749755859375, -2.6865234375, -2.3980712890625, -2.109619140625, -1.8211669921875, -1.53271484375, -1.2442626953125, -0.955810546875, -0.6673583984375, -0.37890625, -0.0904541015625, 0.197998046875, 0.4864501953125, 0.77490234375, 1.0633544921875, 1.351806640625, 1.6402587890625, 1.9287109375, 2.2171630859375, 2.505615234375, 2.7940673828125, 3.08251953125, 3.3709716796875, 3.659423828125, 3.9478759765625, 4.236328125, 4.5247802734375, 4.813232421875, 5.1016845703125, 5.39013671875, 5.6785888671875, 5.967041015625, 6.2554931640625, 6.5439453125, 6.8323974609375, 7.120849609375, 7.4093017578125, 7.69775390625, 7.9862060546875, 8.274658203125, 8.5631103515625, 8.8515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 17.0, 18.0, 22.0, 33.0, 42.0, 79.0, 130.0, 234.0, 475.0, 992.0, 2734.0, 11207.0, 104560.0, 826899.0, 86518.0, 9986.0, 2594.0, 912.0, 441.0, 254.0, 142.0, 59.0, 47.0, 38.0, 18.0, 21.0, 13.0, 11.0, 13.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.765625, -3.64202880859375, -3.5184326171875, -3.39483642578125, -3.271240234375, -3.14764404296875, -3.0240478515625, -2.90045166015625, -2.77685546875, -2.65325927734375, -2.5296630859375, -2.40606689453125, -2.282470703125, -2.15887451171875, -2.0352783203125, -1.91168212890625, -1.7880859375, -1.66448974609375, -1.5408935546875, -1.41729736328125, -1.293701171875, -1.17010498046875, -1.0465087890625, -0.92291259765625, -0.79931640625, -0.67572021484375, -0.5521240234375, -0.42852783203125, -0.304931640625, -0.18133544921875, -0.0577392578125, 0.06585693359375, 0.189453125, 0.31304931640625, 0.4366455078125, 0.56024169921875, 0.683837890625, 0.80743408203125, 0.9310302734375, 1.05462646484375, 1.17822265625, 1.30181884765625, 1.4254150390625, 1.54901123046875, 1.672607421875, 1.79620361328125, 1.9197998046875, 2.04339599609375, 2.1669921875, 2.29058837890625, 2.4141845703125, 2.53778076171875, 2.661376953125, 2.78497314453125, 2.9085693359375, 3.03216552734375, 3.15576171875, 3.27935791015625, 3.4029541015625, 3.52655029296875, 3.650146484375, 3.77374267578125, 3.8973388671875, 4.02093505859375, 4.14453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 12.0, 20.0, 23.0, 22.0, 43.0, 56.0, 81.0, 104.0, 119.0, 112.0, 106.0, 85.0, 54.0, 46.0, 31.0, 25.0, 21.0, 8.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006494522094726562, -0.0006244927644729614, -0.0005995333194732666, -0.0005745738744735718, -0.000549614429473877, -0.0005246549844741821, -0.0004996955394744873, -0.0004747360944747925, -0.00044977664947509766, -0.00042481720447540283, -0.000399857759475708, -0.0003748983144760132, -0.00034993886947631836, -0.00032497942447662354, -0.0003000199794769287, -0.0002750605344772339, -0.00025010108947753906, -0.00022514164447784424, -0.00020018219947814941, -0.0001752227544784546, -0.00015026330947875977, -0.00012530386447906494, -0.00010034441947937012, -7.538497447967529e-05, -5.042552947998047e-05, -2.5466084480285645e-05, -5.066394805908203e-07, 2.4452805519104004e-05, 4.941225051879883e-05, 7.437169551849365e-05, 9.933114051818848e-05, 0.0001242905855178833, 0.00014925003051757812, 0.00017420947551727295, 0.00019916892051696777, 0.0002241283655166626, 0.0002490878105163574, 0.00027404725551605225, 0.00029900670051574707, 0.0003239661455154419, 0.0003489255905151367, 0.00037388503551483154, 0.00039884448051452637, 0.0004238039255142212, 0.000448763370513916, 0.00047372281551361084, 0.0004986822605133057, 0.0005236417055130005, 0.0005486011505126953, 0.0005735605955123901, 0.000598520040512085, 0.0006234794855117798, 0.0006484389305114746, 0.0006733983755111694, 0.0006983578205108643, 0.0007233172655105591, 0.0007482767105102539, 0.0007732361555099487, 0.0007981956005096436, 0.0008231550455093384, 0.0008481144905090332, 0.000873073935508728, 0.0008980333805084229, 0.0009229928255081177, 0.0009479522705078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 6.0, 11.0, 15.0, 16.0, 20.0, 27.0, 52.0, 67.0, 84.0, 136.0, 213.0, 354.0, 566.0, 1332.0, 3052.0, 8918.0, 40982.0, 370515.0, 556236.0, 48977.0, 10332.0, 3463.0, 1398.0, 705.0, 386.0, 214.0, 140.0, 102.0, 63.0, 43.0, 29.0, 21.0, 16.0, 19.0, 11.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0], "bins": [-3.33203125, -3.2488250732421875, -3.165618896484375, -3.0824127197265625, -2.99920654296875, -2.9160003662109375, -2.832794189453125, -2.7495880126953125, -2.6663818359375, -2.5831756591796875, -2.499969482421875, -2.4167633056640625, -2.33355712890625, -2.2503509521484375, -2.167144775390625, -2.0839385986328125, -2.000732421875, -1.9175262451171875, -1.834320068359375, -1.7511138916015625, -1.66790771484375, -1.5847015380859375, -1.501495361328125, -1.4182891845703125, -1.3350830078125, -1.2518768310546875, -1.168670654296875, -1.0854644775390625, -1.00225830078125, -0.9190521240234375, -0.835845947265625, -0.7526397705078125, -0.66943359375, -0.5862274169921875, -0.503021240234375, -0.4198150634765625, -0.33660888671875, -0.2534027099609375, -0.170196533203125, -0.0869903564453125, -0.0037841796875, 0.0794219970703125, 0.162628173828125, 0.2458343505859375, 0.32904052734375, 0.4122467041015625, 0.495452880859375, 0.5786590576171875, 0.661865234375, 0.7450714111328125, 0.828277587890625, 0.9114837646484375, 0.99468994140625, 1.0778961181640625, 1.161102294921875, 1.2443084716796875, 1.3275146484375, 1.4107208251953125, 1.493927001953125, 1.5771331787109375, 1.66033935546875, 1.7435455322265625, 1.826751708984375, 1.9099578857421875, 1.9931640625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 5.0, 9.0, 3.0, 16.0, 9.0, 17.0, 23.0, 33.0, 41.0, 38.0, 43.0, 55.0, 61.0, 70.0, 67.0, 61.0, 66.0, 63.0, 49.0, 72.0, 38.0, 37.0, 27.0, 26.0, 18.0, 18.0, 8.0, 5.0, 8.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.900390625, -2.82208251953125, -2.7437744140625, -2.66546630859375, -2.587158203125, -2.50885009765625, -2.4305419921875, -2.35223388671875, -2.27392578125, -2.19561767578125, -2.1173095703125, -2.03900146484375, -1.960693359375, -1.88238525390625, -1.8040771484375, -1.72576904296875, -1.6474609375, -1.56915283203125, -1.4908447265625, -1.41253662109375, -1.334228515625, -1.25592041015625, -1.1776123046875, -1.09930419921875, -1.02099609375, -0.94268798828125, -0.8643798828125, -0.78607177734375, -0.707763671875, -0.62945556640625, -0.5511474609375, -0.47283935546875, -0.39453125, -0.31622314453125, -0.2379150390625, -0.15960693359375, -0.081298828125, -0.00299072265625, 0.0753173828125, 0.15362548828125, 0.23193359375, 0.31024169921875, 0.3885498046875, 0.46685791015625, 0.545166015625, 0.62347412109375, 0.7017822265625, 0.78009033203125, 0.8583984375, 0.93670654296875, 1.0150146484375, 1.09332275390625, 1.171630859375, 1.24993896484375, 1.3282470703125, 1.40655517578125, 1.48486328125, 1.56317138671875, 1.6414794921875, 1.71978759765625, 1.798095703125, 1.87640380859375, 1.9547119140625, 2.03302001953125, 2.111328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 39.0, 58.0, 134.0, 248.0, 276.0, 140.0, 48.0, 17.0, 11.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.76946258544922, -73.69979858398438, -70.63014221191406, -67.56047821044922, -64.49081420898438, -61.42115783691406, -58.35149383544922, -55.28183364868164, -52.21217346191406, -49.142513275146484, -46.07284927368164, -43.00318908691406, -39.933528900146484, -36.863868713378906, -33.79420471191406, -30.724544525146484, -27.65488052368164, -24.58521842956543, -21.51555824279785, -18.44589614868164, -15.376235008239746, -12.306573867797852, -9.23691177368164, -6.1672515869140625, -3.0975894927978516, -0.02792811393737793, 3.0417332649230957, 6.111394882202148, 9.181056022644043, 12.250717163085938, 15.320379257202148, 18.390039443969727, 21.459701538085938, 24.52936363220215, 27.599023818969727, 30.668685913085938, 33.738346099853516, 36.808006286621094, 39.87767028808594, 42.947330474853516, 46.016990661621094, 49.08665084838867, 52.156314849853516, 55.225975036621094, 58.29563522338867, 61.36529541015625, 64.4349594116211, 67.50462341308594, 70.57427978515625, 73.6439437866211, 76.7136001586914, 79.78326416015625, 82.8529281616211, 85.9225845336914, 88.99224853515625, 92.06190490722656, 95.13157653808594, 98.20124053955078, 101.2708969116211, 104.34056091308594, 107.41022491455078, 110.4798812866211, 113.54954528808594, 116.61920166015625, 119.6888656616211]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 11.0, 6.0, 9.0, 11.0, 24.0, 19.0, 27.0, 23.0, 24.0, 35.0, 37.0, 41.0, 42.0, 50.0, 59.0, 85.0, 79.0, 64.0, 63.0, 42.0, 45.0, 31.0, 33.0, 23.0, 20.0, 21.0, 11.0, 16.0, 15.0, 14.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.24934005737305, -39.95686340332031, -38.66438293457031, -37.37190628051758, -36.07942581176758, -34.786949157714844, -33.494468688964844, -32.20199203491211, -30.909513473510742, -29.617034912109375, -28.324556350708008, -27.03207778930664, -25.739601135253906, -24.447120666503906, -23.154644012451172, -21.862165451049805, -20.569686889648438, -19.27720832824707, -17.984729766845703, -16.692251205444336, -15.399773597717285, -14.107295036315918, -12.814817428588867, -11.5223388671875, -10.229860305786133, -8.937381744384766, -7.644903659820557, -6.352425575256348, -5.0599470138549805, -3.7674684524536133, -2.4749903678894043, -1.1825122833251953, 0.10996246337890625, 1.4024407863616943, 2.6949191093444824, 3.9873974323272705, 5.279875755310059, 6.572354316711426, 7.864832401275635, 9.157310485839844, 10.449789047241211, 11.742267608642578, 13.034746170043945, 14.327223777770996, 15.619702339172363, 16.912181854248047, 18.20465850830078, 19.49713706970215, 20.789615631103516, 22.082094192504883, 23.37457275390625, 24.667051315307617, 25.959529876708984, 27.25200653076172, 28.544485092163086, 29.836963653564453, 31.12944221496582, 32.42192077636719, 33.71439743041992, 35.00687789916992, 36.299354553222656, 37.591835021972656, 38.88431167602539, 40.176788330078125, 41.469268798828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 10.0, 16.0, 27.0, 60.0, 43.0, 85.0, 130.0, 202.0, 289.0, 474.0, 831.0, 1450.0, 2663.0, 5006.0, 9986.0, 22732.0, 60458.0, 220949.0, 1099094.0, 2050605.0, 529648.0, 120425.0, 37642.0, 15765.0, 7131.0, 3609.0, 1997.0, 1135.0, 663.0, 367.0, 286.0, 179.0, 99.0, 72.0, 42.0, 32.0, 20.0, 16.0, 13.0, 6.0, 8.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.82421875, -2.7418212890625, -2.659423828125, -2.5770263671875, -2.49462890625, -2.4122314453125, -2.329833984375, -2.2474365234375, -2.1650390625, -2.0826416015625, -2.000244140625, -1.9178466796875, -1.83544921875, -1.7530517578125, -1.670654296875, -1.5882568359375, -1.505859375, -1.4234619140625, -1.341064453125, -1.2586669921875, -1.17626953125, -1.0938720703125, -1.011474609375, -0.9290771484375, -0.8466796875, -0.7642822265625, -0.681884765625, -0.5994873046875, -0.51708984375, -0.4346923828125, -0.352294921875, -0.2698974609375, -0.1875, -0.1051025390625, -0.022705078125, 0.0596923828125, 0.14208984375, 0.2244873046875, 0.306884765625, 0.3892822265625, 0.4716796875, 0.5540771484375, 0.636474609375, 0.7188720703125, 0.80126953125, 0.8836669921875, 0.966064453125, 1.0484619140625, 1.130859375, 1.2132568359375, 1.295654296875, 1.3780517578125, 1.46044921875, 1.5428466796875, 1.625244140625, 1.7076416015625, 1.7900390625, 1.8724365234375, 1.954833984375, 2.0372314453125, 2.11962890625, 2.2020263671875, 2.284423828125, 2.3668212890625, 2.44921875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 6.0, 6.0, 2.0, 13.0, 8.0, 9.0, 10.0, 16.0, 19.0, 18.0, 22.0, 24.0, 24.0, 31.0, 32.0, 34.0, 45.0, 37.0, 37.0, 33.0, 43.0, 40.0, 53.0, 47.0, 40.0, 42.0, 34.0, 25.0, 20.0, 27.0, 28.0, 34.0, 20.0, 24.0, 17.0, 17.0, 11.0, 17.0, 7.0, 6.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.736328125, -1.67926025390625, -1.6221923828125, -1.56512451171875, -1.508056640625, -1.45098876953125, -1.3939208984375, -1.33685302734375, -1.27978515625, -1.22271728515625, -1.1656494140625, -1.10858154296875, -1.051513671875, -0.99444580078125, -0.9373779296875, -0.88031005859375, -0.8232421875, -0.76617431640625, -0.7091064453125, -0.65203857421875, -0.594970703125, -0.53790283203125, -0.4808349609375, -0.42376708984375, -0.36669921875, -0.30963134765625, -0.2525634765625, -0.19549560546875, -0.138427734375, -0.08135986328125, -0.0242919921875, 0.03277587890625, 0.08984375, 0.14691162109375, 0.2039794921875, 0.26104736328125, 0.318115234375, 0.37518310546875, 0.4322509765625, 0.48931884765625, 0.54638671875, 0.60345458984375, 0.6605224609375, 0.71759033203125, 0.774658203125, 0.83172607421875, 0.8887939453125, 0.94586181640625, 1.0029296875, 1.05999755859375, 1.1170654296875, 1.17413330078125, 1.231201171875, 1.28826904296875, 1.3453369140625, 1.40240478515625, 1.45947265625, 1.51654052734375, 1.5736083984375, 1.63067626953125, 1.687744140625, 1.74481201171875, 1.8018798828125, 1.85894775390625, 1.916015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 7.0, 0.0, 6.0, 9.0, 6.0, 17.0, 13.0, 19.0, 27.0, 45.0, 57.0, 95.0, 133.0, 229.0, 368.0, 706.0, 1392.0, 2983.0, 7870.0, 25697.0, 112717.0, 1446766.0, 2400701.0, 149808.0, 30226.0, 8500.0, 3053.0, 1265.0, 616.0, 365.0, 219.0, 124.0, 82.0, 48.0, 36.0, 27.0, 13.0, 11.0, 7.0, 4.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.01953125, -5.84796142578125, -5.6763916015625, -5.50482177734375, -5.333251953125, -5.16168212890625, -4.9901123046875, -4.81854248046875, -4.64697265625, -4.47540283203125, -4.3038330078125, -4.13226318359375, -3.960693359375, -3.78912353515625, -3.6175537109375, -3.44598388671875, -3.2744140625, -3.10284423828125, -2.9312744140625, -2.75970458984375, -2.588134765625, -2.41656494140625, -2.2449951171875, -2.07342529296875, -1.90185546875, -1.73028564453125, -1.5587158203125, -1.38714599609375, -1.215576171875, -1.04400634765625, -0.8724365234375, -0.70086669921875, -0.529296875, -0.35772705078125, -0.1861572265625, -0.01458740234375, 0.156982421875, 0.32855224609375, 0.5001220703125, 0.67169189453125, 0.84326171875, 1.01483154296875, 1.1864013671875, 1.35797119140625, 1.529541015625, 1.70111083984375, 1.8726806640625, 2.04425048828125, 2.2158203125, 2.38739013671875, 2.5589599609375, 2.73052978515625, 2.902099609375, 3.07366943359375, 3.2452392578125, 3.41680908203125, 3.58837890625, 3.75994873046875, 3.9315185546875, 4.10308837890625, 4.274658203125, 4.44622802734375, 4.6177978515625, 4.78936767578125, 4.9609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 12.0, 10.0, 12.0, 20.0, 24.0, 33.0, 50.0, 54.0, 94.0, 182.0, 306.0, 513.0, 883.0, 774.0, 447.0, 235.0, 120.0, 91.0, 48.0, 41.0, 27.0, 21.0, 25.0, 14.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.71160888671875, -5.4818115234375, -5.25201416015625, -5.022216796875, -4.79241943359375, -4.5626220703125, -4.33282470703125, -4.10302734375, -3.87322998046875, -3.6434326171875, -3.41363525390625, -3.183837890625, -2.95404052734375, -2.7242431640625, -2.49444580078125, -2.2646484375, -2.03485107421875, -1.8050537109375, -1.57525634765625, -1.345458984375, -1.11566162109375, -0.8858642578125, -0.65606689453125, -0.42626953125, -0.19647216796875, 0.0333251953125, 0.26312255859375, 0.492919921875, 0.72271728515625, 0.9525146484375, 1.18231201171875, 1.412109375, 1.64190673828125, 1.8717041015625, 2.10150146484375, 2.331298828125, 2.56109619140625, 2.7908935546875, 3.02069091796875, 3.25048828125, 3.48028564453125, 3.7100830078125, 3.93988037109375, 4.169677734375, 4.39947509765625, 4.6292724609375, 4.85906982421875, 5.0888671875, 5.31866455078125, 5.5484619140625, 5.77825927734375, 6.008056640625, 6.23785400390625, 6.4676513671875, 6.69744873046875, 6.92724609375, 7.15704345703125, 7.3868408203125, 7.61663818359375, 7.846435546875, 8.07623291015625, 8.3060302734375, 8.53582763671875, 8.765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 13.0, 26.0, 56.0, 109.0, 182.0, 224.0, 181.0, 98.0, 56.0, 19.0, 5.0, 5.0, 7.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.60877990722656, -88.32697296142578, -86.04515838623047, -83.76335144042969, -81.48153686523438, -79.1997299194336, -76.91792297363281, -74.6361083984375, -72.35430145263672, -70.07249450683594, -67.79067993164062, -65.50887298583984, -63.2270622253418, -60.94525146484375, -58.66344451904297, -56.38163375854492, -54.099822998046875, -51.81801223754883, -49.53620147705078, -47.25439453125, -44.97258377075195, -42.690773010253906, -40.408966064453125, -38.12715530395508, -35.84534454345703, -33.563533782958984, -31.28172492980957, -28.999916076660156, -26.71810531616211, -24.436294555664062, -22.15448570251465, -19.872676849365234, -17.590858459472656, -15.309048652648926, -13.027238845825195, -10.745429039001465, -8.463619232177734, -6.181809425354004, -3.8999996185302734, -1.618189811706543, 0.6636199951171875, 2.945429801940918, 5.227239608764648, 7.509049415588379, 9.79085922241211, 12.07266902923584, 14.35447883605957, 16.636287689208984, 18.91809844970703, 21.199909210205078, 23.481718063354492, 25.763526916503906, 28.045337677001953, 30.3271484375, 32.60895538330078, 34.89076614379883, 37.172576904296875, 39.45438766479492, 41.73619842529297, 44.01800537109375, 46.2998161315918, 48.581626892089844, 50.863433837890625, 53.14524459838867, 55.42705535888672]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 2.0, 6.0, 12.0, 18.0, 12.0, 15.0, 15.0, 25.0, 22.0, 38.0, 40.0, 32.0, 36.0, 38.0, 48.0, 48.0, 52.0, 54.0, 47.0, 52.0, 38.0, 46.0, 40.0, 33.0, 35.0, 26.0, 24.0, 21.0, 19.0, 17.0, 10.0, 14.0, 11.0, 7.0, 6.0, 9.0, 9.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.809492111206055, -28.851871490478516, -27.89425277709961, -26.936634063720703, -25.979013442993164, -25.021392822265625, -24.06377410888672, -23.106155395507812, -22.148534774780273, -21.190914154052734, -20.233295440673828, -19.275676727294922, -18.318056106567383, -17.360435485839844, -16.402816772460938, -15.445197105407715, -14.487577438354492, -13.52995777130127, -12.572338104248047, -11.614718437194824, -10.657098770141602, -9.699479103088379, -8.741859436035156, -7.784239768981934, -6.826620101928711, -5.869000434875488, -4.911380767822266, -3.953761100769043, -2.9961414337158203, -2.0385217666625977, -1.080902099609375, -0.12328243255615234, 0.8343353271484375, 1.7919549942016602, 2.749574661254883, 3.7071943283081055, 4.664813995361328, 5.622433662414551, 6.580053329467773, 7.537672996520996, 8.495292663574219, 9.452912330627441, 10.410531997680664, 11.368151664733887, 12.32577133178711, 13.283390998840332, 14.241010665893555, 15.198630332946777, 16.15625, 17.113868713378906, 18.071489334106445, 19.029109954833984, 19.98672866821289, 20.944347381591797, 21.901968002319336, 22.859588623046875, 23.81720733642578, 24.774826049804688, 25.732446670532227, 26.690067291259766, 27.647686004638672, 28.605304718017578, 29.562925338745117, 30.520545959472656, 31.478164672851562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 10.0, 14.0, 27.0, 36.0, 36.0, 65.0, 95.0, 108.0, 199.0, 261.0, 402.0, 601.0, 887.0, 1279.0, 1930.0, 3016.0, 4776.0, 7797.0, 12091.0, 19917.0, 32504.0, 53498.0, 86309.0, 138731.0, 196898.0, 179528.0, 117306.0, 72577.0, 44645.0, 27455.0, 16824.0, 10410.0, 6509.0, 4144.0, 2563.0, 1628.0, 1115.0, 757.0, 495.0, 347.0, 232.0, 155.0, 122.0, 80.0, 47.0, 51.0, 28.0, 20.0, 12.0, 11.0, 6.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.443359375, -2.3665771484375, -2.289794921875, -2.2130126953125, -2.13623046875, -2.0594482421875, -1.982666015625, -1.9058837890625, -1.8291015625, -1.7523193359375, -1.675537109375, -1.5987548828125, -1.52197265625, -1.4451904296875, -1.368408203125, -1.2916259765625, -1.21484375, -1.1380615234375, -1.061279296875, -0.9844970703125, -0.90771484375, -0.8309326171875, -0.754150390625, -0.6773681640625, -0.6005859375, -0.5238037109375, -0.447021484375, -0.3702392578125, -0.29345703125, -0.2166748046875, -0.139892578125, -0.0631103515625, 0.013671875, 0.0904541015625, 0.167236328125, 0.2440185546875, 0.32080078125, 0.3975830078125, 0.474365234375, 0.5511474609375, 0.6279296875, 0.7047119140625, 0.781494140625, 0.8582763671875, 0.93505859375, 1.0118408203125, 1.088623046875, 1.1654052734375, 1.2421875, 1.3189697265625, 1.395751953125, 1.4725341796875, 1.54931640625, 1.6260986328125, 1.702880859375, 1.7796630859375, 1.8564453125, 1.9332275390625, 2.010009765625, 2.0867919921875, 2.16357421875, 2.2403564453125, 2.317138671875, 2.3939208984375, 2.470703125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 3.0, 7.0, 12.0, 11.0, 18.0, 24.0, 23.0, 18.0, 32.0, 25.0, 23.0, 37.0, 33.0, 27.0, 46.0, 47.0, 46.0, 49.0, 47.0, 57.0, 39.0, 44.0, 34.0, 38.0, 32.0, 31.0, 26.0, 28.0, 28.0, 18.0, 15.0, 14.0, 13.0, 12.0, 6.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.88671875, -1.821197509765625, -1.75567626953125, -1.690155029296875, -1.6246337890625, -1.559112548828125, -1.49359130859375, -1.428070068359375, -1.362548828125, -1.297027587890625, -1.23150634765625, -1.165985107421875, -1.1004638671875, -1.034942626953125, -0.96942138671875, -0.903900146484375, -0.83837890625, -0.772857666015625, -0.70733642578125, -0.641815185546875, -0.5762939453125, -0.510772705078125, -0.44525146484375, -0.379730224609375, -0.314208984375, -0.248687744140625, -0.18316650390625, -0.117645263671875, -0.0521240234375, 0.013397216796875, 0.07891845703125, 0.144439697265625, 0.2099609375, 0.275482177734375, 0.34100341796875, 0.406524658203125, 0.4720458984375, 0.537567138671875, 0.60308837890625, 0.668609619140625, 0.734130859375, 0.799652099609375, 0.86517333984375, 0.930694580078125, 0.9962158203125, 1.061737060546875, 1.12725830078125, 1.192779541015625, 1.25830078125, 1.323822021484375, 1.38934326171875, 1.454864501953125, 1.5203857421875, 1.585906982421875, 1.65142822265625, 1.716949462890625, 1.782470703125, 1.847991943359375, 1.91351318359375, 1.979034423828125, 2.0445556640625, 2.110076904296875, 2.17559814453125, 2.241119384765625, 2.306640625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 12.0, 8.0, 21.0, 17.0, 22.0, 41.0, 55.0, 82.0, 97.0, 143.0, 216.0, 296.0, 438.0, 665.0, 1362.0, 2640.0, 7109.0, 27737.0, 151381.0, 663978.0, 151650.0, 27445.0, 7111.0, 2580.0, 1225.0, 757.0, 423.0, 315.0, 202.0, 159.0, 102.0, 71.0, 44.0, 33.0, 18.0, 23.0, 27.0, 13.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.703125, -7.4505615234375, -7.197998046875, -6.9454345703125, -6.69287109375, -6.4403076171875, -6.187744140625, -5.9351806640625, -5.6826171875, -5.4300537109375, -5.177490234375, -4.9249267578125, -4.67236328125, -4.4197998046875, -4.167236328125, -3.9146728515625, -3.662109375, -3.4095458984375, -3.156982421875, -2.9044189453125, -2.65185546875, -2.3992919921875, -2.146728515625, -1.8941650390625, -1.6416015625, -1.3890380859375, -1.136474609375, -0.8839111328125, -0.63134765625, -0.3787841796875, -0.126220703125, 0.1263427734375, 0.37890625, 0.6314697265625, 0.884033203125, 1.1365966796875, 1.38916015625, 1.6417236328125, 1.894287109375, 2.1468505859375, 2.3994140625, 2.6519775390625, 2.904541015625, 3.1571044921875, 3.40966796875, 3.6622314453125, 3.914794921875, 4.1673583984375, 4.419921875, 4.6724853515625, 4.925048828125, 5.1776123046875, 5.43017578125, 5.6827392578125, 5.935302734375, 6.1878662109375, 6.4404296875, 6.6929931640625, 6.945556640625, 7.1981201171875, 7.45068359375, 7.7032470703125, 7.955810546875, 8.2083740234375, 8.4609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 10.0, 12.0, 13.0, 10.0, 11.0, 30.0, 22.0, 21.0, 29.0, 33.0, 36.0, 45.0, 37.0, 40.0, 46.0, 44.0, 45.0, 50.0, 41.0, 46.0, 43.0, 39.0, 32.0, 40.0, 34.0, 27.0, 22.0, 19.0, 10.0, 25.0, 12.0, 11.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.671875, -8.4130859375, -8.154296875, -7.8955078125, -7.63671875, -7.3779296875, -7.119140625, -6.8603515625, -6.6015625, -6.3427734375, -6.083984375, -5.8251953125, -5.56640625, -5.3076171875, -5.048828125, -4.7900390625, -4.53125, -4.2724609375, -4.013671875, -3.7548828125, -3.49609375, -3.2373046875, -2.978515625, -2.7197265625, -2.4609375, -2.2021484375, -1.943359375, -1.6845703125, -1.42578125, -1.1669921875, -0.908203125, -0.6494140625, -0.390625, -0.1318359375, 0.126953125, 0.3857421875, 0.64453125, 0.9033203125, 1.162109375, 1.4208984375, 1.6796875, 1.9384765625, 2.197265625, 2.4560546875, 2.71484375, 2.9736328125, 3.232421875, 3.4912109375, 3.75, 4.0087890625, 4.267578125, 4.5263671875, 4.78515625, 5.0439453125, 5.302734375, 5.5615234375, 5.8203125, 6.0791015625, 6.337890625, 6.5966796875, 6.85546875, 7.1142578125, 7.373046875, 7.6318359375, 7.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 2.0, 7.0, 7.0, 10.0, 11.0, 22.0, 33.0, 54.0, 100.0, 209.0, 443.0, 1286.0, 5292.0, 44436.0, 687968.0, 282725.0, 21314.0, 3080.0, 857.0, 348.0, 141.0, 75.0, 40.0, 25.0, 21.0, 13.0, 13.0, 2.0, 7.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.852294921875, -2.75341796875, -2.654541015625, -2.5556640625, -2.456787109375, -2.35791015625, -2.259033203125, -2.16015625, -2.061279296875, -1.96240234375, -1.863525390625, -1.7646484375, -1.665771484375, -1.56689453125, -1.468017578125, -1.369140625, -1.270263671875, -1.17138671875, -1.072509765625, -0.9736328125, -0.874755859375, -0.77587890625, -0.677001953125, -0.578125, -0.479248046875, -0.38037109375, -0.281494140625, -0.1826171875, -0.083740234375, 0.01513671875, 0.114013671875, 0.212890625, 0.311767578125, 0.41064453125, 0.509521484375, 0.6083984375, 0.707275390625, 0.80615234375, 0.905029296875, 1.00390625, 1.102783203125, 1.20166015625, 1.300537109375, 1.3994140625, 1.498291015625, 1.59716796875, 1.696044921875, 1.794921875, 1.893798828125, 1.99267578125, 2.091552734375, 2.1904296875, 2.289306640625, 2.38818359375, 2.487060546875, 2.5859375, 2.684814453125, 2.78369140625, 2.882568359375, 2.9814453125, 3.080322265625, 3.17919921875, 3.278076171875, 3.376953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 2.0, 8.0, 11.0, 10.0, 23.0, 22.0, 25.0, 25.0, 37.0, 34.0, 56.0, 64.0, 70.0, 64.0, 88.0, 80.0, 63.0, 76.0, 43.0, 39.0, 40.0, 26.0, 20.0, 8.0, 14.0, 14.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-0.00061798095703125, -0.00060218945145607, -0.0005863979458808899, -0.0005706064403057098, -0.0005548149347305298, -0.0005390234291553497, -0.0005232319235801697, -0.0005074404180049896, -0.0004916489124298096, -0.0004758574068546295, -0.00046006590127944946, -0.0004442743957042694, -0.00042848289012908936, -0.0004126913845539093, -0.00039689987897872925, -0.0003811083734035492, -0.00036531686782836914, -0.0003495253622531891, -0.00033373385667800903, -0.000317942351102829, -0.0003021508455276489, -0.00028635933995246887, -0.0002705678343772888, -0.00025477632880210876, -0.0002389848232269287, -0.00022319331765174866, -0.0002074018120765686, -0.00019161030650138855, -0.0001758188009262085, -0.00016002729535102844, -0.0001442357897758484, -0.00012844428420066833, -0.00011265277862548828, -9.686127305030823e-05, -8.106976747512817e-05, -6.527826189994812e-05, -4.9486756324768066e-05, -3.369525074958801e-05, -1.790374517440796e-05, -2.1122395992279053e-06, 1.3679265975952148e-05, 2.9470771551132202e-05, 4.5262277126312256e-05, 6.105378270149231e-05, 7.684528827667236e-05, 9.263679385185242e-05, 0.00010842829942703247, 0.00012421980500221252, 0.00014001131057739258, 0.00015580281615257263, 0.00017159432172775269, 0.00018738582730293274, 0.0002031773328781128, 0.00021896883845329285, 0.0002347603440284729, 0.00025055184960365295, 0.000266343355178833, 0.00028213486075401306, 0.0002979263663291931, 0.00031371787190437317, 0.0003295093774795532, 0.0003453008830547333, 0.00036109238862991333, 0.0003768838942050934, 0.00039267539978027344]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 13.0, 14.0, 19.0, 18.0, 19.0, 40.0, 68.0, 86.0, 122.0, 209.0, 376.0, 586.0, 1094.0, 2354.0, 6404.0, 24411.0, 136601.0, 629740.0, 197882.0, 34418.0, 8182.0, 2742.0, 1299.0, 677.0, 434.0, 252.0, 146.0, 106.0, 65.0, 57.0, 25.0, 20.0, 25.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0], "bins": [-2.068359375, -2.0118560791015625, -1.955352783203125, -1.8988494873046875, -1.84234619140625, -1.7858428955078125, -1.729339599609375, -1.6728363037109375, -1.6163330078125, -1.5598297119140625, -1.503326416015625, -1.4468231201171875, -1.39031982421875, -1.3338165283203125, -1.277313232421875, -1.2208099365234375, -1.164306640625, -1.1078033447265625, -1.051300048828125, -0.9947967529296875, -0.93829345703125, -0.8817901611328125, -0.825286865234375, -0.7687835693359375, -0.7122802734375, -0.6557769775390625, -0.599273681640625, -0.5427703857421875, -0.48626708984375, -0.4297637939453125, -0.373260498046875, -0.3167572021484375, -0.26025390625, -0.2037506103515625, -0.147247314453125, -0.0907440185546875, -0.03424072265625, 0.0222625732421875, 0.078765869140625, 0.1352691650390625, 0.1917724609375, 0.2482757568359375, 0.304779052734375, 0.3612823486328125, 0.41778564453125, 0.4742889404296875, 0.530792236328125, 0.5872955322265625, 0.643798828125, 0.7003021240234375, 0.756805419921875, 0.8133087158203125, 0.86981201171875, 0.9263153076171875, 0.982818603515625, 1.0393218994140625, 1.0958251953125, 1.1523284912109375, 1.208831787109375, 1.2653350830078125, 1.32183837890625, 1.3783416748046875, 1.434844970703125, 1.4913482666015625, 1.5478515625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 7.0, 7.0, 14.0, 22.0, 19.0, 24.0, 42.0, 46.0, 58.0, 72.0, 74.0, 84.0, 84.0, 77.0, 64.0, 66.0, 41.0, 46.0, 31.0, 30.0, 19.0, 24.0, 16.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.03125, -1.963592529296875, -1.89593505859375, -1.828277587890625, -1.7606201171875, -1.692962646484375, -1.62530517578125, -1.557647705078125, -1.489990234375, -1.422332763671875, -1.35467529296875, -1.287017822265625, -1.2193603515625, -1.151702880859375, -1.08404541015625, -1.016387939453125, -0.94873046875, -0.881072998046875, -0.81341552734375, -0.745758056640625, -0.6781005859375, -0.610443115234375, -0.54278564453125, -0.475128173828125, -0.407470703125, -0.339813232421875, -0.27215576171875, -0.204498291015625, -0.1368408203125, -0.069183349609375, -0.00152587890625, 0.066131591796875, 0.1337890625, 0.201446533203125, 0.26910400390625, 0.336761474609375, 0.4044189453125, 0.472076416015625, 0.53973388671875, 0.607391357421875, 0.675048828125, 0.742706298828125, 0.81036376953125, 0.878021240234375, 0.9456787109375, 1.013336181640625, 1.08099365234375, 1.148651123046875, 1.21630859375, 1.283966064453125, 1.35162353515625, 1.419281005859375, 1.4869384765625, 1.554595947265625, 1.62225341796875, 1.689910888671875, 1.757568359375, 1.825225830078125, 1.89288330078125, 1.960540771484375, 2.0281982421875, 2.095855712890625, 2.16351318359375, 2.231170654296875, 2.298828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 13.0, 43.0, 87.0, 185.0, 329.0, 170.0, 98.0, 32.0, 22.0, 9.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.013771057128906, -39.45927047729492, -36.90476989746094, -34.35026931762695, -31.79576873779297, -29.241268157958984, -26.686769485473633, -24.13226890563965, -21.577768325805664, -19.02326774597168, -16.468767166137695, -13.914267539978027, -11.359766960144043, -8.805266380310059, -6.250766754150391, -3.6962661743164062, -1.1417655944824219, 1.4127347469329834, 3.9672350883483887, 6.521735191345215, 9.0762357711792, 11.630736351013184, 14.185235977172852, 16.739736557006836, 19.29423713684082, 21.848737716674805, 24.40323829650879, 26.95773696899414, 29.512237548828125, 32.06673812866211, 34.621238708496094, 37.17573928833008, 39.73023986816406, 42.28474044799805, 44.83924102783203, 47.393741607666016, 49.9482421875, 52.502742767333984, 55.05724334716797, 57.61174011230469, 60.16624450683594, 62.72074508666992, 65.2752456665039, 67.82974243164062, 70.38424682617188, 72.9387435913086, 75.49324798583984, 78.04774475097656, 80.60224914550781, 83.15674591064453, 85.71125030517578, 88.2657470703125, 90.82025146484375, 93.37474822998047, 95.92925262451172, 98.48374938964844, 101.03824615478516, 103.59274291992188, 106.14724731445312, 108.70174407958984, 111.2562484741211, 113.81074523925781, 116.36524963378906, 118.91974639892578, 121.47425079345703]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 8.0, 6.0, 10.0, 12.0, 16.0, 22.0, 17.0, 14.0, 29.0, 19.0, 27.0, 23.0, 39.0, 32.0, 58.0, 57.0, 74.0, 74.0, 70.0, 57.0, 35.0, 27.0, 30.0, 21.0, 35.0, 23.0, 23.0, 22.0, 11.0, 25.0, 14.0, 14.0, 10.0, 5.0, 5.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.208620071411133, -28.090166091918945, -26.971712112426758, -25.853260040283203, -24.734806060791016, -23.616352081298828, -22.49789810180664, -21.379444122314453, -20.260990142822266, -19.142536163330078, -18.02408218383789, -16.905628204345703, -15.787176132202148, -14.668722152709961, -13.550268173217773, -12.431814193725586, -11.313362121582031, -10.194908142089844, -9.076455116271973, -7.958001136779785, -6.839547634124756, -5.721094131469727, -4.602640151977539, -3.4841866493225098, -2.3657331466674805, -1.2472795248031616, -0.12882590293884277, 0.9896278381347656, 2.108081340789795, 3.226534843444824, 4.344988822937012, 5.463442325592041, 6.581897735595703, 7.700351238250732, 8.818804740905762, 9.93725872039795, 11.05571174621582, 12.174165725708008, 13.292619705200195, 14.411073684692383, 15.529526710510254, 16.647979736328125, 17.766433715820312, 18.8848876953125, 20.003341674804688, 21.121795654296875, 22.240249633789062, 23.358701705932617, 24.477155685424805, 25.595609664916992, 26.71406364440918, 27.832515716552734, 28.950969696044922, 30.06942367553711, 31.187877655029297, 32.306331634521484, 33.42478561401367, 34.54323959350586, 35.66169357299805, 36.780147552490234, 37.89860153198242, 39.017051696777344, 40.13550567626953, 41.25395965576172, 42.372413635253906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 7.0, 12.0, 10.0, 23.0, 21.0, 40.0, 36.0, 57.0, 89.0, 116.0, 175.0, 302.0, 411.0, 700.0, 1258.0, 2065.0, 4104.0, 8281.0, 19068.0, 55098.0, 199591.0, 816033.0, 1932890.0, 849982.0, 210382.0, 56008.0, 19383.0, 8455.0, 4236.0, 2175.0, 1248.0, 724.0, 411.0, 264.0, 185.0, 125.0, 101.0, 68.0, 49.0, 21.0, 25.0, 16.0, 9.0, 14.0, 8.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8740234375, -1.8083038330078125, -1.742584228515625, -1.6768646240234375, -1.61114501953125, -1.5454254150390625, -1.479705810546875, -1.4139862060546875, -1.3482666015625, -1.2825469970703125, -1.216827392578125, -1.1511077880859375, -1.08538818359375, -1.0196685791015625, -0.953948974609375, -0.8882293701171875, -0.822509765625, -0.7567901611328125, -0.691070556640625, -0.6253509521484375, -0.55963134765625, -0.4939117431640625, -0.428192138671875, -0.3624725341796875, -0.2967529296875, -0.2310333251953125, -0.165313720703125, -0.0995941162109375, -0.03387451171875, 0.0318450927734375, 0.097564697265625, 0.1632843017578125, 0.22900390625, 0.2947235107421875, 0.360443115234375, 0.4261627197265625, 0.49188232421875, 0.5576019287109375, 0.623321533203125, 0.6890411376953125, 0.7547607421875, 0.8204803466796875, 0.886199951171875, 0.9519195556640625, 1.01763916015625, 1.0833587646484375, 1.149078369140625, 1.2147979736328125, 1.280517578125, 1.3462371826171875, 1.411956787109375, 1.4776763916015625, 1.54339599609375, 1.6091156005859375, 1.674835205078125, 1.7405548095703125, 1.8062744140625, 1.8719940185546875, 1.937713623046875, 2.0034332275390625, 2.06915283203125, 2.1348724365234375, 2.200592041015625, 2.2663116455078125, 2.33203125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 6.0, 4.0, 5.0, 9.0, 9.0, 15.0, 15.0, 18.0, 11.0, 24.0, 20.0, 25.0, 23.0, 33.0, 44.0, 43.0, 43.0, 51.0, 35.0, 42.0, 36.0, 45.0, 39.0, 49.0, 43.0, 33.0, 32.0, 34.0, 36.0, 33.0, 24.0, 22.0, 17.0, 15.0, 17.0, 10.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9111328125, -1.850738525390625, -1.79034423828125, -1.729949951171875, -1.6695556640625, -1.609161376953125, -1.54876708984375, -1.488372802734375, -1.427978515625, -1.367584228515625, -1.30718994140625, -1.246795654296875, -1.1864013671875, -1.126007080078125, -1.06561279296875, -1.005218505859375, -0.94482421875, -0.884429931640625, -0.82403564453125, -0.763641357421875, -0.7032470703125, -0.642852783203125, -0.58245849609375, -0.522064208984375, -0.461669921875, -0.401275634765625, -0.34088134765625, -0.280487060546875, -0.2200927734375, -0.159698486328125, -0.09930419921875, -0.038909912109375, 0.021484375, 0.081878662109375, 0.14227294921875, 0.202667236328125, 0.2630615234375, 0.323455810546875, 0.38385009765625, 0.444244384765625, 0.504638671875, 0.565032958984375, 0.62542724609375, 0.685821533203125, 0.7462158203125, 0.806610107421875, 0.86700439453125, 0.927398681640625, 0.98779296875, 1.048187255859375, 1.10858154296875, 1.168975830078125, 1.2293701171875, 1.289764404296875, 1.35015869140625, 1.410552978515625, 1.470947265625, 1.531341552734375, 1.59173583984375, 1.652130126953125, 1.7125244140625, 1.772918701171875, 1.83331298828125, 1.893707275390625, 1.9541015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 15.0, 15.0, 16.0, 38.0, 60.0, 87.0, 146.0, 264.0, 700.0, 3323.0, 33627.0, 3718555.0, 424765.0, 10185.0, 1583.0, 506.0, 184.0, 99.0, 46.0, 23.0, 20.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.783447265625, -12.42626953125, -12.069091796875, -11.7119140625, -11.354736328125, -10.99755859375, -10.640380859375, -10.283203125, -9.926025390625, -9.56884765625, -9.211669921875, -8.8544921875, -8.497314453125, -8.14013671875, -7.782958984375, -7.42578125, -7.068603515625, -6.71142578125, -6.354248046875, -5.9970703125, -5.639892578125, -5.28271484375, -4.925537109375, -4.568359375, -4.211181640625, -3.85400390625, -3.496826171875, -3.1396484375, -2.782470703125, -2.42529296875, -2.068115234375, -1.7109375, -1.353759765625, -0.99658203125, -0.639404296875, -0.2822265625, 0.074951171875, 0.43212890625, 0.789306640625, 1.146484375, 1.503662109375, 1.86083984375, 2.218017578125, 2.5751953125, 2.932373046875, 3.28955078125, 3.646728515625, 4.00390625, 4.361083984375, 4.71826171875, 5.075439453125, 5.4326171875, 5.789794921875, 6.14697265625, 6.504150390625, 6.861328125, 7.218505859375, 7.57568359375, 7.932861328125, 8.2900390625, 8.647216796875, 9.00439453125, 9.361572265625, 9.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 18.0, 36.0, 52.0, 99.0, 174.0, 366.0, 886.0, 1184.0, 652.0, 282.0, 131.0, 75.0, 45.0, 24.0, 12.0, 10.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -12.072509765625, -11.79345703125, -11.514404296875, -11.2353515625, -10.956298828125, -10.67724609375, -10.398193359375, -10.119140625, -9.840087890625, -9.56103515625, -9.281982421875, -9.0029296875, -8.723876953125, -8.44482421875, -8.165771484375, -7.88671875, -7.607666015625, -7.32861328125, -7.049560546875, -6.7705078125, -6.491455078125, -6.21240234375, -5.933349609375, -5.654296875, -5.375244140625, -5.09619140625, -4.817138671875, -4.5380859375, -4.259033203125, -3.97998046875, -3.700927734375, -3.421875, -3.142822265625, -2.86376953125, -2.584716796875, -2.3056640625, -2.026611328125, -1.74755859375, -1.468505859375, -1.189453125, -0.910400390625, -0.63134765625, -0.352294921875, -0.0732421875, 0.205810546875, 0.48486328125, 0.763916015625, 1.04296875, 1.322021484375, 1.60107421875, 1.880126953125, 2.1591796875, 2.438232421875, 2.71728515625, 2.996337890625, 3.275390625, 3.554443359375, 3.83349609375, 4.112548828125, 4.3916015625, 4.670654296875, 4.94970703125, 5.228759765625, 5.5078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 5.0, 18.0, 27.0, 48.0, 80.0, 140.0, 183.0, 166.0, 136.0, 83.0, 40.0, 21.0, 13.0, 10.0, 4.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.324188232421875, -41.77286911010742, -40.221553802490234, -38.67023468017578, -37.118919372558594, -35.56760025024414, -34.01628112792969, -32.4649658203125, -30.913646697998047, -29.362329483032227, -27.811012268066406, -26.259693145751953, -24.708375930786133, -23.157058715820312, -21.60573959350586, -20.05442237854004, -18.50310516357422, -16.9517879486084, -15.400469779968262, -13.849151611328125, -12.297834396362305, -10.746517181396484, -9.195199012756348, -7.643880844116211, -6.092563629150391, -4.541245937347412, -2.9899282455444336, -1.438610553741455, 0.11270713806152344, 1.664024829864502, 3.2153425216674805, 4.766660690307617, 6.317981719970703, 7.869299411773682, 9.42061710357666, 10.971935272216797, 12.523252487182617, 14.074569702148438, 15.625887870788574, 17.17720603942871, 18.72852325439453, 20.27984046936035, 21.831157684326172, 23.382476806640625, 24.933794021606445, 26.485111236572266, 28.03643035888672, 29.58774757385254, 31.13906478881836, 32.69038391113281, 34.24169921875, 35.79301834106445, 37.344337463378906, 38.895652770996094, 40.44697189331055, 41.998291015625, 43.54960632324219, 45.10092544555664, 46.65224075317383, 48.20355987548828, 49.75487518310547, 51.30619430541992, 52.857513427734375, 54.40882873535156, 55.960147857666016]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 6.0, 10.0, 10.0, 14.0, 23.0, 22.0, 32.0, 24.0, 32.0, 29.0, 36.0, 45.0, 56.0, 44.0, 47.0, 47.0, 41.0, 49.0, 55.0, 47.0, 33.0, 43.0, 27.0, 39.0, 19.0, 31.0, 19.0, 16.0, 24.0, 25.0, 18.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.42144012451172, -25.6193790435791, -24.81731605529785, -24.015254974365234, -23.213191986083984, -22.411130905151367, -21.609067916870117, -20.8070068359375, -20.00494384765625, -19.202882766723633, -18.400819778442383, -17.598758697509766, -16.796695709228516, -15.994634628295898, -15.192571640014648, -14.390510559082031, -13.588448524475098, -12.786386489868164, -11.98432445526123, -11.182262420654297, -10.380200386047363, -9.57813835144043, -8.776077270507812, -7.974014759063721, -7.171952724456787, -6.3698906898498535, -5.56782865524292, -4.7657670974731445, -3.963704824447632, -3.1616430282592773, -2.3595809936523438, -1.5575189590454102, -0.7554569244384766, 0.046605050563812256, 0.8486670255661011, 1.6507289409637451, 2.4527909755706787, 3.254852771759033, 4.056914806365967, 4.8589768409729, 5.661038875579834, 6.463100910186768, 7.265162944793701, 8.067224502563477, 8.86928653717041, 9.671348571777344, 10.473410606384277, 11.275472640991211, 12.077534675598145, 12.879596710205078, 13.681658744812012, 14.483720779418945, 15.285782814025879, 16.087844848632812, 16.88990592956543, 17.69196891784668, 18.494029998779297, 19.296091079711914, 20.098154067993164, 20.90021514892578, 21.70227813720703, 22.50433921813965, 23.3064022064209, 24.108463287353516, 24.910526275634766]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 6.0, 6.0, 8.0, 18.0, 21.0, 33.0, 33.0, 60.0, 111.0, 96.0, 160.0, 225.0, 305.0, 467.0, 726.0, 1139.0, 1686.0, 2800.0, 4729.0, 7978.0, 14478.0, 25257.0, 46886.0, 85028.0, 145542.0, 210906.0, 200240.0, 130592.0, 74240.0, 41281.0, 22597.0, 12663.0, 6899.0, 4187.0, 2535.0, 1560.0, 975.0, 613.0, 457.0, 267.0, 209.0, 155.0, 111.0, 71.0, 68.0, 37.0, 21.0, 15.0, 18.0, 11.0, 13.0, 12.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.578125, -2.497283935546875, -2.41644287109375, -2.335601806640625, -2.2547607421875, -2.173919677734375, -2.09307861328125, -2.012237548828125, -1.931396484375, -1.850555419921875, -1.76971435546875, -1.688873291015625, -1.6080322265625, -1.527191162109375, -1.44635009765625, -1.365509033203125, -1.28466796875, -1.203826904296875, -1.12298583984375, -1.042144775390625, -0.9613037109375, -0.880462646484375, -0.79962158203125, -0.718780517578125, -0.637939453125, -0.557098388671875, -0.47625732421875, -0.395416259765625, -0.3145751953125, -0.233734130859375, -0.15289306640625, -0.072052001953125, 0.0087890625, 0.089630126953125, 0.17047119140625, 0.251312255859375, 0.3321533203125, 0.412994384765625, 0.49383544921875, 0.574676513671875, 0.655517578125, 0.736358642578125, 0.81719970703125, 0.898040771484375, 0.9788818359375, 1.059722900390625, 1.14056396484375, 1.221405029296875, 1.30224609375, 1.383087158203125, 1.46392822265625, 1.544769287109375, 1.6256103515625, 1.706451416015625, 1.78729248046875, 1.868133544921875, 1.948974609375, 2.029815673828125, 2.11065673828125, 2.191497802734375, 2.2723388671875, 2.353179931640625, 2.43402099609375, 2.514862060546875, 2.595703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 2.0, 7.0, 11.0, 9.0, 6.0, 13.0, 17.0, 21.0, 19.0, 21.0, 25.0, 42.0, 21.0, 30.0, 37.0, 45.0, 45.0, 45.0, 47.0, 45.0, 41.0, 45.0, 47.0, 32.0, 48.0, 34.0, 39.0, 25.0, 24.0, 21.0, 23.0, 17.0, 18.0, 13.0, 14.0, 12.0, 10.0, 4.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.232421875, -2.1678924560546875, -2.103363037109375, -2.0388336181640625, -1.97430419921875, -1.9097747802734375, -1.845245361328125, -1.7807159423828125, -1.7161865234375, -1.6516571044921875, -1.587127685546875, -1.5225982666015625, -1.45806884765625, -1.3935394287109375, -1.329010009765625, -1.2644805908203125, -1.199951171875, -1.1354217529296875, -1.070892333984375, -1.0063629150390625, -0.94183349609375, -0.8773040771484375, -0.812774658203125, -0.7482452392578125, -0.6837158203125, -0.6191864013671875, -0.554656982421875, -0.4901275634765625, -0.42559814453125, -0.3610687255859375, -0.296539306640625, -0.2320098876953125, -0.16748046875, -0.1029510498046875, -0.038421630859375, 0.0261077880859375, 0.09063720703125, 0.1551666259765625, 0.219696044921875, 0.2842254638671875, 0.3487548828125, 0.4132843017578125, 0.477813720703125, 0.5423431396484375, 0.60687255859375, 0.6714019775390625, 0.735931396484375, 0.8004608154296875, 0.864990234375, 0.9295196533203125, 0.994049072265625, 1.0585784912109375, 1.12310791015625, 1.1876373291015625, 1.252166748046875, 1.3166961669921875, 1.3812255859375, 1.4457550048828125, 1.510284423828125, 1.5748138427734375, 1.63934326171875, 1.7038726806640625, 1.768402099609375, 1.8329315185546875, 1.8974609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 3.0, 10.0, 11.0, 7.0, 18.0, 15.0, 27.0, 38.0, 47.0, 55.0, 75.0, 128.0, 201.0, 350.0, 797.0, 2016.0, 6853.0, 28108.0, 149737.0, 642678.0, 173016.0, 32681.0, 7544.0, 2268.0, 853.0, 378.0, 212.0, 122.0, 75.0, 64.0, 42.0, 39.0, 22.0, 16.0, 15.0, 12.0, 2.0, 4.0, 4.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.39288330078125, -7.1724853515625, -6.95208740234375, -6.731689453125, -6.51129150390625, -6.2908935546875, -6.07049560546875, -5.85009765625, -5.62969970703125, -5.4093017578125, -5.18890380859375, -4.968505859375, -4.74810791015625, -4.5277099609375, -4.30731201171875, -4.0869140625, -3.86651611328125, -3.6461181640625, -3.42572021484375, -3.205322265625, -2.98492431640625, -2.7645263671875, -2.54412841796875, -2.32373046875, -2.10333251953125, -1.8829345703125, -1.66253662109375, -1.442138671875, -1.22174072265625, -1.0013427734375, -0.78094482421875, -0.560546875, -0.34014892578125, -0.1197509765625, 0.10064697265625, 0.321044921875, 0.54144287109375, 0.7618408203125, 0.98223876953125, 1.20263671875, 1.42303466796875, 1.6434326171875, 1.86383056640625, 2.084228515625, 2.30462646484375, 2.5250244140625, 2.74542236328125, 2.9658203125, 3.18621826171875, 3.4066162109375, 3.62701416015625, 3.847412109375, 4.06781005859375, 4.2882080078125, 4.50860595703125, 4.72900390625, 4.94940185546875, 5.1697998046875, 5.39019775390625, 5.610595703125, 5.83099365234375, 6.0513916015625, 6.27178955078125, 6.4921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 8.0, 6.0, 7.0, 12.0, 9.0, 8.0, 17.0, 18.0, 23.0, 28.0, 18.0, 28.0, 39.0, 32.0, 41.0, 45.0, 40.0, 43.0, 46.0, 62.0, 50.0, 41.0, 46.0, 49.0, 39.0, 35.0, 36.0, 33.0, 14.0, 27.0, 17.0, 14.0, 12.0, 9.0, 13.0, 5.0, 6.0, 2.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.31939697265625, -6.0802001953125, -5.84100341796875, -5.601806640625, -5.36260986328125, -5.1234130859375, -4.88421630859375, -4.64501953125, -4.40582275390625, -4.1666259765625, -3.92742919921875, -3.688232421875, -3.44903564453125, -3.2098388671875, -2.97064208984375, -2.7314453125, -2.49224853515625, -2.2530517578125, -2.01385498046875, -1.774658203125, -1.53546142578125, -1.2962646484375, -1.05706787109375, -0.81787109375, -0.57867431640625, -0.3394775390625, -0.10028076171875, 0.138916015625, 0.37811279296875, 0.6173095703125, 0.85650634765625, 1.095703125, 1.33489990234375, 1.5740966796875, 1.81329345703125, 2.052490234375, 2.29168701171875, 2.5308837890625, 2.77008056640625, 3.00927734375, 3.24847412109375, 3.4876708984375, 3.72686767578125, 3.966064453125, 4.20526123046875, 4.4444580078125, 4.68365478515625, 4.9228515625, 5.16204833984375, 5.4012451171875, 5.64044189453125, 5.879638671875, 6.11883544921875, 6.3580322265625, 6.59722900390625, 6.83642578125, 7.07562255859375, 7.3148193359375, 7.55401611328125, 7.793212890625, 8.03240966796875, 8.2716064453125, 8.51080322265625, 8.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 9.0, 4.0, 17.0, 7.0, 21.0, 35.0, 41.0, 82.0, 150.0, 217.0, 490.0, 1176.0, 3156.0, 10361.0, 43110.0, 212763.0, 620685.0, 120487.0, 25110.0, 6671.0, 2265.0, 825.0, 390.0, 185.0, 87.0, 76.0, 34.0, 30.0, 16.0, 14.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.8433837890625, -1.780517578125, -1.7176513671875, -1.65478515625, -1.5919189453125, -1.529052734375, -1.4661865234375, -1.4033203125, -1.3404541015625, -1.277587890625, -1.2147216796875, -1.15185546875, -1.0889892578125, -1.026123046875, -0.9632568359375, -0.900390625, -0.8375244140625, -0.774658203125, -0.7117919921875, -0.64892578125, -0.5860595703125, -0.523193359375, -0.4603271484375, -0.3974609375, -0.3345947265625, -0.271728515625, -0.2088623046875, -0.14599609375, -0.0831298828125, -0.020263671875, 0.0426025390625, 0.10546875, 0.1683349609375, 0.231201171875, 0.2940673828125, 0.35693359375, 0.4197998046875, 0.482666015625, 0.5455322265625, 0.6083984375, 0.6712646484375, 0.734130859375, 0.7969970703125, 0.85986328125, 0.9227294921875, 0.985595703125, 1.0484619140625, 1.111328125, 1.1741943359375, 1.237060546875, 1.2999267578125, 1.36279296875, 1.4256591796875, 1.488525390625, 1.5513916015625, 1.6142578125, 1.6771240234375, 1.739990234375, 1.8028564453125, 1.86572265625, 1.9285888671875, 1.991455078125, 2.0543212890625, 2.1171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 7.0, 2.0, 11.0, 5.0, 12.0, 14.0, 29.0, 34.0, 53.0, 59.0, 64.0, 96.0, 95.0, 109.0, 91.0, 76.0, 63.0, 45.0, 41.0, 22.0, 19.0, 11.0, 9.0, 10.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005116462707519531, -0.0004921108484268188, -0.00047257542610168457, -0.0004530400037765503, -0.000433504581451416, -0.00041396915912628174, -0.00039443373680114746, -0.0003748983144760132, -0.0003553628921508789, -0.00033582746982574463, -0.00031629204750061035, -0.0002967566251754761, -0.0002772212028503418, -0.0002576857805252075, -0.00023815035820007324, -0.00021861493587493896, -0.0001990795135498047, -0.0001795440912246704, -0.00016000866889953613, -0.00014047324657440186, -0.00012093782424926758, -0.0001014024019241333, -8.186697959899902e-05, -6.233155727386475e-05, -4.279613494873047e-05, -2.326071262359619e-05, -3.725290298461914e-06, 1.5810132026672363e-05, 3.534555435180664e-05, 5.488097667694092e-05, 7.44163990020752e-05, 9.395182132720947e-05, 0.00011348724365234375, 0.00013302266597747803, 0.0001525580883026123, 0.00017209351062774658, 0.00019162893295288086, 0.00021116435527801514, 0.00023069977760314941, 0.0002502351999282837, 0.00026977062225341797, 0.00028930604457855225, 0.0003088414669036865, 0.0003283768892288208, 0.0003479123115539551, 0.00036744773387908936, 0.00038698315620422363, 0.0004065185785293579, 0.0004260540008544922, 0.00044558942317962646, 0.00046512484550476074, 0.000484660267829895, 0.0005041956901550293, 0.0005237311124801636, 0.0005432665348052979, 0.0005628019571304321, 0.0005823373794555664, 0.0006018728017807007, 0.000621408224105835, 0.0006409436464309692, 0.0006604790687561035, 0.0006800144910812378, 0.0006995499134063721, 0.0007190853357315063, 0.0007386207580566406]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 27.0, 32.0, 79.0, 165.0, 538.0, 2321.0, 23084.0, 724625.0, 284034.0, 11426.0, 1546.0, 418.0, 138.0, 55.0, 33.0, 11.0, 6.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.115234375, -2.979034423828125, -2.84283447265625, -2.706634521484375, -2.5704345703125, -2.434234619140625, -2.29803466796875, -2.161834716796875, -2.025634765625, -1.889434814453125, -1.75323486328125, -1.617034912109375, -1.4808349609375, -1.344635009765625, -1.20843505859375, -1.072235107421875, -0.93603515625, -0.799835205078125, -0.66363525390625, -0.527435302734375, -0.3912353515625, -0.255035400390625, -0.11883544921875, 0.017364501953125, 0.153564453125, 0.289764404296875, 0.42596435546875, 0.562164306640625, 0.6983642578125, 0.834564208984375, 0.97076416015625, 1.106964111328125, 1.2431640625, 1.379364013671875, 1.51556396484375, 1.651763916015625, 1.7879638671875, 1.924163818359375, 2.06036376953125, 2.196563720703125, 2.332763671875, 2.468963623046875, 2.60516357421875, 2.741363525390625, 2.8775634765625, 3.013763427734375, 3.14996337890625, 3.286163330078125, 3.42236328125, 3.558563232421875, 3.69476318359375, 3.830963134765625, 3.9671630859375, 4.103363037109375, 4.23956298828125, 4.375762939453125, 4.511962890625, 4.648162841796875, 4.78436279296875, 4.920562744140625, 5.0567626953125, 5.192962646484375, 5.32916259765625, 5.465362548828125, 5.6015625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 10.0, 21.0, 25.0, 22.0, 27.0, 46.0, 52.0, 59.0, 66.0, 75.0, 79.0, 106.0, 85.0, 74.0, 59.0, 41.0, 46.0, 23.0, 14.0, 17.0, 10.0, 10.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.904296875, -2.82525634765625, -2.7462158203125, -2.66717529296875, -2.588134765625, -2.50909423828125, -2.4300537109375, -2.35101318359375, -2.27197265625, -2.19293212890625, -2.1138916015625, -2.03485107421875, -1.955810546875, -1.87677001953125, -1.7977294921875, -1.71868896484375, -1.6396484375, -1.56060791015625, -1.4815673828125, -1.40252685546875, -1.323486328125, -1.24444580078125, -1.1654052734375, -1.08636474609375, -1.00732421875, -0.92828369140625, -0.8492431640625, -0.77020263671875, -0.691162109375, -0.61212158203125, -0.5330810546875, -0.45404052734375, -0.375, -0.29595947265625, -0.2169189453125, -0.13787841796875, -0.058837890625, 0.02020263671875, 0.0992431640625, 0.17828369140625, 0.25732421875, 0.33636474609375, 0.4154052734375, 0.49444580078125, 0.573486328125, 0.65252685546875, 0.7315673828125, 0.81060791015625, 0.8896484375, 0.96868896484375, 1.0477294921875, 1.12677001953125, 1.205810546875, 1.28485107421875, 1.3638916015625, 1.44293212890625, 1.52197265625, 1.60101318359375, 1.6800537109375, 1.75909423828125, 1.838134765625, 1.91717529296875, 1.9962158203125, 2.07525634765625, 2.154296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 13.0, 18.0, 52.0, 76.0, 191.0, 257.0, 125.0, 84.0, 65.0, 35.0, 28.0, 17.0, 9.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.088706970214844, -31.371530532836914, -29.654354095458984, -27.937175750732422, -26.219999313354492, -24.502822875976562, -22.78564453125, -21.06846809387207, -19.35129165649414, -17.63411521911621, -15.916937828063965, -14.199760437011719, -12.482583999633789, -10.76540756225586, -9.048230171203613, -7.331052780151367, -5.6138763427734375, -3.8966994285583496, -2.1795225143432617, -0.46234560012817383, 1.254831314086914, 2.9720077514648438, 4.68918514251709, 6.406362533569336, 8.123538970947266, 9.840715408325195, 11.557892799377441, 13.275070190429688, 14.992246627807617, 16.709423065185547, 18.42660140991211, 20.14377784729004, 21.86095428466797, 23.5781307220459, 25.295307159423828, 27.01248550415039, 28.72966194152832, 30.44683837890625, 32.16401672363281, 33.881195068359375, 35.59836959838867, 37.315547943115234, 39.03272247314453, 40.749900817871094, 42.467079162597656, 44.18425369262695, 45.901432037353516, 47.61860656738281, 49.335784912109375, 51.05296325683594, 52.770137786865234, 54.4873161315918, 56.204490661621094, 57.921669006347656, 59.63884735107422, 61.35602569580078, 63.07320022583008, 64.79037475585938, 66.50755310058594, 68.2247314453125, 69.94190979003906, 71.65908813476562, 73.37625885009766, 75.09343719482422, 76.81061553955078]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 1.0, 7.0, 9.0, 7.0, 17.0, 8.0, 17.0, 21.0, 20.0, 27.0, 11.0, 29.0, 27.0, 28.0, 24.0, 36.0, 55.0, 64.0, 69.0, 77.0, 62.0, 46.0, 40.0, 30.0, 30.0, 35.0, 28.0, 21.0, 31.0, 20.0, 12.0, 18.0, 12.0, 4.0, 10.0, 13.0, 3.0, 2.0, 3.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-33.36609649658203, -32.365840911865234, -31.36558723449707, -30.365333557128906, -29.36507797241211, -28.364822387695312, -27.36456871032715, -26.364315032958984, -25.364059448242188, -24.36380386352539, -23.363550186157227, -22.363296508789062, -21.363040924072266, -20.36278533935547, -19.362531661987305, -18.36227798461914, -17.362022399902344, -16.361766815185547, -15.361513137817383, -14.361258506774902, -13.361003875732422, -12.360749244689941, -11.360494613647461, -10.36023998260498, -9.3599853515625, -8.35973072052002, -7.359476089477539, -6.359221458435059, -5.358966827392578, -4.358712196350098, -3.358457565307617, -2.3582029342651367, -1.357950210571289, -0.3576955795288086, 0.6425590515136719, 1.6428136825561523, 2.643068313598633, 3.6433229446411133, 4.643577575683594, 5.643832206726074, 6.644086837768555, 7.644341468811035, 8.644596099853516, 9.644850730895996, 10.645105361938477, 11.645359992980957, 12.645614624023438, 13.645869255065918, 14.646123886108398, 15.646378517150879, 16.64663314819336, 17.646888732910156, 18.64714241027832, 19.647396087646484, 20.64765167236328, 21.647907257080078, 22.648160934448242, 23.648414611816406, 24.648670196533203, 25.64892578125, 26.649179458618164, 27.649433135986328, 28.649688720703125, 29.649944305419922, 30.650197982788086]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 6.0, 6.0, 13.0, 17.0, 14.0, 22.0, 36.0, 54.0, 105.0, 159.0, 211.0, 352.0, 583.0, 892.0, 1439.0, 2218.0, 3924.0, 7087.0, 14424.0, 32636.0, 87761.0, 255136.0, 723755.0, 1486221.0, 998094.0, 368632.0, 126250.0, 45366.0, 18497.0, 8629.0, 4642.0, 2674.0, 1583.0, 970.0, 657.0, 398.0, 277.0, 161.0, 135.0, 79.0, 61.0, 34.0, 21.0, 15.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.400390625, -1.3515472412109375, -1.302703857421875, -1.2538604736328125, -1.20501708984375, -1.1561737060546875, -1.107330322265625, -1.0584869384765625, -1.0096435546875, -0.9608001708984375, -0.911956787109375, -0.8631134033203125, -0.81427001953125, -0.7654266357421875, -0.716583251953125, -0.6677398681640625, -0.618896484375, -0.5700531005859375, -0.521209716796875, -0.4723663330078125, -0.42352294921875, -0.3746795654296875, -0.325836181640625, -0.2769927978515625, -0.2281494140625, -0.1793060302734375, -0.130462646484375, -0.0816192626953125, -0.03277587890625, 0.0160675048828125, 0.064910888671875, 0.1137542724609375, 0.16259765625, 0.2114410400390625, 0.260284423828125, 0.3091278076171875, 0.35797119140625, 0.4068145751953125, 0.455657958984375, 0.5045013427734375, 0.5533447265625, 0.6021881103515625, 0.651031494140625, 0.6998748779296875, 0.74871826171875, 0.7975616455078125, 0.846405029296875, 0.8952484130859375, 0.944091796875, 0.9929351806640625, 1.041778564453125, 1.0906219482421875, 1.13946533203125, 1.1883087158203125, 1.237152099609375, 1.2859954833984375, 1.3348388671875, 1.3836822509765625, 1.432525634765625, 1.4813690185546875, 1.53021240234375, 1.5790557861328125, 1.627899169921875, 1.6767425537109375, 1.7255859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 7.0, 8.0, 9.0, 19.0, 19.0, 15.0, 15.0, 38.0, 27.0, 27.0, 29.0, 36.0, 36.0, 39.0, 46.0, 40.0, 50.0, 55.0, 52.0, 45.0, 42.0, 39.0, 37.0, 36.0, 26.0, 24.0, 27.0, 22.0, 16.0, 23.0, 16.0, 16.0, 5.0, 6.0, 13.0, 4.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09765625, -2.0348358154296875, -1.972015380859375, -1.9091949462890625, -1.84637451171875, -1.7835540771484375, -1.720733642578125, -1.6579132080078125, -1.5950927734375, -1.5322723388671875, -1.469451904296875, -1.4066314697265625, -1.34381103515625, -1.2809906005859375, -1.218170166015625, -1.1553497314453125, -1.092529296875, -1.0297088623046875, -0.966888427734375, -0.9040679931640625, -0.84124755859375, -0.7784271240234375, -0.715606689453125, -0.6527862548828125, -0.5899658203125, -0.5271453857421875, -0.464324951171875, -0.4015045166015625, -0.33868408203125, -0.2758636474609375, -0.213043212890625, -0.1502227783203125, -0.08740234375, -0.0245819091796875, 0.038238525390625, 0.1010589599609375, 0.16387939453125, 0.2266998291015625, 0.289520263671875, 0.3523406982421875, 0.4151611328125, 0.4779815673828125, 0.540802001953125, 0.6036224365234375, 0.66644287109375, 0.7292633056640625, 0.792083740234375, 0.8549041748046875, 0.917724609375, 0.9805450439453125, 1.043365478515625, 1.1061859130859375, 1.16900634765625, 1.2318267822265625, 1.294647216796875, 1.3574676513671875, 1.4202880859375, 1.4831085205078125, 1.545928955078125, 1.6087493896484375, 1.67156982421875, 1.7343902587890625, 1.797210693359375, 1.8600311279296875, 1.9228515625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 12.0, 13.0, 25.0, 39.0, 71.0, 137.0, 278.0, 744.0, 2964.0, 38451.0, 3945973.0, 197471.0, 6354.0, 1033.0, 356.0, 171.0, 88.0, 44.0, 11.0, 16.0, 11.0, 6.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.4886474609375, -12.117919921875, -11.7471923828125, -11.37646484375, -11.0057373046875, -10.635009765625, -10.2642822265625, -9.8935546875, -9.5228271484375, -9.152099609375, -8.7813720703125, -8.41064453125, -8.0399169921875, -7.669189453125, -7.2984619140625, -6.927734375, -6.5570068359375, -6.186279296875, -5.8155517578125, -5.44482421875, -5.0740966796875, -4.703369140625, -4.3326416015625, -3.9619140625, -3.5911865234375, -3.220458984375, -2.8497314453125, -2.47900390625, -2.1082763671875, -1.737548828125, -1.3668212890625, -0.99609375, -0.6253662109375, -0.254638671875, 0.1160888671875, 0.48681640625, 0.8575439453125, 1.228271484375, 1.5989990234375, 1.9697265625, 2.3404541015625, 2.711181640625, 3.0819091796875, 3.45263671875, 3.8233642578125, 4.194091796875, 4.5648193359375, 4.935546875, 5.3062744140625, 5.677001953125, 6.0477294921875, 6.41845703125, 6.7891845703125, 7.159912109375, 7.5306396484375, 7.9013671875, 8.2720947265625, 8.642822265625, 9.0135498046875, 9.38427734375, 9.7550048828125, 10.125732421875, 10.4964599609375, 10.8671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 10.0, 13.0, 21.0, 35.0, 52.0, 114.0, 194.0, 414.0, 895.0, 1156.0, 590.0, 283.0, 119.0, 63.0, 43.0, 26.0, 12.0, 7.0, 14.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.90625, -10.647705078125, -10.38916015625, -10.130615234375, -9.8720703125, -9.613525390625, -9.35498046875, -9.096435546875, -8.837890625, -8.579345703125, -8.32080078125, -8.062255859375, -7.8037109375, -7.545166015625, -7.28662109375, -7.028076171875, -6.76953125, -6.510986328125, -6.25244140625, -5.993896484375, -5.7353515625, -5.476806640625, -5.21826171875, -4.959716796875, -4.701171875, -4.442626953125, -4.18408203125, -3.925537109375, -3.6669921875, -3.408447265625, -3.14990234375, -2.891357421875, -2.6328125, -2.374267578125, -2.11572265625, -1.857177734375, -1.5986328125, -1.340087890625, -1.08154296875, -0.822998046875, -0.564453125, -0.305908203125, -0.04736328125, 0.211181640625, 0.4697265625, 0.728271484375, 0.98681640625, 1.245361328125, 1.50390625, 1.762451171875, 2.02099609375, 2.279541015625, 2.5380859375, 2.796630859375, 3.05517578125, 3.313720703125, 3.572265625, 3.830810546875, 4.08935546875, 4.347900390625, 4.6064453125, 4.864990234375, 5.12353515625, 5.382080078125, 5.640625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 11.0, 33.0, 91.0, 164.0, 274.0, 226.0, 108.0, 47.0, 14.0, 10.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-105.82020568847656, -103.69187927246094, -101.56355285644531, -99.43522644042969, -97.30690002441406, -95.17857360839844, -93.05024719238281, -90.92192840576172, -88.7936019897461, -86.66527557373047, -84.53694915771484, -82.40862274169922, -80.2802963256836, -78.1519775390625, -76.02365112304688, -73.89532470703125, -71.76699829101562, -69.638671875, -67.51034545898438, -65.38201904296875, -63.25369644165039, -61.125370025634766, -58.99704360961914, -56.868717193603516, -54.740386962890625, -52.612060546875, -50.483734130859375, -48.35540771484375, -46.22708511352539, -44.098758697509766, -41.97043228149414, -39.842105865478516, -37.71377944946289, -35.585453033447266, -33.45712661743164, -31.32880210876465, -29.200477600097656, -27.07215118408203, -24.943824768066406, -22.81549835205078, -20.68717384338379, -18.558847427368164, -16.430522918701172, -14.302196502685547, -12.173871040344238, -10.04554557800293, -7.917219161987305, -5.788893699645996, -3.6605682373046875, -1.5322425365447998, 0.5960831642150879, 2.7244091033935547, 4.852734565734863, 6.981060028076172, 9.109386444091797, 11.237711906433105, 13.366037368774414, 15.494362831115723, 17.62268829345703, 19.751014709472656, 21.87934112548828, 24.007665634155273, 26.1359920501709, 28.26431655883789, 30.392642974853516]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 7.0, 7.0, 13.0, 16.0, 12.0, 23.0, 26.0, 22.0, 27.0, 21.0, 44.0, 28.0, 50.0, 46.0, 45.0, 51.0, 61.0, 51.0, 46.0, 45.0, 47.0, 42.0, 34.0, 35.0, 29.0, 27.0, 20.0, 25.0, 10.0, 13.0, 8.0, 7.0, 11.0, 9.0, 9.0, 6.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.260395050048828, -24.523662567138672, -23.786930084228516, -23.05019760131836, -22.313465118408203, -21.576732635498047, -20.84000015258789, -20.103267669677734, -19.366535186767578, -18.629802703857422, -17.893070220947266, -17.15633773803711, -16.419605255126953, -15.682872772216797, -14.946139335632324, -14.209406852722168, -13.472673416137695, -12.735940933227539, -11.999208450317383, -11.262475967407227, -10.52574348449707, -9.789011001586914, -9.052277565002441, -8.315545082092285, -7.578812599182129, -6.842080116271973, -6.105347633361816, -5.368614673614502, -4.631882190704346, -3.8951497077941895, -3.158416748046875, -2.4216842651367188, -1.6849517822265625, -0.9482191801071167, -0.2114865779876709, 0.5252461433410645, 1.2619786262512207, 1.998711109161377, 2.7354440689086914, 3.4721765518188477, 4.208909034729004, 4.94564151763916, 5.682374000549316, 6.419106960296631, 7.155839443206787, 7.892571926116943, 8.629304885864258, 9.366037368774414, 10.10276985168457, 10.839502334594727, 11.576234817504883, 12.312967300415039, 13.049699783325195, 13.786432266235352, 14.523165702819824, 15.25989818572998, 15.996630668640137, 16.73336410522461, 17.470096588134766, 18.206829071044922, 18.943561553955078, 19.680294036865234, 20.41702651977539, 21.153759002685547, 21.890491485595703]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 0.0, 2.0, 5.0, 2.0, 10.0, 10.0, 5.0, 31.0, 30.0, 35.0, 40.0, 78.0, 105.0, 180.0, 261.0, 401.0, 633.0, 1008.0, 1650.0, 2936.0, 5005.0, 9037.0, 16491.0, 30895.0, 57524.0, 107641.0, 186691.0, 238431.0, 174253.0, 98800.0, 53375.0, 28063.0, 15171.0, 8185.0, 4666.0, 2691.0, 1564.0, 948.0, 609.0, 347.0, 272.0, 137.0, 94.0, 73.0, 47.0, 41.0, 31.0, 21.0, 18.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.291015625, -2.215728759765625, -2.14044189453125, -2.065155029296875, -1.9898681640625, -1.914581298828125, -1.83929443359375, -1.764007568359375, -1.688720703125, -1.613433837890625, -1.53814697265625, -1.462860107421875, -1.3875732421875, -1.312286376953125, -1.23699951171875, -1.161712646484375, -1.08642578125, -1.011138916015625, -0.93585205078125, -0.860565185546875, -0.7852783203125, -0.709991455078125, -0.63470458984375, -0.559417724609375, -0.484130859375, -0.408843994140625, -0.33355712890625, -0.258270263671875, -0.1829833984375, -0.107696533203125, -0.03240966796875, 0.042877197265625, 0.1181640625, 0.193450927734375, 0.26873779296875, 0.344024658203125, 0.4193115234375, 0.494598388671875, 0.56988525390625, 0.645172119140625, 0.720458984375, 0.795745849609375, 0.87103271484375, 0.946319580078125, 1.0216064453125, 1.096893310546875, 1.17218017578125, 1.247467041015625, 1.32275390625, 1.398040771484375, 1.47332763671875, 1.548614501953125, 1.6239013671875, 1.699188232421875, 1.77447509765625, 1.849761962890625, 1.925048828125, 2.000335693359375, 2.07562255859375, 2.150909423828125, 2.2261962890625, 2.301483154296875, 2.37677001953125, 2.452056884765625, 2.52734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 5.0, 13.0, 9.0, 9.0, 11.0, 13.0, 26.0, 28.0, 31.0, 29.0, 40.0, 40.0, 39.0, 44.0, 47.0, 42.0, 63.0, 50.0, 66.0, 32.0, 37.0, 41.0, 37.0, 40.0, 27.0, 21.0, 25.0, 25.0, 24.0, 11.0, 8.0, 11.0, 12.0, 14.0, 6.0, 3.0, 0.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.9774169921875, -1.904052734375, -1.8306884765625, -1.75732421875, -1.6839599609375, -1.610595703125, -1.5372314453125, -1.4638671875, -1.3905029296875, -1.317138671875, -1.2437744140625, -1.17041015625, -1.0970458984375, -1.023681640625, -0.9503173828125, -0.876953125, -0.8035888671875, -0.730224609375, -0.6568603515625, -0.58349609375, -0.5101318359375, -0.436767578125, -0.3634033203125, -0.2900390625, -0.2166748046875, -0.143310546875, -0.0699462890625, 0.00341796875, 0.0767822265625, 0.150146484375, 0.2235107421875, 0.296875, 0.3702392578125, 0.443603515625, 0.5169677734375, 0.59033203125, 0.6636962890625, 0.737060546875, 0.8104248046875, 0.8837890625, 0.9571533203125, 1.030517578125, 1.1038818359375, 1.17724609375, 1.2506103515625, 1.323974609375, 1.3973388671875, 1.470703125, 1.5440673828125, 1.617431640625, 1.6907958984375, 1.76416015625, 1.8375244140625, 1.910888671875, 1.9842529296875, 2.0576171875, 2.1309814453125, 2.204345703125, 2.2777099609375, 2.35107421875, 2.4244384765625, 2.497802734375, 2.5711669921875, 2.64453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 4.0, 3.0, 12.0, 6.0, 17.0, 29.0, 22.0, 35.0, 48.0, 93.0, 128.0, 188.0, 334.0, 587.0, 1234.0, 3215.0, 13355.0, 81597.0, 715306.0, 196937.0, 26178.0, 5686.0, 1699.0, 793.0, 390.0, 237.0, 136.0, 99.0, 61.0, 41.0, 21.0, 26.0, 12.0, 11.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.5859375, -7.33056640625, -7.0751953125, -6.81982421875, -6.564453125, -6.30908203125, -6.0537109375, -5.79833984375, -5.54296875, -5.28759765625, -5.0322265625, -4.77685546875, -4.521484375, -4.26611328125, -4.0107421875, -3.75537109375, -3.5, -3.24462890625, -2.9892578125, -2.73388671875, -2.478515625, -2.22314453125, -1.9677734375, -1.71240234375, -1.45703125, -1.20166015625, -0.9462890625, -0.69091796875, -0.435546875, -0.18017578125, 0.0751953125, 0.33056640625, 0.5859375, 0.84130859375, 1.0966796875, 1.35205078125, 1.607421875, 1.86279296875, 2.1181640625, 2.37353515625, 2.62890625, 2.88427734375, 3.1396484375, 3.39501953125, 3.650390625, 3.90576171875, 4.1611328125, 4.41650390625, 4.671875, 4.92724609375, 5.1826171875, 5.43798828125, 5.693359375, 5.94873046875, 6.2041015625, 6.45947265625, 6.71484375, 6.97021484375, 7.2255859375, 7.48095703125, 7.736328125, 7.99169921875, 8.2470703125, 8.50244140625, 8.7578125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 3.0, 9.0, 11.0, 6.0, 12.0, 19.0, 19.0, 32.0, 26.0, 42.0, 51.0, 61.0, 67.0, 69.0, 74.0, 76.0, 81.0, 66.0, 59.0, 54.0, 43.0, 34.0, 22.0, 16.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.289306640625, -8.89892578125, -8.508544921875, -8.1181640625, -7.727783203125, -7.33740234375, -6.947021484375, -6.556640625, -6.166259765625, -5.77587890625, -5.385498046875, -4.9951171875, -4.604736328125, -4.21435546875, -3.823974609375, -3.43359375, -3.043212890625, -2.65283203125, -2.262451171875, -1.8720703125, -1.481689453125, -1.09130859375, -0.700927734375, -0.310546875, 0.079833984375, 0.47021484375, 0.860595703125, 1.2509765625, 1.641357421875, 2.03173828125, 2.422119140625, 2.8125, 3.202880859375, 3.59326171875, 3.983642578125, 4.3740234375, 4.764404296875, 5.15478515625, 5.545166015625, 5.935546875, 6.325927734375, 6.71630859375, 7.106689453125, 7.4970703125, 7.887451171875, 8.27783203125, 8.668212890625, 9.05859375, 9.448974609375, 9.83935546875, 10.229736328125, 10.6201171875, 11.010498046875, 11.40087890625, 11.791259765625, 12.181640625, 12.572021484375, 12.96240234375, 13.352783203125, 13.7431640625, 14.133544921875, 14.52392578125, 14.914306640625, 15.3046875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 6.0, 13.0, 16.0, 24.0, 19.0, 41.0, 60.0, 122.0, 146.0, 244.0, 529.0, 1066.0, 2779.0, 8905.0, 35475.0, 191872.0, 684457.0, 93709.0, 19900.0, 5542.0, 1897.0, 771.0, 372.0, 195.0, 133.0, 84.0, 49.0, 31.0, 28.0, 16.0, 11.0, 8.0, 12.0, 3.0, 7.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6322784423828125, -1.570220947265625, -1.5081634521484375, -1.44610595703125, -1.3840484619140625, -1.321990966796875, -1.2599334716796875, -1.1978759765625, -1.1358184814453125, -1.073760986328125, -1.0117034912109375, -0.94964599609375, -0.8875885009765625, -0.825531005859375, -0.7634735107421875, -0.701416015625, -0.6393585205078125, -0.577301025390625, -0.5152435302734375, -0.45318603515625, -0.3911285400390625, -0.329071044921875, -0.2670135498046875, -0.2049560546875, -0.1428985595703125, -0.080841064453125, -0.0187835693359375, 0.04327392578125, 0.1053314208984375, 0.167388916015625, 0.2294464111328125, 0.29150390625, 0.3535614013671875, 0.415618896484375, 0.4776763916015625, 0.53973388671875, 0.6017913818359375, 0.663848876953125, 0.7259063720703125, 0.7879638671875, 0.8500213623046875, 0.912078857421875, 0.9741363525390625, 1.03619384765625, 1.0982513427734375, 1.160308837890625, 1.2223663330078125, 1.284423828125, 1.3464813232421875, 1.408538818359375, 1.4705963134765625, 1.53265380859375, 1.5947113037109375, 1.656768798828125, 1.7188262939453125, 1.7808837890625, 1.8429412841796875, 1.904998779296875, 1.9670562744140625, 2.02911376953125, 2.0911712646484375, 2.153228759765625, 2.2152862548828125, 2.27734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 11.0, 13.0, 14.0, 22.0, 25.0, 22.0, 31.0, 45.0, 58.0, 67.0, 97.0, 100.0, 98.0, 78.0, 60.0, 51.0, 34.0, 42.0, 25.0, 25.0, 14.0, 13.0, 12.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004782676696777344, -0.0004617348313331604, -0.0004452019929885864, -0.00042866915464401245, -0.0004121363162994385, -0.0003956034779548645, -0.00037907063961029053, -0.00036253780126571655, -0.0003460049629211426, -0.0003294721245765686, -0.00031293928623199463, -0.00029640644788742065, -0.0002798736095428467, -0.0002633407711982727, -0.00024680793285369873, -0.00023027509450912476, -0.00021374225616455078, -0.0001972094178199768, -0.00018067657947540283, -0.00016414374113082886, -0.00014761090278625488, -0.0001310780644416809, -0.00011454522609710693, -9.801238775253296e-05, -8.147954940795898e-05, -6.494671106338501e-05, -4.8413872718811035e-05, -3.188103437423706e-05, -1.5348196029663086e-05, 1.1846423149108887e-06, 1.7717480659484863e-05, 3.425031900405884e-05, 5.078315734863281e-05, 6.731599569320679e-05, 8.384883403778076e-05, 0.00010038167238235474, 0.00011691451072692871, 0.00013344734907150269, 0.00014998018741607666, 0.00016651302576065063, 0.0001830458641052246, 0.00019957870244979858, 0.00021611154079437256, 0.00023264437913894653, 0.0002491772174835205, 0.0002657100558280945, 0.00028224289417266846, 0.00029877573251724243, 0.0003153085708618164, 0.0003318414092063904, 0.00034837424755096436, 0.00036490708589553833, 0.0003814399242401123, 0.0003979727625846863, 0.00041450560092926025, 0.00043103843927383423, 0.0004475712776184082, 0.0004641041159629822, 0.00048063695430755615, 0.0004971697926521301, 0.0005137026309967041, 0.0005302354693412781, 0.000546768307685852, 0.000563301146030426, 0.000579833984375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 15.0, 19.0, 32.0, 48.0, 81.0, 188.0, 354.0, 949.0, 2969.0, 16741.0, 222503.0, 757207.0, 39847.0, 5224.0, 1358.0, 484.0, 252.0, 109.0, 73.0, 37.0, 19.0, 17.0, 5.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.59375, -2.49835205078125, -2.4029541015625, -2.30755615234375, -2.212158203125, -2.11676025390625, -2.0213623046875, -1.92596435546875, -1.83056640625, -1.73516845703125, -1.6397705078125, -1.54437255859375, -1.448974609375, -1.35357666015625, -1.2581787109375, -1.16278076171875, -1.0673828125, -0.97198486328125, -0.8765869140625, -0.78118896484375, -0.685791015625, -0.59039306640625, -0.4949951171875, -0.39959716796875, -0.30419921875, -0.20880126953125, -0.1134033203125, -0.01800537109375, 0.077392578125, 0.17279052734375, 0.2681884765625, 0.36358642578125, 0.458984375, 0.55438232421875, 0.6497802734375, 0.74517822265625, 0.840576171875, 0.93597412109375, 1.0313720703125, 1.12677001953125, 1.22216796875, 1.31756591796875, 1.4129638671875, 1.50836181640625, 1.603759765625, 1.69915771484375, 1.7945556640625, 1.88995361328125, 1.9853515625, 2.08074951171875, 2.1761474609375, 2.27154541015625, 2.366943359375, 2.46234130859375, 2.5577392578125, 2.65313720703125, 2.74853515625, 2.84393310546875, 2.9393310546875, 3.03472900390625, 3.130126953125, 3.22552490234375, 3.3209228515625, 3.41632080078125, 3.51171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 4.0, 4.0, 11.0, 12.0, 21.0, 12.0, 32.0, 33.0, 32.0, 49.0, 50.0, 53.0, 63.0, 80.0, 80.0, 71.0, 69.0, 58.0, 50.0, 42.0, 39.0, 22.0, 16.0, 25.0, 20.0, 9.0, 10.0, 2.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3671875, -1.312896728515625, -1.25860595703125, -1.204315185546875, -1.1500244140625, -1.095733642578125, -1.04144287109375, -0.987152099609375, -0.932861328125, -0.878570556640625, -0.82427978515625, -0.769989013671875, -0.7156982421875, -0.661407470703125, -0.60711669921875, -0.552825927734375, -0.49853515625, -0.444244384765625, -0.38995361328125, -0.335662841796875, -0.2813720703125, -0.227081298828125, -0.17279052734375, -0.118499755859375, -0.064208984375, -0.009918212890625, 0.04437255859375, 0.098663330078125, 0.1529541015625, 0.207244873046875, 0.26153564453125, 0.315826416015625, 0.3701171875, 0.424407958984375, 0.47869873046875, 0.532989501953125, 0.5872802734375, 0.641571044921875, 0.69586181640625, 0.750152587890625, 0.804443359375, 0.858734130859375, 0.91302490234375, 0.967315673828125, 1.0216064453125, 1.075897216796875, 1.13018798828125, 1.184478759765625, 1.23876953125, 1.293060302734375, 1.34735107421875, 1.401641845703125, 1.4559326171875, 1.510223388671875, 1.56451416015625, 1.618804931640625, 1.673095703125, 1.727386474609375, 1.78167724609375, 1.835968017578125, 1.8902587890625, 1.944549560546875, 1.99884033203125, 2.053131103515625, 2.107421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 30.0, 56.0, 100.0, 335.0, 271.0, 105.0, 46.0, 22.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.48383331298828, -105.14241027832031, -102.80098724365234, -100.45956420898438, -98.11813354492188, -95.7767105102539, -93.43528747558594, -91.09386444091797, -88.75244140625, -86.41101837158203, -84.06959533691406, -81.7281723022461, -79.38674926757812, -77.04531860351562, -74.70389556884766, -72.36247253417969, -70.02104949951172, -67.67962646484375, -65.33820343017578, -62.99677658081055, -60.65535354614258, -58.31393051147461, -55.972503662109375, -53.631080627441406, -51.28965759277344, -48.94823455810547, -46.6068115234375, -44.265384674072266, -41.9239616394043, -39.58253860473633, -37.241111755371094, -34.899688720703125, -32.55826187133789, -30.216838836669922, -27.87541389465332, -25.53398895263672, -23.19256591796875, -20.85114288330078, -18.50971794128418, -16.168292999267578, -13.82686996459961, -11.485445976257324, -9.144021987915039, -6.802597999572754, -4.461174011230469, -2.1197500228881836, 0.22167396545410156, 2.563098907470703, 4.904521942138672, 7.245945930480957, 9.587369918823242, 11.928793907165527, 14.270217895507812, 16.61164093017578, 18.953065872192383, 21.294490814208984, 23.635913848876953, 25.977336883544922, 28.318761825561523, 30.660186767578125, 33.001609802246094, 35.34303283691406, 37.68445587158203, 40.025882720947266, 42.367305755615234]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 7.0, 8.0, 6.0, 13.0, 15.0, 16.0, 15.0, 14.0, 23.0, 15.0, 22.0, 29.0, 27.0, 24.0, 38.0, 44.0, 75.0, 105.0, 107.0, 71.0, 40.0, 38.0, 28.0, 27.0, 20.0, 32.0, 17.0, 16.0, 14.0, 12.0, 9.0, 12.0, 10.0, 11.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.56679153442383, -34.57630920410156, -33.5858268737793, -32.59534454345703, -31.6048641204834, -30.614381790161133, -29.623899459838867, -28.6334171295166, -27.64293670654297, -26.652454376220703, -25.661972045898438, -24.671489715576172, -23.68100929260254, -22.690526962280273, -21.700044631958008, -20.709562301635742, -19.719079971313477, -18.72859764099121, -17.738115310668945, -16.747634887695312, -15.757152557373047, -14.766670227050781, -13.776187896728516, -12.78570556640625, -11.7952241897583, -10.804741859436035, -9.814260482788086, -8.82377815246582, -7.833296298980713, -6.8428144454956055, -5.85233211517334, -4.861850261688232, -3.871370315551758, -2.8808884620666504, -1.8904063701629639, -0.8999242782592773, 0.09055757522583008, 1.0810394287109375, 2.071521759033203, 3.0620036125183105, 4.052485466003418, 5.042967319488525, 6.033449172973633, 7.023931503295898, 8.014413833618164, 9.004895210266113, 9.995377540588379, 10.985858917236328, 11.976341247558594, 12.96682357788086, 13.957304954528809, 14.947787284851074, 15.938268661499023, 16.92875099182129, 17.919233322143555, 18.90971565246582, 19.900196075439453, 20.89067840576172, 21.881160736083984, 22.87164306640625, 23.862123489379883, 24.85260581970215, 25.843088150024414, 26.83357048034668, 27.824052810668945]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 10.0, 14.0, 17.0, 40.0, 58.0, 66.0, 100.0, 145.0, 249.0, 355.0, 550.0, 961.0, 1494.0, 2749.0, 5144.0, 10267.0, 23960.0, 64243.0, 184456.0, 534736.0, 1335466.0, 1271856.0, 492662.0, 164750.0, 57465.0, 21669.0, 9465.0, 4701.0, 2539.0, 1511.0, 910.0, 522.0, 361.0, 247.0, 165.0, 113.0, 82.0, 60.0, 30.0, 22.0, 19.0, 13.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.9169921875, -1.862152099609375, -1.80731201171875, -1.752471923828125, -1.6976318359375, -1.642791748046875, -1.58795166015625, -1.533111572265625, -1.478271484375, -1.423431396484375, -1.36859130859375, -1.313751220703125, -1.2589111328125, -1.204071044921875, -1.14923095703125, -1.094390869140625, -1.03955078125, -0.984710693359375, -0.92987060546875, -0.875030517578125, -0.8201904296875, -0.765350341796875, -0.71051025390625, -0.655670166015625, -0.600830078125, -0.545989990234375, -0.49114990234375, -0.436309814453125, -0.3814697265625, -0.326629638671875, -0.27178955078125, -0.216949462890625, -0.162109375, -0.107269287109375, -0.05242919921875, 0.002410888671875, 0.0572509765625, 0.112091064453125, 0.16693115234375, 0.221771240234375, 0.276611328125, 0.331451416015625, 0.38629150390625, 0.441131591796875, 0.4959716796875, 0.550811767578125, 0.60565185546875, 0.660491943359375, 0.71533203125, 0.770172119140625, 0.82501220703125, 0.879852294921875, 0.9346923828125, 0.989532470703125, 1.04437255859375, 1.099212646484375, 1.154052734375, 1.208892822265625, 1.26373291015625, 1.318572998046875, 1.3734130859375, 1.428253173828125, 1.48309326171875, 1.537933349609375, 1.5927734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 12.0, 3.0, 9.0, 6.0, 5.0, 5.0, 12.0, 10.0, 11.0, 16.0, 22.0, 29.0, 32.0, 30.0, 30.0, 31.0, 34.0, 52.0, 27.0, 41.0, 38.0, 49.0, 52.0, 48.0, 39.0, 35.0, 38.0, 38.0, 32.0, 21.0, 24.0, 28.0, 17.0, 13.0, 26.0, 14.0, 10.0, 10.0, 6.0, 8.0, 10.0, 6.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.90625, -1.8443603515625, -1.782470703125, -1.7205810546875, -1.65869140625, -1.5968017578125, -1.534912109375, -1.4730224609375, -1.4111328125, -1.3492431640625, -1.287353515625, -1.2254638671875, -1.16357421875, -1.1016845703125, -1.039794921875, -0.9779052734375, -0.916015625, -0.8541259765625, -0.792236328125, -0.7303466796875, -0.66845703125, -0.6065673828125, -0.544677734375, -0.4827880859375, -0.4208984375, -0.3590087890625, -0.297119140625, -0.2352294921875, -0.17333984375, -0.1114501953125, -0.049560546875, 0.0123291015625, 0.07421875, 0.1361083984375, 0.197998046875, 0.2598876953125, 0.32177734375, 0.3836669921875, 0.445556640625, 0.5074462890625, 0.5693359375, 0.6312255859375, 0.693115234375, 0.7550048828125, 0.81689453125, 0.8787841796875, 0.940673828125, 1.0025634765625, 1.064453125, 1.1263427734375, 1.188232421875, 1.2501220703125, 1.31201171875, 1.3739013671875, 1.435791015625, 1.4976806640625, 1.5595703125, 1.6214599609375, 1.683349609375, 1.7452392578125, 1.80712890625, 1.8690185546875, 1.930908203125, 1.9927978515625, 2.0546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 5.0, 7.0, 5.0, 13.0, 6.0, 14.0, 16.0, 27.0, 28.0, 34.0, 53.0, 102.0, 177.0, 363.0, 780.0, 2226.0, 8068.0, 51037.0, 1637005.0, 2417760.0, 63835.0, 8916.0, 2174.0, 789.0, 335.0, 178.0, 87.0, 57.0, 45.0, 35.0, 27.0, 19.0, 14.0, 6.0, 6.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.43359375, -6.22637939453125, -6.0191650390625, -5.81195068359375, -5.604736328125, -5.39752197265625, -5.1903076171875, -4.98309326171875, -4.77587890625, -4.56866455078125, -4.3614501953125, -4.15423583984375, -3.947021484375, -3.73980712890625, -3.5325927734375, -3.32537841796875, -3.1181640625, -2.91094970703125, -2.7037353515625, -2.49652099609375, -2.289306640625, -2.08209228515625, -1.8748779296875, -1.66766357421875, -1.46044921875, -1.25323486328125, -1.0460205078125, -0.83880615234375, -0.631591796875, -0.42437744140625, -0.2171630859375, -0.00994873046875, 0.197265625, 0.40447998046875, 0.6116943359375, 0.81890869140625, 1.026123046875, 1.23333740234375, 1.4405517578125, 1.64776611328125, 1.85498046875, 2.06219482421875, 2.2694091796875, 2.47662353515625, 2.683837890625, 2.89105224609375, 3.0982666015625, 3.30548095703125, 3.5126953125, 3.71990966796875, 3.9271240234375, 4.13433837890625, 4.341552734375, 4.54876708984375, 4.7559814453125, 4.96319580078125, 5.17041015625, 5.37762451171875, 5.5848388671875, 5.79205322265625, 5.999267578125, 6.20648193359375, 6.4136962890625, 6.62091064453125, 6.828125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 3.0, 5.0, 4.0, 9.0, 13.0, 11.0, 14.0, 31.0, 52.0, 45.0, 61.0, 103.0, 157.0, 258.0, 384.0, 606.0, 688.0, 559.0, 400.0, 217.0, 156.0, 84.0, 64.0, 38.0, 30.0, 21.0, 16.0, 11.0, 8.0, 5.0, 5.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.07110595703125, -5.9039306640625, -5.73675537109375, -5.569580078125, -5.40240478515625, -5.2352294921875, -5.06805419921875, -4.90087890625, -4.73370361328125, -4.5665283203125, -4.39935302734375, -4.232177734375, -4.06500244140625, -3.8978271484375, -3.73065185546875, -3.5634765625, -3.39630126953125, -3.2291259765625, -3.06195068359375, -2.894775390625, -2.72760009765625, -2.5604248046875, -2.39324951171875, -2.22607421875, -2.05889892578125, -1.8917236328125, -1.72454833984375, -1.557373046875, -1.39019775390625, -1.2230224609375, -1.05584716796875, -0.888671875, -0.72149658203125, -0.5543212890625, -0.38714599609375, -0.219970703125, -0.05279541015625, 0.1143798828125, 0.28155517578125, 0.44873046875, 0.61590576171875, 0.7830810546875, 0.95025634765625, 1.117431640625, 1.28460693359375, 1.4517822265625, 1.61895751953125, 1.7861328125, 1.95330810546875, 2.1204833984375, 2.28765869140625, 2.454833984375, 2.62200927734375, 2.7891845703125, 2.95635986328125, 3.12353515625, 3.29071044921875, 3.4578857421875, 3.62506103515625, 3.792236328125, 3.95941162109375, 4.1265869140625, 4.29376220703125, 4.4609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 24.0, 61.0, 157.0, 298.0, 271.0, 111.0, 36.0, 15.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.35106658935547, -116.86079406738281, -114.37052917480469, -111.88025665283203, -109.3899917602539, -106.89971923828125, -104.40945434570312, -101.91918182373047, -99.42890930175781, -96.93863677978516, -94.44837188720703, -91.95809936523438, -89.46783447265625, -86.9775619506836, -84.48729705810547, -81.99702453613281, -79.50675964355469, -77.01648712158203, -74.5262222290039, -72.03594970703125, -69.54568481445312, -67.05541229248047, -64.56514739990234, -62.07487487792969, -59.5846061706543, -57.094337463378906, -54.604068756103516, -52.113800048828125, -49.62352752685547, -47.133262634277344, -44.64299011230469, -42.1527214050293, -39.662452697753906, -37.172183990478516, -34.681915283203125, -32.191646575927734, -29.70137596130371, -27.21110725402832, -24.720836639404297, -22.230567932128906, -19.740299224853516, -17.250030517578125, -14.759760856628418, -12.269491195678711, -9.77922248840332, -7.28895378112793, -4.798684120178223, -2.3084144592285156, 0.181854248046875, 2.672123432159424, 5.162392616271973, 7.6526618003845215, 10.14293098449707, 12.633199691772461, 15.123469352722168, 17.613739013671875, 20.104007720947266, 22.594276428222656, 25.084545135498047, 27.57481575012207, 30.06508445739746, 32.55535125732422, 35.045623779296875, 37.535892486572266, 40.026161193847656]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 5.0, 13.0, 19.0, 17.0, 24.0, 23.0, 32.0, 40.0, 42.0, 46.0, 60.0, 59.0, 71.0, 74.0, 66.0, 59.0, 51.0, 37.0, 35.0, 40.0, 26.0, 30.0, 23.0, 16.0, 15.0, 15.0, 9.0, 7.0, 10.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.55684471130371, -25.677698135375977, -24.79854965209961, -23.919403076171875, -23.04025650024414, -22.161109924316406, -21.281963348388672, -20.402814865112305, -19.52366828918457, -18.644521713256836, -17.76537322998047, -16.886226654052734, -16.007080078125, -15.127933502197266, -14.248785972595215, -13.369638442993164, -12.49049186706543, -11.611345291137695, -10.732197761535645, -9.853050231933594, -8.97390365600586, -8.094757080078125, -7.215609550476074, -6.336462497711182, -5.457315444946289, -4.5781683921813965, -3.699021339416504, -2.8198742866516113, -1.9407272338867188, -1.0615801811218262, -0.1824331283569336, 0.696713924407959, 1.5758628845214844, 2.455009937286377, 3.3341569900512695, 4.213304042816162, 5.092451095581055, 5.971598148345947, 6.85074520111084, 7.729892253875732, 8.609039306640625, 9.48818588256836, 10.36733341217041, 11.246480941772461, 12.125627517700195, 13.00477409362793, 13.88392162322998, 14.763069152832031, 15.642215728759766, 16.5213623046875, 17.400508880615234, 18.2796573638916, 19.158803939819336, 20.03795051574707, 20.917098999023438, 21.796245574951172, 22.675392150878906, 23.55453872680664, 24.433685302734375, 25.312833786010742, 26.191980361938477, 27.07112693786621, 27.950275421142578, 28.829421997070312, 29.708568572998047]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 12.0, 18.0, 29.0, 36.0, 41.0, 80.0, 114.0, 159.0, 301.0, 467.0, 754.0, 1344.0, 2413.0, 4186.0, 7788.0, 14984.0, 29812.0, 63430.0, 139801.0, 285425.0, 261147.0, 123718.0, 56168.0, 26762.0, 13400.0, 6940.0, 3808.0, 2193.0, 1278.0, 764.0, 474.0, 249.0, 156.0, 102.0, 69.0, 49.0, 29.0, 16.0, 11.0, 10.0, 8.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.224273681640625, -3.11651611328125, -3.008758544921875, -2.9010009765625, -2.793243408203125, -2.68548583984375, -2.577728271484375, -2.469970703125, -2.362213134765625, -2.25445556640625, -2.146697998046875, -2.0389404296875, -1.931182861328125, -1.82342529296875, -1.715667724609375, -1.60791015625, -1.500152587890625, -1.39239501953125, -1.284637451171875, -1.1768798828125, -1.069122314453125, -0.96136474609375, -0.853607177734375, -0.745849609375, -0.638092041015625, -0.53033447265625, -0.422576904296875, -0.3148193359375, -0.207061767578125, -0.09930419921875, 0.008453369140625, 0.1162109375, 0.223968505859375, 0.33172607421875, 0.439483642578125, 0.5472412109375, 0.654998779296875, 0.76275634765625, 0.870513916015625, 0.978271484375, 1.086029052734375, 1.19378662109375, 1.301544189453125, 1.4093017578125, 1.517059326171875, 1.62481689453125, 1.732574462890625, 1.84033203125, 1.948089599609375, 2.05584716796875, 2.163604736328125, 2.2713623046875, 2.379119873046875, 2.48687744140625, 2.594635009765625, 2.702392578125, 2.810150146484375, 2.91790771484375, 3.025665283203125, 3.1334228515625, 3.241180419921875, 3.34893798828125, 3.456695556640625, 3.564453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 6.0, 12.0, 16.0, 10.0, 18.0, 8.0, 21.0, 30.0, 42.0, 32.0, 35.0, 35.0, 44.0, 42.0, 48.0, 45.0, 44.0, 49.0, 46.0, 50.0, 35.0, 37.0, 30.0, 37.0, 34.0, 22.0, 28.0, 25.0, 18.0, 17.0, 11.0, 13.0, 6.0, 7.0, 7.0, 8.0, 8.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.18341064453125, -2.1109619140625, -2.03851318359375, -1.966064453125, -1.89361572265625, -1.8211669921875, -1.74871826171875, -1.67626953125, -1.60382080078125, -1.5313720703125, -1.45892333984375, -1.386474609375, -1.31402587890625, -1.2415771484375, -1.16912841796875, -1.0966796875, -1.02423095703125, -0.9517822265625, -0.87933349609375, -0.806884765625, -0.73443603515625, -0.6619873046875, -0.58953857421875, -0.51708984375, -0.44464111328125, -0.3721923828125, -0.29974365234375, -0.227294921875, -0.15484619140625, -0.0823974609375, -0.00994873046875, 0.0625, 0.13494873046875, 0.2073974609375, 0.27984619140625, 0.352294921875, 0.42474365234375, 0.4971923828125, 0.56964111328125, 0.64208984375, 0.71453857421875, 0.7869873046875, 0.85943603515625, 0.931884765625, 1.00433349609375, 1.0767822265625, 1.14923095703125, 1.2216796875, 1.29412841796875, 1.3665771484375, 1.43902587890625, 1.511474609375, 1.58392333984375, 1.6563720703125, 1.72882080078125, 1.80126953125, 1.87371826171875, 1.9461669921875, 2.01861572265625, 2.091064453125, 2.16351318359375, 2.2359619140625, 2.30841064453125, 2.380859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 4.0, 23.0, 16.0, 23.0, 19.0, 57.0, 59.0, 82.0, 130.0, 184.0, 268.0, 387.0, 648.0, 1105.0, 2405.0, 7073.0, 33599.0, 281550.0, 659300.0, 46569.0, 8874.0, 2792.0, 1296.0, 711.0, 424.0, 291.0, 193.0, 134.0, 108.0, 61.0, 43.0, 36.0, 31.0, 10.0, 10.0, 11.0, 5.0, 4.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9453125, -7.69769287109375, -7.4500732421875, -7.20245361328125, -6.954833984375, -6.70721435546875, -6.4595947265625, -6.21197509765625, -5.96435546875, -5.71673583984375, -5.4691162109375, -5.22149658203125, -4.973876953125, -4.72625732421875, -4.4786376953125, -4.23101806640625, -3.9833984375, -3.73577880859375, -3.4881591796875, -3.24053955078125, -2.992919921875, -2.74530029296875, -2.4976806640625, -2.25006103515625, -2.00244140625, -1.75482177734375, -1.5072021484375, -1.25958251953125, -1.011962890625, -0.76434326171875, -0.5167236328125, -0.26910400390625, -0.021484375, 0.22613525390625, 0.4737548828125, 0.72137451171875, 0.968994140625, 1.21661376953125, 1.4642333984375, 1.71185302734375, 1.95947265625, 2.20709228515625, 2.4547119140625, 2.70233154296875, 2.949951171875, 3.19757080078125, 3.4451904296875, 3.69281005859375, 3.9404296875, 4.18804931640625, 4.4356689453125, 4.68328857421875, 4.930908203125, 5.17852783203125, 5.4261474609375, 5.67376708984375, 5.92138671875, 6.16900634765625, 6.4166259765625, 6.66424560546875, 6.911865234375, 7.15948486328125, 7.4071044921875, 7.65472412109375, 7.90234375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 12.0, 17.0, 17.0, 26.0, 17.0, 16.0, 22.0, 26.0, 40.0, 42.0, 50.0, 44.0, 50.0, 58.0, 74.0, 64.0, 63.0, 40.0, 35.0, 45.0, 23.0, 32.0, 24.0, 20.0, 17.0, 14.0, 23.0, 17.0, 11.0, 8.0, 7.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1875, -8.9129638671875, -8.638427734375, -8.3638916015625, -8.08935546875, -7.8148193359375, -7.540283203125, -7.2657470703125, -6.9912109375, -6.7166748046875, -6.442138671875, -6.1676025390625, -5.89306640625, -5.6185302734375, -5.343994140625, -5.0694580078125, -4.794921875, -4.5203857421875, -4.245849609375, -3.9713134765625, -3.69677734375, -3.4222412109375, -3.147705078125, -2.8731689453125, -2.5986328125, -2.3240966796875, -2.049560546875, -1.7750244140625, -1.50048828125, -1.2259521484375, -0.951416015625, -0.6768798828125, -0.40234375, -0.1278076171875, 0.146728515625, 0.4212646484375, 0.69580078125, 0.9703369140625, 1.244873046875, 1.5194091796875, 1.7939453125, 2.0684814453125, 2.343017578125, 2.6175537109375, 2.89208984375, 3.1666259765625, 3.441162109375, 3.7156982421875, 3.990234375, 4.2647705078125, 4.539306640625, 4.8138427734375, 5.08837890625, 5.3629150390625, 5.637451171875, 5.9119873046875, 6.1865234375, 6.4610595703125, 6.735595703125, 7.0101318359375, 7.28466796875, 7.5592041015625, 7.833740234375, 8.1082763671875, 8.3828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 5.0, 6.0, 4.0, 8.0, 19.0, 19.0, 18.0, 49.0, 65.0, 126.0, 246.0, 490.0, 1295.0, 4703.0, 32141.0, 719145.0, 264397.0, 20420.0, 3458.0, 1000.0, 428.0, 215.0, 129.0, 49.0, 43.0, 15.0, 19.0, 14.0, 14.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.234375, -3.1552886962890625, -3.076202392578125, -2.9971160888671875, -2.91802978515625, -2.8389434814453125, -2.759857177734375, -2.6807708740234375, -2.6016845703125, -2.5225982666015625, -2.443511962890625, -2.3644256591796875, -2.28533935546875, -2.2062530517578125, -2.127166748046875, -2.0480804443359375, -1.968994140625, -1.8899078369140625, -1.810821533203125, -1.7317352294921875, -1.65264892578125, -1.5735626220703125, -1.494476318359375, -1.4153900146484375, -1.3363037109375, -1.2572174072265625, -1.178131103515625, -1.0990447998046875, -1.01995849609375, -0.9408721923828125, -0.861785888671875, -0.7826995849609375, -0.70361328125, -0.6245269775390625, -0.545440673828125, -0.4663543701171875, -0.38726806640625, -0.3081817626953125, -0.229095458984375, -0.1500091552734375, -0.0709228515625, 0.0081634521484375, 0.087249755859375, 0.1663360595703125, 0.24542236328125, 0.3245086669921875, 0.403594970703125, 0.4826812744140625, 0.561767578125, 0.6408538818359375, 0.719940185546875, 0.7990264892578125, 0.87811279296875, 0.9571990966796875, 1.036285400390625, 1.1153717041015625, 1.1944580078125, 1.2735443115234375, 1.352630615234375, 1.4317169189453125, 1.51080322265625, 1.5898895263671875, 1.668975830078125, 1.7480621337890625, 1.8271484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 9.0, 6.0, 14.0, 20.0, 28.0, 23.0, 42.0, 46.0, 58.0, 84.0, 120.0, 104.0, 99.0, 76.0, 62.0, 49.0, 36.0, 36.0, 14.0, 12.0, 10.0, 13.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006017684936523438, -0.0005847364664077759, -0.000567704439163208, -0.0005506724119186401, -0.0005336403846740723, -0.0005166083574295044, -0.0004995763301849365, -0.00048254430294036865, -0.0004655122756958008, -0.0004484802484512329, -0.00043144822120666504, -0.00041441619396209717, -0.0003973841667175293, -0.0003803521394729614, -0.00036332011222839355, -0.0003462880849838257, -0.0003292560577392578, -0.00031222403049468994, -0.00029519200325012207, -0.0002781599760055542, -0.00026112794876098633, -0.00024409592151641846, -0.00022706389427185059, -0.00021003186702728271, -0.00019299983978271484, -0.00017596781253814697, -0.0001589357852935791, -0.00014190375804901123, -0.00012487173080444336, -0.00010783970355987549, -9.080767631530762e-05, -7.377564907073975e-05, -5.6743621826171875e-05, -3.9711594581604004e-05, -2.2679567337036133e-05, -5.647540092468262e-06, 1.138448715209961e-05, 2.841651439666748e-05, 4.544854164123535e-05, 6.248056888580322e-05, 7.95125961303711e-05, 9.654462337493896e-05, 0.00011357665061950684, 0.0001306086778640747, 0.00014764070510864258, 0.00016467273235321045, 0.00018170475959777832, 0.0001987367868423462, 0.00021576881408691406, 0.00023280084133148193, 0.0002498328685760498, 0.0002668648958206177, 0.00028389692306518555, 0.0003009289503097534, 0.0003179609775543213, 0.00033499300479888916, 0.00035202503204345703, 0.0003690570592880249, 0.0003860890865325928, 0.00040312111377716064, 0.0004201531410217285, 0.0004371851682662964, 0.00045421719551086426, 0.00047124922275543213, 0.00048828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 10.0, 6.0, 11.0, 16.0, 24.0, 26.0, 57.0, 58.0, 128.0, 179.0, 308.0, 475.0, 947.0, 2043.0, 5947.0, 25838.0, 215241.0, 724100.0, 57107.0, 10093.0, 2991.0, 1268.0, 636.0, 348.0, 236.0, 140.0, 81.0, 79.0, 41.0, 28.0, 23.0, 11.0, 13.0, 9.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8427734375, -1.785552978515625, -1.72833251953125, -1.671112060546875, -1.6138916015625, -1.556671142578125, -1.49945068359375, -1.442230224609375, -1.385009765625, -1.327789306640625, -1.27056884765625, -1.213348388671875, -1.1561279296875, -1.098907470703125, -1.04168701171875, -0.984466552734375, -0.92724609375, -0.870025634765625, -0.81280517578125, -0.755584716796875, -0.6983642578125, -0.641143798828125, -0.58392333984375, -0.526702880859375, -0.469482421875, -0.412261962890625, -0.35504150390625, -0.297821044921875, -0.2406005859375, -0.183380126953125, -0.12615966796875, -0.068939208984375, -0.01171875, 0.045501708984375, 0.10272216796875, 0.159942626953125, 0.2171630859375, 0.274383544921875, 0.33160400390625, 0.388824462890625, 0.446044921875, 0.503265380859375, 0.56048583984375, 0.617706298828125, 0.6749267578125, 0.732147216796875, 0.78936767578125, 0.846588134765625, 0.90380859375, 0.961029052734375, 1.01824951171875, 1.075469970703125, 1.1326904296875, 1.189910888671875, 1.24713134765625, 1.304351806640625, 1.361572265625, 1.418792724609375, 1.47601318359375, 1.533233642578125, 1.5904541015625, 1.647674560546875, 1.70489501953125, 1.762115478515625, 1.8193359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 4.0, 4.0, 9.0, 9.0, 12.0, 16.0, 22.0, 26.0, 44.0, 42.0, 42.0, 57.0, 73.0, 74.0, 83.0, 89.0, 74.0, 51.0, 47.0, 37.0, 27.0, 27.0, 17.0, 14.0, 15.0, 15.0, 13.0, 11.0, 2.0, 4.0, 11.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.73046875, -1.6787261962890625, -1.626983642578125, -1.5752410888671875, -1.52349853515625, -1.4717559814453125, -1.420013427734375, -1.3682708740234375, -1.3165283203125, -1.2647857666015625, -1.213043212890625, -1.1613006591796875, -1.10955810546875, -1.0578155517578125, -1.006072998046875, -0.9543304443359375, -0.902587890625, -0.8508453369140625, -0.799102783203125, -0.7473602294921875, -0.69561767578125, -0.6438751220703125, -0.592132568359375, -0.5403900146484375, -0.4886474609375, -0.4369049072265625, -0.385162353515625, -0.3334197998046875, -0.28167724609375, -0.2299346923828125, -0.178192138671875, -0.1264495849609375, -0.07470703125, -0.0229644775390625, 0.028778076171875, 0.0805206298828125, 0.13226318359375, 0.1840057373046875, 0.235748291015625, 0.2874908447265625, 0.3392333984375, 0.3909759521484375, 0.442718505859375, 0.4944610595703125, 0.54620361328125, 0.5979461669921875, 0.649688720703125, 0.7014312744140625, 0.753173828125, 0.8049163818359375, 0.856658935546875, 0.9084014892578125, 0.96014404296875, 1.0118865966796875, 1.063629150390625, 1.1153717041015625, 1.1671142578125, 1.2188568115234375, 1.270599365234375, 1.3223419189453125, 1.37408447265625, 1.4258270263671875, 1.477569580078125, 1.5293121337890625, 1.5810546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 3.0, 17.0, 29.0, 39.0, 66.0, 136.0, 325.0, 136.0, 107.0, 53.0, 30.0, 23.0, 14.0, 7.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.87493133544922, -44.46272277832031, -43.05051040649414, -41.638301849365234, -40.22609329223633, -38.813880920410156, -37.40167236328125, -35.989463806152344, -34.57725524902344, -33.16504669189453, -31.752836227416992, -30.340625762939453, -28.928417205810547, -27.516206741333008, -26.10399627685547, -24.691787719726562, -23.27957534790039, -21.86736488342285, -20.455156326293945, -19.042945861816406, -17.6307373046875, -16.21852684020996, -14.806316375732422, -13.3941068649292, -11.981897354125977, -10.569687843322754, -9.157478332519531, -7.745267868041992, -6.3330583572387695, -4.920848846435547, -3.508638381958008, -2.096428871154785, -0.6842231750488281, 0.7279865741729736, 2.1401963233947754, 3.5524063110351562, 4.964615821838379, 6.376825332641602, 7.789035797119141, 9.201245307922363, 10.613454818725586, 12.025664329528809, 13.437873840332031, 14.85008430480957, 16.26229476928711, 17.674503326416016, 19.086713790893555, 20.498924255371094, 21.9111328125, 23.32334327697754, 24.735551834106445, 26.147762298583984, 27.55997085571289, 28.97218132019043, 30.38439178466797, 31.796600341796875, 33.20880889892578, 34.62101745605469, 36.03322982788086, 37.445438385009766, 38.85764694213867, 40.269859313964844, 41.68206787109375, 43.094276428222656, 44.50648880004883]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 4.0, 3.0, 8.0, 6.0, 10.0, 10.0, 15.0, 24.0, 21.0, 15.0, 27.0, 23.0, 23.0, 29.0, 32.0, 48.0, 55.0, 133.0, 135.0, 66.0, 28.0, 35.0, 36.0, 21.0, 36.0, 25.0, 19.0, 12.0, 21.0, 13.0, 15.0, 11.0, 9.0, 11.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.195968627929688, -30.15711212158203, -29.118255615234375, -28.07939910888672, -27.04054069519043, -26.001684188842773, -24.962827682495117, -23.92397117614746, -22.885112762451172, -21.846256256103516, -20.80739974975586, -19.768543243408203, -18.729684829711914, -17.690828323364258, -16.6519718170166, -15.613115310668945, -14.574258804321289, -13.535402297973633, -12.49654483795166, -11.457688331604004, -10.418830871582031, -9.379974365234375, -8.341117858886719, -7.302260875701904, -6.26340389251709, -5.224546909332275, -4.185689926147461, -3.1468334197998047, -2.1079764366149902, -1.0691194534301758, -0.03026294708251953, 1.008594036102295, 2.0474510192871094, 3.086308002471924, 4.125164985656738, 5.1640214920043945, 6.202878475189209, 7.241735458374023, 8.28059196472168, 9.319448471069336, 10.358305931091309, 11.397162437438965, 12.436019897460938, 13.474876403808594, 14.51373291015625, 15.552590370178223, 16.591445922851562, 17.63030433654785, 18.669160842895508, 19.708017349243164, 20.74687385559082, 21.78573226928711, 22.824588775634766, 23.863445281982422, 24.902301788330078, 25.941158294677734, 26.98001480102539, 28.018871307373047, 29.057727813720703, 30.09658432006836, 31.13544273376465, 32.17430114746094, 33.213157653808594, 34.25201416015625, 35.290870666503906]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 3.0, 21.0, 26.0, 29.0, 55.0, 78.0, 101.0, 174.0, 277.0, 481.0, 812.0, 1299.0, 2380.0, 4850.0, 10510.0, 27754.0, 95142.0, 383526.0, 1332801.0, 1614825.0, 529736.0, 127925.0, 35782.0, 13186.0, 5728.0, 2894.0, 1571.0, 883.0, 507.0, 308.0, 196.0, 131.0, 89.0, 61.0, 38.0, 28.0, 16.0, 16.0, 11.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9140625, -2.820404052734375, -2.72674560546875, -2.633087158203125, -2.5394287109375, -2.445770263671875, -2.35211181640625, -2.258453369140625, -2.164794921875, -2.071136474609375, -1.97747802734375, -1.883819580078125, -1.7901611328125, -1.696502685546875, -1.60284423828125, -1.509185791015625, -1.41552734375, -1.321868896484375, -1.22821044921875, -1.134552001953125, -1.0408935546875, -0.947235107421875, -0.85357666015625, -0.759918212890625, -0.666259765625, -0.572601318359375, -0.47894287109375, -0.385284423828125, -0.2916259765625, -0.197967529296875, -0.10430908203125, -0.010650634765625, 0.0830078125, 0.176666259765625, 0.27032470703125, 0.363983154296875, 0.4576416015625, 0.551300048828125, 0.64495849609375, 0.738616943359375, 0.832275390625, 0.925933837890625, 1.01959228515625, 1.113250732421875, 1.2069091796875, 1.300567626953125, 1.39422607421875, 1.487884521484375, 1.58154296875, 1.675201416015625, 1.76885986328125, 1.862518310546875, 1.9561767578125, 2.049835205078125, 2.14349365234375, 2.237152099609375, 2.330810546875, 2.424468994140625, 2.51812744140625, 2.611785888671875, 2.7054443359375, 2.799102783203125, 2.89276123046875, 2.986419677734375, 3.080078125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 13.0, 7.0, 9.0, 9.0, 12.0, 7.0, 13.0, 17.0, 16.0, 32.0, 22.0, 25.0, 31.0, 25.0, 37.0, 35.0, 47.0, 38.0, 38.0, 48.0, 40.0, 44.0, 43.0, 39.0, 37.0, 39.0, 31.0, 33.0, 24.0, 24.0, 28.0, 22.0, 24.0, 16.0, 13.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 9.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-1.943359375, -1.88494873046875, -1.8265380859375, -1.76812744140625, -1.709716796875, -1.65130615234375, -1.5928955078125, -1.53448486328125, -1.47607421875, -1.41766357421875, -1.3592529296875, -1.30084228515625, -1.242431640625, -1.18402099609375, -1.1256103515625, -1.06719970703125, -1.0087890625, -0.95037841796875, -0.8919677734375, -0.83355712890625, -0.775146484375, -0.71673583984375, -0.6583251953125, -0.59991455078125, -0.54150390625, -0.48309326171875, -0.4246826171875, -0.36627197265625, -0.307861328125, -0.24945068359375, -0.1910400390625, -0.13262939453125, -0.07421875, -0.01580810546875, 0.0426025390625, 0.10101318359375, 0.159423828125, 0.21783447265625, 0.2762451171875, 0.33465576171875, 0.39306640625, 0.45147705078125, 0.5098876953125, 0.56829833984375, 0.626708984375, 0.68511962890625, 0.7435302734375, 0.80194091796875, 0.8603515625, 0.91876220703125, 0.9771728515625, 1.03558349609375, 1.093994140625, 1.15240478515625, 1.2108154296875, 1.26922607421875, 1.32763671875, 1.38604736328125, 1.4444580078125, 1.50286865234375, 1.561279296875, 1.61968994140625, 1.6781005859375, 1.73651123046875, 1.794921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 22.0, 45.0, 58.0, 114.0, 208.0, 454.0, 936.0, 2825.0, 25174.0, 3959434.0, 196293.0, 5979.0, 1499.0, 559.0, 296.0, 165.0, 97.0, 34.0, 35.0, 15.0, 12.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.783935546875, -13.28662109375, -12.789306640625, -12.2919921875, -11.794677734375, -11.29736328125, -10.800048828125, -10.302734375, -9.805419921875, -9.30810546875, -8.810791015625, -8.3134765625, -7.816162109375, -7.31884765625, -6.821533203125, -6.32421875, -5.826904296875, -5.32958984375, -4.832275390625, -4.3349609375, -3.837646484375, -3.34033203125, -2.843017578125, -2.345703125, -1.848388671875, -1.35107421875, -0.853759765625, -0.3564453125, 0.140869140625, 0.63818359375, 1.135498046875, 1.6328125, 2.130126953125, 2.62744140625, 3.124755859375, 3.6220703125, 4.119384765625, 4.61669921875, 5.114013671875, 5.611328125, 6.108642578125, 6.60595703125, 7.103271484375, 7.6005859375, 8.097900390625, 8.59521484375, 9.092529296875, 9.58984375, 10.087158203125, 10.58447265625, 11.081787109375, 11.5791015625, 12.076416015625, 12.57373046875, 13.071044921875, 13.568359375, 14.065673828125, 14.56298828125, 15.060302734375, 15.5576171875, 16.054931640625, 16.55224609375, 17.049560546875, 17.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 20.0, 24.0, 37.0, 64.0, 90.0, 105.0, 152.0, 237.0, 340.0, 506.0, 637.0, 580.0, 378.0, 282.0, 186.0, 126.0, 95.0, 69.0, 47.0, 23.0, 17.0, 22.0, 10.0, 5.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-10.453125, -10.2135009765625, -9.973876953125, -9.7342529296875, -9.49462890625, -9.2550048828125, -9.015380859375, -8.7757568359375, -8.5361328125, -8.2965087890625, -8.056884765625, -7.8172607421875, -7.57763671875, -7.3380126953125, -7.098388671875, -6.8587646484375, -6.619140625, -6.3795166015625, -6.139892578125, -5.9002685546875, -5.66064453125, -5.4210205078125, -5.181396484375, -4.9417724609375, -4.7021484375, -4.4625244140625, -4.222900390625, -3.9832763671875, -3.74365234375, -3.5040283203125, -3.264404296875, -3.0247802734375, -2.78515625, -2.5455322265625, -2.305908203125, -2.0662841796875, -1.82666015625, -1.5870361328125, -1.347412109375, -1.1077880859375, -0.8681640625, -0.6285400390625, -0.388916015625, -0.1492919921875, 0.09033203125, 0.3299560546875, 0.569580078125, 0.8092041015625, 1.048828125, 1.2884521484375, 1.528076171875, 1.7677001953125, 2.00732421875, 2.2469482421875, 2.486572265625, 2.7261962890625, 2.9658203125, 3.2054443359375, 3.445068359375, 3.6846923828125, 3.92431640625, 4.1639404296875, 4.403564453125, 4.6431884765625, 4.8828125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 7.0, 12.0, 13.0, 20.0, 21.0, 53.0, 88.0, 122.0, 175.0, 156.0, 108.0, 73.0, 43.0, 18.0, 24.0, 15.0, 6.0, 8.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-67.07365417480469, -65.02252960205078, -62.97140884399414, -60.9202880859375, -58.869163513183594, -56.81804275512695, -54.76692199707031, -52.715797424316406, -50.6646728515625, -48.61355209350586, -46.56242752075195, -44.51130676269531, -42.460182189941406, -40.409061431884766, -38.357940673828125, -36.30681610107422, -34.25569534301758, -32.20457458496094, -30.15345001220703, -28.10232925415039, -26.051204681396484, -24.000083923339844, -21.94896125793457, -19.897838592529297, -17.846715927124023, -15.79559326171875, -13.744470596313477, -11.69334888458252, -9.642226219177246, -7.591103553771973, -5.539981842041016, -3.488859176635742, -1.4377365112304688, 0.6133859157562256, 2.66450834274292, 4.715630531311035, 6.766753196716309, 8.817875862121582, 10.868997573852539, 12.920120239257812, 14.971242904663086, 17.02236557006836, 19.073488235473633, 21.124610900878906, 23.175731658935547, 25.226856231689453, 27.277976989746094, 29.329099655151367, 31.38022232055664, 33.43134307861328, 35.48246765136719, 37.53358840942383, 39.584712982177734, 41.635833740234375, 43.68695831298828, 45.73807907104492, 47.78919982910156, 49.8403205871582, 51.89144515991211, 53.94256591796875, 55.993690490722656, 58.0448112487793, 60.09593200683594, 62.147056579589844, 64.19818115234375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 12.0, 10.0, 11.0, 19.0, 19.0, 15.0, 18.0, 28.0, 25.0, 25.0, 39.0, 55.0, 58.0, 42.0, 53.0, 54.0, 64.0, 56.0, 63.0, 41.0, 40.0, 47.0, 31.0, 23.0, 26.0, 32.0, 13.0, 11.0, 15.0, 10.0, 6.0, 4.0, 7.0, 2.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.854557037353516, -43.54741668701172, -42.24028015136719, -40.93313980102539, -39.625999450683594, -38.31886291503906, -37.011722564697266, -35.70458221435547, -34.39744567871094, -33.09030532836914, -31.783166885375977, -30.476028442382812, -29.168888092041016, -27.86174964904785, -26.554611206054688, -25.24747085571289, -23.940330505371094, -22.63319206237793, -21.326051712036133, -20.01891326904297, -18.711772918701172, -17.404634475708008, -16.097496032714844, -14.790356636047363, -13.483217239379883, -12.176077842712402, -10.868938446044922, -9.561800003051758, -8.254660606384277, -6.947521209716797, -5.640382289886475, -4.333243370056152, -3.0261001586914062, -1.7189610004425049, -0.4118218421936035, 0.8953173160552979, 2.202456474304199, 3.5095958709716797, 4.816734790802002, 6.123873710632324, 7.431013107299805, 8.738152503967285, 10.045291900634766, 11.35243034362793, 12.65956974029541, 13.96670913696289, 15.273847579956055, 16.58098602294922, 17.888126373291016, 19.19526481628418, 20.502405166625977, 21.80954360961914, 23.116683959960938, 24.4238224029541, 25.730960845947266, 27.038101196289062, 28.345239639282227, 29.65237808227539, 30.959518432617188, 32.266658782958984, 33.573795318603516, 34.88093566894531, 36.18807601928711, 37.49521255493164, 38.80235290527344]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 8.0, 11.0, 12.0, 14.0, 23.0, 43.0, 79.0, 113.0, 212.0, 314.0, 591.0, 1104.0, 2322.0, 5043.0, 12389.0, 34646.0, 120766.0, 569686.0, 215846.0, 54258.0, 17849.0, 6874.0, 3090.0, 1458.0, 780.0, 415.0, 241.0, 146.0, 82.0, 54.0, 29.0, 22.0, 14.0, 12.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33984375, -5.18133544921875, -5.0228271484375, -4.86431884765625, -4.705810546875, -4.54730224609375, -4.3887939453125, -4.23028564453125, -4.07177734375, -3.91326904296875, -3.7547607421875, -3.59625244140625, -3.437744140625, -3.27923583984375, -3.1207275390625, -2.96221923828125, -2.8037109375, -2.64520263671875, -2.4866943359375, -2.32818603515625, -2.169677734375, -2.01116943359375, -1.8526611328125, -1.69415283203125, -1.53564453125, -1.37713623046875, -1.2186279296875, -1.06011962890625, -0.901611328125, -0.74310302734375, -0.5845947265625, -0.42608642578125, -0.267578125, -0.10906982421875, 0.0494384765625, 0.20794677734375, 0.366455078125, 0.52496337890625, 0.6834716796875, 0.84197998046875, 1.00048828125, 1.15899658203125, 1.3175048828125, 1.47601318359375, 1.634521484375, 1.79302978515625, 1.9515380859375, 2.11004638671875, 2.2685546875, 2.42706298828125, 2.5855712890625, 2.74407958984375, 2.902587890625, 3.06109619140625, 3.2196044921875, 3.37811279296875, 3.53662109375, 3.69512939453125, 3.8536376953125, 4.01214599609375, 4.170654296875, 4.32916259765625, 4.4876708984375, 4.64617919921875, 4.8046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 7.0, 17.0, 14.0, 8.0, 12.0, 16.0, 23.0, 16.0, 22.0, 24.0, 23.0, 41.0, 44.0, 35.0, 37.0, 43.0, 53.0, 36.0, 45.0, 46.0, 49.0, 41.0, 39.0, 42.0, 43.0, 26.0, 23.0, 26.0, 30.0, 9.0, 24.0, 17.0, 15.0, 12.0, 11.0, 6.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.086273193359375, -2.01239013671875, -1.938507080078125, -1.8646240234375, -1.790740966796875, -1.71685791015625, -1.642974853515625, -1.569091796875, -1.495208740234375, -1.42132568359375, -1.347442626953125, -1.2735595703125, -1.199676513671875, -1.12579345703125, -1.051910400390625, -0.97802734375, -0.904144287109375, -0.83026123046875, -0.756378173828125, -0.6824951171875, -0.608612060546875, -0.53472900390625, -0.460845947265625, -0.386962890625, -0.313079833984375, -0.23919677734375, -0.165313720703125, -0.0914306640625, -0.017547607421875, 0.05633544921875, 0.130218505859375, 0.2041015625, 0.277984619140625, 0.35186767578125, 0.425750732421875, 0.4996337890625, 0.573516845703125, 0.64739990234375, 0.721282958984375, 0.795166015625, 0.869049072265625, 0.94293212890625, 1.016815185546875, 1.0906982421875, 1.164581298828125, 1.23846435546875, 1.312347412109375, 1.38623046875, 1.460113525390625, 1.53399658203125, 1.607879638671875, 1.6817626953125, 1.755645751953125, 1.82952880859375, 1.903411865234375, 1.977294921875, 2.051177978515625, 2.12506103515625, 2.198944091796875, 2.2728271484375, 2.346710205078125, 2.42059326171875, 2.494476318359375, 2.568359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 1.0, 11.0, 7.0, 11.0, 26.0, 20.0, 25.0, 64.0, 72.0, 120.0, 195.0, 292.0, 561.0, 1099.0, 2767.0, 11548.0, 84094.0, 885827.0, 49238.0, 8111.0, 2257.0, 948.0, 479.0, 278.0, 149.0, 108.0, 84.0, 49.0, 31.0, 30.0, 14.0, 19.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.35516357421875, -7.1048583984375, -6.85455322265625, -6.604248046875, -6.35394287109375, -6.1036376953125, -5.85333251953125, -5.60302734375, -5.35272216796875, -5.1024169921875, -4.85211181640625, -4.601806640625, -4.35150146484375, -4.1011962890625, -3.85089111328125, -3.6005859375, -3.35028076171875, -3.0999755859375, -2.84967041015625, -2.599365234375, -2.34906005859375, -2.0987548828125, -1.84844970703125, -1.59814453125, -1.34783935546875, -1.0975341796875, -0.84722900390625, -0.596923828125, -0.34661865234375, -0.0963134765625, 0.15399169921875, 0.404296875, 0.65460205078125, 0.9049072265625, 1.15521240234375, 1.405517578125, 1.65582275390625, 1.9061279296875, 2.15643310546875, 2.40673828125, 2.65704345703125, 2.9073486328125, 3.15765380859375, 3.407958984375, 3.65826416015625, 3.9085693359375, 4.15887451171875, 4.4091796875, 4.65948486328125, 4.9097900390625, 5.16009521484375, 5.410400390625, 5.66070556640625, 5.9110107421875, 6.16131591796875, 6.41162109375, 6.66192626953125, 6.9122314453125, 7.16253662109375, 7.412841796875, 7.66314697265625, 7.9134521484375, 8.16375732421875, 8.4140625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 6.0, 9.0, 9.0, 9.0, 12.0, 18.0, 10.0, 23.0, 17.0, 26.0, 22.0, 26.0, 32.0, 43.0, 48.0, 66.0, 76.0, 74.0, 60.0, 61.0, 42.0, 51.0, 40.0, 31.0, 29.0, 17.0, 14.0, 21.0, 11.0, 15.0, 7.0, 11.0, 13.0, 11.0, 5.0, 8.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0234375, -9.7225341796875, -9.421630859375, -9.1207275390625, -8.81982421875, -8.5189208984375, -8.218017578125, -7.9171142578125, -7.6162109375, -7.3153076171875, -7.014404296875, -6.7135009765625, -6.41259765625, -6.1116943359375, -5.810791015625, -5.5098876953125, -5.208984375, -4.9080810546875, -4.607177734375, -4.3062744140625, -4.00537109375, -3.7044677734375, -3.403564453125, -3.1026611328125, -2.8017578125, -2.5008544921875, -2.199951171875, -1.8990478515625, -1.59814453125, -1.2972412109375, -0.996337890625, -0.6954345703125, -0.39453125, -0.0936279296875, 0.207275390625, 0.5081787109375, 0.80908203125, 1.1099853515625, 1.410888671875, 1.7117919921875, 2.0126953125, 2.3135986328125, 2.614501953125, 2.9154052734375, 3.21630859375, 3.5172119140625, 3.818115234375, 4.1190185546875, 4.419921875, 4.7208251953125, 5.021728515625, 5.3226318359375, 5.62353515625, 5.9244384765625, 6.225341796875, 6.5262451171875, 6.8271484375, 7.1280517578125, 7.428955078125, 7.7298583984375, 8.03076171875, 8.3316650390625, 8.632568359375, 8.9334716796875, 9.234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 7.0, 4.0, 6.0, 14.0, 21.0, 20.0, 31.0, 47.0, 62.0, 100.0, 149.0, 296.0, 593.0, 1495.0, 4643.0, 20921.0, 764538.0, 231114.0, 17682.0, 4120.0, 1402.0, 589.0, 261.0, 149.0, 79.0, 55.0, 39.0, 30.0, 23.0, 25.0, 9.0, 11.0, 4.0, 5.0, 6.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.701171875, -1.644378662109375, -1.58758544921875, -1.530792236328125, -1.4739990234375, -1.417205810546875, -1.36041259765625, -1.303619384765625, -1.246826171875, -1.190032958984375, -1.13323974609375, -1.076446533203125, -1.0196533203125, -0.962860107421875, -0.90606689453125, -0.849273681640625, -0.79248046875, -0.735687255859375, -0.67889404296875, -0.622100830078125, -0.5653076171875, -0.508514404296875, -0.45172119140625, -0.394927978515625, -0.338134765625, -0.281341552734375, -0.22454833984375, -0.167755126953125, -0.1109619140625, -0.054168701171875, 0.00262451171875, 0.059417724609375, 0.1162109375, 0.173004150390625, 0.22979736328125, 0.286590576171875, 0.3433837890625, 0.400177001953125, 0.45697021484375, 0.513763427734375, 0.570556640625, 0.627349853515625, 0.68414306640625, 0.740936279296875, 0.7977294921875, 0.854522705078125, 0.91131591796875, 0.968109130859375, 1.02490234375, 1.081695556640625, 1.13848876953125, 1.195281982421875, 1.2520751953125, 1.308868408203125, 1.36566162109375, 1.422454833984375, 1.479248046875, 1.536041259765625, 1.59283447265625, 1.649627685546875, 1.7064208984375, 1.763214111328125, 1.82000732421875, 1.876800537109375, 1.93359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 5.0, 9.0, 8.0, 9.0, 14.0, 12.0, 13.0, 28.0, 22.0, 45.0, 68.0, 82.0, 114.0, 135.0, 107.0, 76.0, 60.0, 43.0, 25.0, 23.0, 17.0, 13.0, 12.0, 4.0, 6.0, 5.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.000461578369140625, -0.00044780224561691284, -0.0004340261220932007, -0.0004202499985694885, -0.00040647387504577637, -0.0003926977515220642, -0.00037892162799835205, -0.0003651455044746399, -0.00035136938095092773, -0.0003375932574272156, -0.0003238171339035034, -0.00031004101037979126, -0.0002962648868560791, -0.00028248876333236694, -0.0002687126398086548, -0.0002549365162849426, -0.00024116039276123047, -0.0002273842692375183, -0.00021360814571380615, -0.000199832022190094, -0.00018605589866638184, -0.00017227977514266968, -0.00015850365161895752, -0.00014472752809524536, -0.0001309514045715332, -0.00011717528104782104, -0.00010339915752410889, -8.962303400039673e-05, -7.584691047668457e-05, -6.207078695297241e-05, -4.8294663429260254e-05, -3.4518539905548096e-05, -2.0742416381835938e-05, -6.966292858123779e-06, 6.809830665588379e-06, 2.0585954189300537e-05, 3.4362077713012695e-05, 4.8138201236724854e-05, 6.191432476043701e-05, 7.569044828414917e-05, 8.946657180786133e-05, 0.00010324269533157349, 0.00011701881885528564, 0.0001307949423789978, 0.00014457106590270996, 0.00015834718942642212, 0.00017212331295013428, 0.00018589943647384644, 0.0001996755599975586, 0.00021345168352127075, 0.0002272278070449829, 0.00024100393056869507, 0.0002547800540924072, 0.0002685561776161194, 0.00028233230113983154, 0.0002961084246635437, 0.00030988454818725586, 0.000323660671710968, 0.0003374367952346802, 0.00035121291875839233, 0.0003649890422821045, 0.00037876516580581665, 0.0003925412893295288, 0.00040631741285324097, 0.0004200935363769531]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 11.0, 11.0, 10.0, 26.0, 24.0, 39.0, 57.0, 84.0, 100.0, 142.0, 248.0, 404.0, 692.0, 1487.0, 3199.0, 8551.0, 32971.0, 743219.0, 217853.0, 26394.0, 7138.0, 2792.0, 1268.0, 695.0, 383.0, 248.0, 143.0, 103.0, 75.0, 42.0, 28.0, 31.0, 23.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.2255859375, -1.1914749145507812, -1.1573638916015625, -1.1232528686523438, -1.089141845703125, -1.0550308227539062, -1.0209197998046875, -0.9868087768554688, -0.95269775390625, -0.9185867309570312, -0.8844757080078125, -0.8503646850585938, -0.816253662109375, -0.7821426391601562, -0.7480316162109375, -0.7139205932617188, -0.6798095703125, -0.6456985473632812, -0.6115875244140625, -0.5774765014648438, -0.543365478515625, -0.5092544555664062, -0.4751434326171875, -0.44103240966796875, -0.40692138671875, -0.37281036376953125, -0.3386993408203125, -0.30458831787109375, -0.270477294921875, -0.23636627197265625, -0.2022552490234375, -0.16814422607421875, -0.134033203125, -0.09992218017578125, -0.0658111572265625, -0.03170013427734375, 0.002410888671875, 0.03652191162109375, 0.0706329345703125, 0.10474395751953125, 0.13885498046875, 0.17296600341796875, 0.2070770263671875, 0.24118804931640625, 0.275299072265625, 0.30941009521484375, 0.3435211181640625, 0.37763214111328125, 0.4117431640625, 0.44585418701171875, 0.4799652099609375, 0.5140762329101562, 0.548187255859375, 0.5822982788085938, 0.6164093017578125, 0.6505203247070312, 0.68463134765625, 0.7187423706054688, 0.7528533935546875, 0.7869644165039062, 0.821075439453125, 0.8551864624023438, 0.8892974853515625, 0.9234085083007812, 0.95751953125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 8.0, 6.0, 8.0, 4.0, 9.0, 8.0, 12.0, 18.0, 21.0, 36.0, 30.0, 43.0, 45.0, 66.0, 104.0, 101.0, 90.0, 90.0, 53.0, 53.0, 33.0, 25.0, 22.0, 20.0, 13.0, 11.0, 10.0, 7.0, 10.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0810546875, -1.0492324829101562, -1.0174102783203125, -0.9855880737304688, -0.953765869140625, -0.9219436645507812, -0.8901214599609375, -0.8582992553710938, -0.82647705078125, -0.7946548461914062, -0.7628326416015625, -0.7310104370117188, -0.699188232421875, -0.6673660278320312, -0.6355438232421875, -0.6037216186523438, -0.5718994140625, -0.5400772094726562, -0.5082550048828125, -0.47643280029296875, -0.444610595703125, -0.41278839111328125, -0.3809661865234375, -0.34914398193359375, -0.31732177734375, -0.28549957275390625, -0.2536773681640625, -0.22185516357421875, -0.190032958984375, -0.15821075439453125, -0.1263885498046875, -0.09456634521484375, -0.062744140625, -0.03092193603515625, 0.0009002685546875, 0.03272247314453125, 0.064544677734375, 0.09636688232421875, 0.1281890869140625, 0.16001129150390625, 0.19183349609375, 0.22365570068359375, 0.2554779052734375, 0.28730010986328125, 0.319122314453125, 0.35094451904296875, 0.3827667236328125, 0.41458892822265625, 0.4464111328125, 0.47823333740234375, 0.5100555419921875, 0.5418777465820312, 0.573699951171875, 0.6055221557617188, 0.6373443603515625, 0.6691665649414062, 0.70098876953125, 0.7328109741210938, 0.7646331787109375, 0.7964553833007812, 0.828277587890625, 0.8600997924804688, 0.8919219970703125, 0.9237442016601562, 0.95556640625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 3.0, 4.0, 25.0, 36.0, 73.0, 130.0, 519.0, 94.0, 49.0, 37.0, 12.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.2357177734375, -78.34186553955078, -76.44800567626953, -74.55415344238281, -72.66029357910156, -70.76644134521484, -68.87258911132812, -66.97872924804688, -65.08487701416016, -63.19102096557617, -61.29716491699219, -59.40331268310547, -57.509456634521484, -55.6156005859375, -53.72174835205078, -51.8278923034668, -49.93403625488281, -48.04018020629883, -46.146324157714844, -44.252471923828125, -42.35861587524414, -40.464759826660156, -38.57090759277344, -36.67705154418945, -34.78319549560547, -32.889339447021484, -30.995485305786133, -29.10163116455078, -27.207775115966797, -25.313919067382812, -23.42006492614746, -21.52621078491211, -19.632354736328125, -17.73849868774414, -15.844644546508789, -13.950789451599121, -12.056934356689453, -10.163079261779785, -8.269224166870117, -6.375369071960449, -4.481513977050781, -2.5876588821411133, -0.6938037872314453, 1.2000513076782227, 3.0939064025878906, 4.987761497497559, 6.881616592407227, 8.775471687316895, 10.669326782226562, 12.56318187713623, 14.457036972045898, 16.35089111328125, 18.244747161865234, 20.13860321044922, 22.03245735168457, 23.926311492919922, 25.820167541503906, 27.71402359008789, 29.607877731323242, 31.501731872558594, 33.39558792114258, 35.28944396972656, 37.18329620361328, 39.077152252197266, 40.97100830078125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 7.0, 11.0, 8.0, 15.0, 11.0, 24.0, 29.0, 28.0, 43.0, 34.0, 110.0, 374.0, 62.0, 32.0, 29.0, 30.0, 32.0, 29.0, 14.0, 12.0, 14.0, 15.0, 13.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.86162185668945, -51.583953857421875, -50.30628204345703, -49.02861404418945, -47.75094223022461, -46.47327423095703, -45.19560241699219, -43.91793441772461, -42.64026641845703, -41.36259841918945, -40.08492660522461, -38.80725860595703, -37.52958679199219, -36.25191879272461, -34.974246978759766, -33.69657897949219, -32.418907165527344, -31.141237258911133, -29.863567352294922, -28.58589744567871, -27.3082275390625, -26.030559539794922, -24.75288963317871, -23.4752197265625, -22.19754981994629, -20.919879913330078, -19.642210006713867, -18.364540100097656, -17.086872100830078, -15.80920124053955, -14.531532287597656, -13.253862380981445, -11.976188659667969, -10.698518753051758, -9.420848846435547, -8.143179893493652, -6.865509986877441, -5.5878400802612305, -4.310170650482178, -3.032501220703125, -1.754831314086914, -0.4771616458892822, 0.8005080223083496, 2.0781776905059814, 3.3558473587036133, 4.633517265319824, 5.911186695098877, 7.18885612487793, 8.46652603149414, 9.744195938110352, 11.021865844726562, 12.299534797668457, 13.577204704284668, 14.854874610900879, 16.132543563842773, 17.410213470458984, 18.687883377075195, 19.965553283691406, 21.243223190307617, 22.520893096923828, 23.798561096191406, 25.07623291015625, 26.353900909423828, 27.63157081604004, 28.90924072265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 4.0, 8.0, 7.0, 12.0, 12.0, 14.0, 16.0, 13.0, 26.0, 17.0, 25.0, 35.0, 31.0, 64.0, 123.0, 210.0, 85.0, 45.0, 38.0, 35.0, 23.0, 27.0, 14.0, 18.0, 14.0, 15.0, 13.0, 12.0, 12.0, 9.0, 3.0, 6.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.350067138671875, -2.27239990234375, -2.194732666015625, -2.1170654296875, -2.039398193359375, -1.96173095703125, -1.884063720703125, -1.806396484375, -1.728729248046875, -1.65106201171875, -1.573394775390625, -1.4957275390625, -1.418060302734375, -1.34039306640625, -1.262725830078125, -1.18505859375, -1.107391357421875, -1.02972412109375, -0.952056884765625, -0.8743896484375, -0.796722412109375, -0.71905517578125, -0.641387939453125, -0.563720703125, -0.486053466796875, -0.40838623046875, -0.330718994140625, -0.2530517578125, -0.175384521484375, -0.09771728515625, -0.020050048828125, 0.0576171875, 0.135284423828125, 0.21295166015625, 0.290618896484375, 0.3682861328125, 0.445953369140625, 0.52362060546875, 0.601287841796875, 0.678955078125, 0.756622314453125, 0.83428955078125, 0.911956787109375, 0.9896240234375, 1.067291259765625, 1.14495849609375, 1.222625732421875, 1.30029296875, 1.377960205078125, 1.45562744140625, 1.533294677734375, 1.6109619140625, 1.688629150390625, 1.76629638671875, 1.843963623046875, 1.921630859375, 1.999298095703125, 2.07696533203125, 2.154632568359375, 2.2322998046875, 2.309967041015625, 2.38763427734375, 2.465301513671875, 2.54296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 7.0, 10.0, 17.0, 20.0, 22.0, 33.0, 53.0, 62.0, 115.0, 209.0, 456.0, 953.0, 2562.0, 9164.0, 8181894.0, 181542.0, 7312.0, 2254.0, 856.0, 410.0, 202.0, 139.0, 62.0, 48.0, 38.0, 26.0, 18.0, 10.0, 14.0, 8.0, 10.0, 11.0, 4.0, 7.0, 7.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-17.026226043701172, -16.416513442993164, -15.80679988861084, -15.197086334228516, -14.587372779846191, -13.977659225463867, -13.36794662475586, -12.758233070373535, -12.148519515991211, -11.538805961608887, -10.929093360900879, -10.319379806518555, -9.70966625213623, -9.099952697753906, -8.490240097045898, -7.880526542663574, -7.270813941955566, -6.6611008644104, -6.051387310028076, -5.44167423248291, -4.831960678100586, -4.22224760055542, -3.612534523010254, -3.0028209686279297, -2.3931078910827637, -1.7833945751190186, -1.173681378364563, -0.5639681816101074, 0.045745134353637695, 0.6554584503173828, 1.2651715278625488, 1.874885082244873, 2.484598159790039, 3.094311475753784, 3.7040247917175293, 4.313737869262695, 4.9234514236450195, 5.5331645011901855, 6.142877578735352, 6.752591133117676, 7.362304210662842, 7.972017288208008, 8.581730842590332, 9.191444396972656, 9.801156997680664, 10.410870552062988, 11.020584106445312, 11.63029670715332, 12.240010261535645, 12.849723815917969, 13.459436416625977, 14.0691499710083, 14.678863525390625, 15.288576126098633, 15.898289680480957, 16.50800323486328, 17.11771583557129, 17.727428436279297, 18.337142944335938, 18.946855545043945, 19.556568145751953, 20.166282653808594, 20.7759952545166, 21.38570785522461, 21.99542236328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 3.0, 5.0, 2.0, 4.0, 6.0, 3.0, 7.0, 4.0, 4.0, 2.0, 3.0, 5.0, 8.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.60777473449707, -11.981675148010254, -11.355575561523438, -10.729476928710938, -10.103377342224121, -9.477277755737305, -8.851179122924805, -8.225079536437988, -7.598979949951172, -6.9728803634643555, -6.346781253814697, -5.720682144165039, -5.094582557678223, -4.468482971191406, -3.842383861541748, -3.21628475189209, -2.5901851654052734, -1.9640858173370361, -1.3379864692687988, -0.7118871212005615, -0.08578777313232422, 0.5403115749359131, 1.1664109230041504, 1.7925100326538086, 2.418609619140625, 3.0447089672088623, 3.6708083152770996, 4.296907424926758, 4.923007011413574, 5.549106597900391, 6.175205707550049, 6.801304817199707, 7.427406311035156, 8.053505897521973, 8.679605484008789, 9.305704116821289, 9.931803703308105, 10.557903289794922, 11.184001922607422, 11.810101509094238, 12.436201095581055, 13.062300682067871, 13.688400268554688, 14.314498901367188, 14.940598487854004, 15.56669807434082, 16.19279670715332, 16.818897247314453, 17.444995880126953, 18.071094512939453, 18.697195053100586, 19.323293685913086, 19.94939422607422, 20.57549285888672, 21.20159149169922, 21.82769012451172, 22.45379066467285, 23.07988929748535, 23.705989837646484, 24.332088470458984, 24.958187103271484, 25.584287643432617, 26.210386276245117, 26.83648681640625, 27.46258544921875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 11.0, 5.0, 14.0, 15.0, 23.0, 21.0, 36.0, 34.0, 51.0, 77.0, 111.0, 179.0, 331.0, 476.0, 933.0, 1743.0, 3626.0, 7828.0, 18582.0, 47421.0, 125364.0, 182082.0, 82217.0, 30337.0, 12185.0, 5318.0, 2431.0, 1193.0, 649.0, 350.0, 211.0, 131.0, 84.0, 53.0, 40.0, 36.0, 17.0, 18.0, 13.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.6865234375, -17.138671875, -16.5908203125, -16.04296875, -15.4951171875, -14.947265625, -14.3994140625, -13.8515625, -13.3037109375, -12.755859375, -12.2080078125, -11.66015625, -11.1123046875, -10.564453125, -10.0166015625, -9.46875, -8.9208984375, -8.373046875, -7.8251953125, -7.27734375, -6.7294921875, -6.181640625, -5.6337890625, -5.0859375, -4.5380859375, -3.990234375, -3.4423828125, -2.89453125, -2.3466796875, -1.798828125, -1.2509765625, -0.703125, -0.1552734375, 0.392578125, 0.9404296875, 1.48828125, 2.0361328125, 2.583984375, 3.1318359375, 3.6796875, 4.2275390625, 4.775390625, 5.3232421875, 5.87109375, 6.4189453125, 6.966796875, 7.5146484375, 8.0625, 8.6103515625, 9.158203125, 9.7060546875, 10.25390625, 10.8017578125, 11.349609375, 11.8974609375, 12.4453125, 12.9931640625, 13.541015625, 14.0888671875, 14.63671875, 15.1845703125, 15.732421875, 16.2802734375, 16.828125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 5.0, 3.0, 3.0, 5.0, 13.0, 9.0, 14.0, 15.0, 12.0, 20.0, 19.0, 32.0, 34.0, 45.0, 57.0, 67.0, 63.0, 59.0, 76.0, 57.0, 66.0, 49.0, 54.0, 41.0, 36.0, 33.0, 16.0, 22.0, 14.0, 16.0, 12.0, 10.0, 7.0, 5.0, 1.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.61669921875, -2.5263671875, -2.43603515625, -2.345703125, -2.25537109375, -2.1650390625, -2.07470703125, -1.984375, -1.89404296875, -1.8037109375, -1.71337890625, -1.623046875, -1.53271484375, -1.4423828125, -1.35205078125, -1.26171875, -1.17138671875, -1.0810546875, -0.99072265625, -0.900390625, -0.81005859375, -0.7197265625, -0.62939453125, -0.5390625, -0.44873046875, -0.3583984375, -0.26806640625, -0.177734375, -0.08740234375, 0.0029296875, 0.09326171875, 0.18359375, 0.27392578125, 0.3642578125, 0.45458984375, 0.544921875, 0.63525390625, 0.7255859375, 0.81591796875, 0.90625, 0.99658203125, 1.0869140625, 1.17724609375, 1.267578125, 1.35791015625, 1.4482421875, 1.53857421875, 1.62890625, 1.71923828125, 1.8095703125, 1.89990234375, 1.990234375, 2.08056640625, 2.1708984375, 2.26123046875, 2.3515625, 2.44189453125, 2.5322265625, 2.62255859375, 2.712890625, 2.80322265625, 2.8935546875, 2.98388671875, 3.07421875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 14.0, 21.0, 34.0, 87.0, 191.0, 106.0, 25.0, 9.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.65459632873535, -25.014572143554688, -23.374549865722656, -21.734527587890625, -20.09450340270996, -18.454479217529297, -16.814456939697266, -15.174433708190918, -13.53441047668457, -11.894387245178223, -10.254364013671875, -8.614340782165527, -6.97431755065918, -5.334294319152832, -3.6942710876464844, -2.0542478561401367, -0.41422462463378906, 1.2257986068725586, 2.8658218383789062, 4.505845069885254, 6.145868301391602, 7.785891532897949, 9.425914764404297, 11.065937995910645, 12.705961227416992, 14.34598445892334, 15.986007690429688, 17.62602996826172, 19.266054153442383, 20.906078338623047, 22.546100616455078, 24.18612289428711, 25.826148986816406, 27.466171264648438, 29.1061954498291, 30.746219635009766, 32.3862419128418, 34.02626419067383, 35.666290283203125, 37.306312561035156, 38.94633483886719, 40.58635711669922, 42.22637939453125, 43.86640548706055, 45.50642776489258, 47.14645004272461, 48.786476135253906, 50.42649841308594, 52.06652069091797, 53.70654296875, 55.34656524658203, 56.98659133911133, 58.62661361694336, 60.26663589477539, 61.90666198730469, 63.54668426513672, 65.18670654296875, 66.82672882080078, 68.46675109863281, 70.10677337646484, 71.74679565429688, 73.38682556152344, 75.02684783935547, 76.6668701171875, 78.30689239501953]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 4.0, 8.0, 1.0, 4.0, 7.0, 4.0, 6.0, 15.0, 34.0, 73.0, 104.0, 92.0, 59.0, 22.0, 7.0, 9.0, 7.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.888593673706055, -20.272724151611328, -19.6568546295166, -19.040985107421875, -18.42511558532715, -17.809246063232422, -17.193376541137695, -16.57750701904297, -15.961638450622559, -15.345768928527832, -14.729899406433105, -14.114029884338379, -13.498161315917969, -12.882291793823242, -12.266422271728516, -11.650552749633789, -11.034683227539062, -10.418813705444336, -9.80294418334961, -9.187074661254883, -8.571205139160156, -7.955336093902588, -7.3394670486450195, -6.723597526550293, -6.107728004455566, -5.49185848236084, -4.875988960266113, -4.260119915008545, -3.6442503929138184, -3.028380870819092, -2.4125115871429443, -1.7966423034667969, -1.1807708740234375, -0.5649014711380005, 0.05096793174743652, 0.6668373346328735, 1.2827067375183105, 1.898576259613037, 2.5144455432891846, 3.130314826965332, 3.7461843490600586, 4.362053871154785, 4.977923393249512, 5.59379243850708, 6.209661960601807, 6.825531482696533, 7.441400527954102, 8.057270050048828, 8.673139572143555, 9.289009094238281, 9.904878616333008, 10.520748138427734, 11.136617660522461, 11.752487182617188, 12.368355751037598, 12.984225273132324, 13.60009479522705, 14.215964317321777, 14.831833839416504, 15.44770336151123, 16.06357192993164, 16.679441452026367, 17.295310974121094, 17.91118049621582, 18.527050018310547]}, "eval/loss": 4.170833587646484, "eval/wer": 1.9509520031733438, "eval/runtime": 786.0537, "eval/samples_per_second": 3.361, "eval/steps_per_second": 0.281} \ No newline at end of file