diff --git "a/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" "b/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220322_102259-2z8qc0km/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 6.1228, "train/learning_rate": 2.929718309859155e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 8985, "_timestamp": 1647953564, "_step": 1500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 11.0, 8.0, 17.0, 11.0, 23.0, 20.0, 29.0, 38.0, 43.0, 47.0, 61.0, 47.0, 61.0, 56.0, 63.0, 61.0, 67.0, 63.0, 45.0, 41.0, 31.0, 27.0, 29.0, 24.0, 18.0, 8.0, 20.0, 13.0, 7.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.924598693847656, -54.596683502197266, -53.26877212524414, -51.94085693359375, -50.612945556640625, -49.285030364990234, -47.957115173339844, -46.62920379638672, -45.30128860473633, -43.97337341308594, -42.64546203613281, -41.31754684448242, -39.98963165283203, -38.661720275878906, -37.333805084228516, -36.005889892578125, -34.677978515625, -33.35006332397461, -32.022151947021484, -30.694236755371094, -29.366323471069336, -28.038410186767578, -26.710494995117188, -25.38258171081543, -24.054668426513672, -22.726755142211914, -21.398841857910156, -20.070926666259766, -18.743013381958008, -17.41510009765625, -16.08718490600586, -14.759271621704102, -13.431356430053711, -12.103443145751953, -10.775528907775879, -9.447614669799805, -8.119701385498047, -6.791787624359131, -5.463873863220215, -4.135959625244141, -2.808046340942383, -1.4801325798034668, -0.15221881866455078, 1.1756949424743652, 2.5036087036132812, 3.8315224647521973, 5.159436225891113, 6.4873504638671875, 7.815263748168945, 9.143177032470703, 10.471091270446777, 11.799005508422852, 13.12691879272461, 14.454832077026367, 15.782746315002441, 17.110660552978516, 18.438573837280273, 19.76648712158203, 21.094402313232422, 22.42231559753418, 23.750228881835938, 25.078142166137695, 26.406055450439453, 27.733970642089844, 29.0618839263916]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 6.0, 6.0, 12.0, 15.0, 16.0, 19.0, 20.0, 23.0, 31.0, 32.0, 28.0, 39.0, 42.0, 44.0, 30.0, 33.0, 38.0, 46.0, 41.0, 37.0, 49.0, 40.0, 38.0, 38.0, 42.0, 35.0, 34.0, 24.0, 28.0, 21.0, 12.0, 15.0, 14.0, 7.0, 9.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-40.80854034423828, -39.671661376953125, -38.53478240966797, -37.39790344238281, -36.261024475097656, -35.124141693115234, -33.98726272583008, -32.85038375854492, -31.713504791259766, -30.57662582397461, -29.439746856689453, -28.302865982055664, -27.165987014770508, -26.02910804748535, -24.892227172851562, -23.755348205566406, -22.61846923828125, -21.481590270996094, -20.344711303710938, -19.20783042907715, -18.070951461791992, -16.934072494506836, -15.797192573547363, -14.66031265258789, -13.523433685302734, -12.386554718017578, -11.249674797058105, -10.112794876098633, -8.975915908813477, -7.839036464691162, -6.702157020568848, -5.565277576446533, -4.428398132324219, -3.2915186882019043, -2.15463924407959, -1.0177597999572754, 0.11911964416503906, 1.2559990882873535, 2.392878532409668, 3.5297579765319824, 4.666637420654297, 5.803516864776611, 6.940396308898926, 8.077276229858398, 9.214155197143555, 10.351034164428711, 11.487914085388184, 12.624794006347656, 13.761672973632812, 14.898551940917969, 16.035430908203125, 17.172311782836914, 18.30919075012207, 19.446069717407227, 20.582950592041016, 21.719829559326172, 22.856708526611328, 23.993587493896484, 25.13046646118164, 26.26734733581543, 27.404226303100586, 28.541105270385742, 29.67798614501953, 30.814865112304688, 31.951744079589844]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 10.0, 14.0, 36.0, 50.0, 75.0, 98.0, 136.0, 212.0, 338.0, 498.0, 832.0, 1412.0, 2197.0, 3662.0, 6250.0, 10088.0, 17158.0, 30487.0, 54913.0, 105647.0, 220207.0, 469880.0, 831520.0, 986405.0, 718372.0, 367295.0, 172472.0, 86219.0, 45521.0, 25568.0, 14644.0, 8709.0, 5129.0, 3058.0, 1909.0, 1146.0, 799.0, 489.0, 280.0, 197.0, 134.0, 77.0, 49.0, 27.0, 17.0, 18.0, 11.0, 3.0, 6.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-28.984375, -28.114990234375, -27.24560546875, -26.376220703125, -25.5068359375, -24.637451171875, -23.76806640625, -22.898681640625, -22.029296875, -21.159912109375, -20.29052734375, -19.421142578125, -18.5517578125, -17.682373046875, -16.81298828125, -15.943603515625, -15.07421875, -14.204833984375, -13.33544921875, -12.466064453125, -11.5966796875, -10.727294921875, -9.85791015625, -8.988525390625, -8.119140625, -7.249755859375, -6.38037109375, -5.510986328125, -4.6416015625, -3.772216796875, -2.90283203125, -2.033447265625, -1.1640625, -0.294677734375, 0.57470703125, 1.444091796875, 2.3134765625, 3.182861328125, 4.05224609375, 4.921630859375, 5.791015625, 6.660400390625, 7.52978515625, 8.399169921875, 9.2685546875, 10.137939453125, 11.00732421875, 11.876708984375, 12.74609375, 13.615478515625, 14.48486328125, 15.354248046875, 16.2236328125, 17.093017578125, 17.96240234375, 18.831787109375, 19.701171875, 20.570556640625, 21.43994140625, 22.309326171875, 23.1787109375, 24.048095703125, 24.91748046875, 25.786865234375, 26.65625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 5.0, 6.0, 2.0, 11.0, 15.0, 17.0, 22.0, 20.0, 25.0, 32.0, 32.0, 41.0, 38.0, 41.0, 34.0, 40.0, 47.0, 40.0, 39.0, 47.0, 43.0, 45.0, 36.0, 34.0, 38.0, 37.0, 31.0, 24.0, 28.0, 22.0, 18.0, 20.0, 14.0, 14.0, 9.0, 5.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.75, -25.0087890625, -24.267578125, -23.5263671875, -22.78515625, -22.0439453125, -21.302734375, -20.5615234375, -19.8203125, -19.0791015625, -18.337890625, -17.5966796875, -16.85546875, -16.1142578125, -15.373046875, -14.6318359375, -13.890625, -13.1494140625, -12.408203125, -11.6669921875, -10.92578125, -10.1845703125, -9.443359375, -8.7021484375, -7.9609375, -7.2197265625, -6.478515625, -5.7373046875, -4.99609375, -4.2548828125, -3.513671875, -2.7724609375, -2.03125, -1.2900390625, -0.548828125, 0.1923828125, 0.93359375, 1.6748046875, 2.416015625, 3.1572265625, 3.8984375, 4.6396484375, 5.380859375, 6.1220703125, 6.86328125, 7.6044921875, 8.345703125, 9.0869140625, 9.828125, 10.5693359375, 11.310546875, 12.0517578125, 12.79296875, 13.5341796875, 14.275390625, 15.0166015625, 15.7578125, 16.4990234375, 17.240234375, 17.9814453125, 18.72265625, 19.4638671875, 20.205078125, 20.9462890625, 21.6875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 7.0, 7.0, 23.0, 28.0, 39.0, 56.0, 93.0, 147.0, 253.0, 383.0, 538.0, 923.0, 1470.0, 2305.0, 3752.0, 5761.0, 9023.0, 14238.0, 22257.0, 35709.0, 55865.0, 87714.0, 137501.0, 211912.0, 326674.0, 492127.0, 677517.0, 682456.0, 496331.0, 330173.0, 215649.0, 139021.0, 88782.0, 56821.0, 36055.0, 22937.0, 14512.0, 9315.0, 5865.0, 3686.0, 2352.0, 1499.0, 916.0, 630.0, 334.0, 254.0, 134.0, 103.0, 49.0, 41.0, 23.0, 13.0, 6.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.303466796875, -18.63818359375, -17.972900390625, -17.3076171875, -16.642333984375, -15.97705078125, -15.311767578125, -14.646484375, -13.981201171875, -13.31591796875, -12.650634765625, -11.9853515625, -11.320068359375, -10.65478515625, -9.989501953125, -9.32421875, -8.658935546875, -7.99365234375, -7.328369140625, -6.6630859375, -5.997802734375, -5.33251953125, -4.667236328125, -4.001953125, -3.336669921875, -2.67138671875, -2.006103515625, -1.3408203125, -0.675537109375, -0.01025390625, 0.655029296875, 1.3203125, 1.985595703125, 2.65087890625, 3.316162109375, 3.9814453125, 4.646728515625, 5.31201171875, 5.977294921875, 6.642578125, 7.307861328125, 7.97314453125, 8.638427734375, 9.3037109375, 9.968994140625, 10.63427734375, 11.299560546875, 11.96484375, 12.630126953125, 13.29541015625, 13.960693359375, 14.6259765625, 15.291259765625, 15.95654296875, 16.621826171875, 17.287109375, 17.952392578125, 18.61767578125, 19.282958984375, 19.9482421875, 20.613525390625, 21.27880859375, 21.944091796875, 22.609375]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 5.0, 4.0, 7.0, 18.0, 14.0, 13.0, 14.0, 26.0, 37.0, 32.0, 35.0, 52.0, 55.0, 88.0, 101.0, 113.0, 139.0, 142.0, 202.0, 245.0, 235.0, 282.0, 322.0, 295.0, 265.0, 240.0, 220.0, 191.0, 126.0, 110.0, 98.0, 86.0, 52.0, 47.0, 35.0, 30.0, 16.0, 23.0, 7.0, 13.0, 13.0, 9.0, 6.0, 3.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9642333984375, -10.639404296875, -10.3145751953125, -9.98974609375, -9.6649169921875, -9.340087890625, -9.0152587890625, -8.6904296875, -8.3656005859375, -8.040771484375, -7.7159423828125, -7.39111328125, -7.0662841796875, -6.741455078125, -6.4166259765625, -6.091796875, -5.7669677734375, -5.442138671875, -5.1173095703125, -4.79248046875, -4.4676513671875, -4.142822265625, -3.8179931640625, -3.4931640625, -3.1683349609375, -2.843505859375, -2.5186767578125, -2.19384765625, -1.8690185546875, -1.544189453125, -1.2193603515625, -0.89453125, -0.5697021484375, -0.244873046875, 0.0799560546875, 0.40478515625, 0.7296142578125, 1.054443359375, 1.3792724609375, 1.7041015625, 2.0289306640625, 2.353759765625, 2.6785888671875, 3.00341796875, 3.3282470703125, 3.653076171875, 3.9779052734375, 4.302734375, 4.6275634765625, 4.952392578125, 5.2772216796875, 5.60205078125, 5.9268798828125, 6.251708984375, 6.5765380859375, 6.9013671875, 7.2261962890625, 7.551025390625, 7.8758544921875, 8.20068359375, 8.5255126953125, 8.850341796875, 9.1751708984375, 9.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 8.0, 13.0, 20.0, 36.0, 39.0, 28.0, 35.0, 50.0, 53.0, 51.0, 53.0, 64.0, 55.0, 64.0, 64.0, 46.0, 43.0, 48.0, 37.0, 31.0, 34.0, 28.0, 28.0, 17.0, 10.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-36.20097351074219, -35.283504486083984, -34.366031646728516, -33.44856262207031, -32.53109359741211, -31.613622665405273, -30.696151733398438, -29.778682708740234, -28.86121368408203, -27.943742752075195, -27.026273727416992, -26.108802795410156, -25.191333770751953, -24.273862838745117, -23.35639190673828, -22.438922882080078, -21.521451950073242, -20.603981018066406, -19.686511993408203, -18.769041061401367, -17.851572036743164, -16.934101104736328, -16.016632080078125, -15.099161148071289, -14.18169116973877, -13.26422119140625, -12.34675121307373, -11.429281234741211, -10.511810302734375, -9.594341278076172, -8.676870346069336, -7.759400367736816, -6.841930389404297, -5.924460411071777, -5.006990432739258, -4.08951997756958, -3.1720499992370605, -2.254580020904541, -1.3371095657348633, -0.41963958740234375, 0.4978303909301758, 1.4153004884719849, 2.332770586013794, 3.2502408027648926, 4.167710781097412, 5.085180759429932, 6.002651214599609, 6.920121192932129, 7.837591171264648, 8.755061149597168, 9.672531127929688, 10.590002059936523, 11.507471084594727, 12.424942016601562, 13.342411994934082, 14.259881973266602, 15.177351951599121, 16.09482192993164, 17.012292861938477, 17.92976188659668, 18.847232818603516, 19.76470184326172, 20.682172775268555, 21.59964370727539, 22.517112731933594]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 10.0, 5.0, 7.0, 11.0, 11.0, 17.0, 14.0, 21.0, 18.0, 17.0, 30.0, 36.0, 39.0, 36.0, 25.0, 30.0, 37.0, 46.0, 45.0, 41.0, 45.0, 36.0, 38.0, 36.0, 37.0, 39.0, 34.0, 34.0, 17.0, 35.0, 24.0, 16.0, 20.0, 20.0, 8.0, 11.0, 8.0, 11.0, 11.0, 7.0, 2.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.624351501464844, -22.911901473999023, -22.199453353881836, -21.487003326416016, -20.774553298950195, -20.062103271484375, -19.349655151367188, -18.637205123901367, -17.924755096435547, -17.212305068969727, -16.49985694885254, -15.787406921386719, -15.074956893920898, -14.362507820129395, -13.65005874633789, -12.93760871887207, -12.225160598754883, -11.512711524963379, -10.800261497497559, -10.087812423706055, -9.375362396240234, -8.66291332244873, -7.950464248657227, -7.2380146980285645, -6.525565147399902, -5.81311559677124, -5.100666046142578, -4.388216972351074, -3.675767421722412, -2.96331787109375, -2.250868797302246, -1.538419246673584, -0.8259716033935547, -0.11352217197418213, 0.5989272594451904, 1.3113765716552734, 2.0238261222839355, 2.7362756729125977, 3.4487247467041016, 4.161174297332764, 4.873623847961426, 5.586073398590088, 6.29852294921875, 7.010972023010254, 7.723421573638916, 8.435871124267578, 9.148320198059082, 9.860769271850586, 10.573219299316406, 11.28566837310791, 11.99811840057373, 12.710567474365234, 13.423017501831055, 14.135466575622559, 14.847915649414062, 15.560365676879883, 16.272815704345703, 16.985265731811523, 17.69771385192871, 18.41016387939453, 19.12261390686035, 19.835063934326172, 20.54751205444336, 21.25996208190918, 21.972410202026367]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 8.0, 8.0, 12.0, 30.0, 37.0, 36.0, 79.0, 101.0, 148.0, 194.0, 284.0, 418.0, 610.0, 956.0, 1338.0, 2028.0, 2989.0, 4531.0, 6721.0, 10561.0, 16893.0, 27558.0, 47399.0, 85140.0, 158483.0, 256441.0, 187023.0, 99180.0, 54548.0, 31319.0, 19093.0, 11834.0, 7561.0, 4939.0, 3296.0, 2128.0, 1458.0, 983.0, 678.0, 464.0, 320.0, 229.0, 158.0, 93.0, 81.0, 59.0, 30.0, 23.0, 26.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0], "bins": [-9.5625, -9.2694091796875, -8.976318359375, -8.6832275390625, -8.39013671875, -8.0970458984375, -7.803955078125, -7.5108642578125, -7.2177734375, -6.9246826171875, -6.631591796875, -6.3385009765625, -6.04541015625, -5.7523193359375, -5.459228515625, -5.1661376953125, -4.873046875, -4.5799560546875, -4.286865234375, -3.9937744140625, -3.70068359375, -3.4075927734375, -3.114501953125, -2.8214111328125, -2.5283203125, -2.2352294921875, -1.942138671875, -1.6490478515625, -1.35595703125, -1.0628662109375, -0.769775390625, -0.4766845703125, -0.18359375, 0.1094970703125, 0.402587890625, 0.6956787109375, 0.98876953125, 1.2818603515625, 1.574951171875, 1.8680419921875, 2.1611328125, 2.4542236328125, 2.747314453125, 3.0404052734375, 3.33349609375, 3.6265869140625, 3.919677734375, 4.2127685546875, 4.505859375, 4.7989501953125, 5.092041015625, 5.3851318359375, 5.67822265625, 5.9713134765625, 6.264404296875, 6.5574951171875, 6.8505859375, 7.1436767578125, 7.436767578125, 7.7298583984375, 8.02294921875, 8.3160400390625, 8.609130859375, 8.9022216796875, 9.1953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 6.0, 5.0, 2.0, 5.0, 7.0, 5.0, 21.0, 19.0, 18.0, 20.0, 18.0, 24.0, 30.0, 29.0, 23.0, 31.0, 29.0, 43.0, 46.0, 42.0, 35.0, 34.0, 44.0, 38.0, 40.0, 33.0, 36.0, 31.0, 31.0, 23.0, 34.0, 28.0, 27.0, 15.0, 18.0, 18.0, 15.0, 14.0, 11.0, 10.0, 9.0, 12.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.5, -19.838623046875, -19.17724609375, -18.515869140625, -17.8544921875, -17.193115234375, -16.53173828125, -15.870361328125, -15.208984375, -14.547607421875, -13.88623046875, -13.224853515625, -12.5634765625, -11.902099609375, -11.24072265625, -10.579345703125, -9.91796875, -9.256591796875, -8.59521484375, -7.933837890625, -7.2724609375, -6.611083984375, -5.94970703125, -5.288330078125, -4.626953125, -3.965576171875, -3.30419921875, -2.642822265625, -1.9814453125, -1.320068359375, -0.65869140625, 0.002685546875, 0.6640625, 1.325439453125, 1.98681640625, 2.648193359375, 3.3095703125, 3.970947265625, 4.63232421875, 5.293701171875, 5.955078125, 6.616455078125, 7.27783203125, 7.939208984375, 8.6005859375, 9.261962890625, 9.92333984375, 10.584716796875, 11.24609375, 11.907470703125, 12.56884765625, 13.230224609375, 13.8916015625, 14.552978515625, 15.21435546875, 15.875732421875, 16.537109375, 17.198486328125, 17.85986328125, 18.521240234375, 19.1826171875, 19.843994140625, 20.50537109375, 21.166748046875, 21.828125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 8.0, 4.0, 7.0, 13.0, 7.0, 7.0, 5.0, 22.0, 21.0, 37.0, 44.0, 44.0, 72.0, 98.0, 122.0, 173.0, 234.0, 380.0, 539.0, 894.0, 1559.0, 2941.0, 6631.0, 21651.0, 926357.0, 63079.0, 12931.0, 4804.0, 2267.0, 1250.0, 752.0, 465.0, 317.0, 210.0, 143.0, 119.0, 76.0, 67.0, 58.0, 36.0, 29.0, 18.0, 18.0, 13.0, 10.0, 7.0, 3.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-34.59375, -33.470703125, -32.34765625, -31.224609375, -30.1015625, -28.978515625, -27.85546875, -26.732421875, -25.609375, -24.486328125, -23.36328125, -22.240234375, -21.1171875, -19.994140625, -18.87109375, -17.748046875, -16.625, -15.501953125, -14.37890625, -13.255859375, -12.1328125, -11.009765625, -9.88671875, -8.763671875, -7.640625, -6.517578125, -5.39453125, -4.271484375, -3.1484375, -2.025390625, -0.90234375, 0.220703125, 1.34375, 2.466796875, 3.58984375, 4.712890625, 5.8359375, 6.958984375, 8.08203125, 9.205078125, 10.328125, 11.451171875, 12.57421875, 13.697265625, 14.8203125, 15.943359375, 17.06640625, 18.189453125, 19.3125, 20.435546875, 21.55859375, 22.681640625, 23.8046875, 24.927734375, 26.05078125, 27.173828125, 28.296875, 29.419921875, 30.54296875, 31.666015625, 32.7890625, 33.912109375, 35.03515625, 36.158203125, 37.28125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 10.0, 3.0, 6.0, 11.0, 13.0, 11.0, 22.0, 21.0, 28.0, 17.0, 23.0, 20.0, 33.0, 33.0, 38.0, 33.0, 40.0, 33.0, 29.0, 42.0, 39.0, 34.0, 35.0, 38.0, 57.0, 37.0, 30.0, 26.0, 38.0, 19.0, 21.0, 19.0, 15.0, 18.0, 17.0, 22.0, 11.0, 7.0, 12.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.6328125, -14.1463623046875, -13.659912109375, -13.1734619140625, -12.68701171875, -12.2005615234375, -11.714111328125, -11.2276611328125, -10.7412109375, -10.2547607421875, -9.768310546875, -9.2818603515625, -8.79541015625, -8.3089599609375, -7.822509765625, -7.3360595703125, -6.849609375, -6.3631591796875, -5.876708984375, -5.3902587890625, -4.90380859375, -4.4173583984375, -3.930908203125, -3.4444580078125, -2.9580078125, -2.4715576171875, -1.985107421875, -1.4986572265625, -1.01220703125, -0.5257568359375, -0.039306640625, 0.4471435546875, 0.93359375, 1.4200439453125, 1.906494140625, 2.3929443359375, 2.87939453125, 3.3658447265625, 3.852294921875, 4.3387451171875, 4.8251953125, 5.3116455078125, 5.798095703125, 6.2845458984375, 6.77099609375, 7.2574462890625, 7.743896484375, 8.2303466796875, 8.716796875, 9.2032470703125, 9.689697265625, 10.1761474609375, 10.66259765625, 11.1490478515625, 11.635498046875, 12.1219482421875, 12.6083984375, 13.0948486328125, 13.581298828125, 14.0677490234375, 14.55419921875, 15.0406494140625, 15.527099609375, 16.0135498046875, 16.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 7.0, 6.0, 4.0, 7.0, 9.0, 10.0, 12.0, 18.0, 22.0, 17.0, 36.0, 30.0, 62.0, 86.0, 95.0, 102.0, 144.0, 207.0, 307.0, 418.0, 625.0, 1058.0, 1909.0, 3732.0, 8261.0, 23395.0, 909264.0, 68168.0, 16662.0, 6441.0, 2952.0, 1641.0, 854.0, 513.0, 372.0, 253.0, 206.0, 131.0, 135.0, 82.0, 69.0, 55.0, 45.0, 33.0, 27.0, 17.0, 18.0, 14.0, 6.0, 6.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.595703125, -3.475250244140625, -3.35479736328125, -3.234344482421875, -3.1138916015625, -2.993438720703125, -2.87298583984375, -2.752532958984375, -2.632080078125, -2.511627197265625, -2.39117431640625, -2.270721435546875, -2.1502685546875, -2.029815673828125, -1.90936279296875, -1.788909912109375, -1.66845703125, -1.548004150390625, -1.42755126953125, -1.307098388671875, -1.1866455078125, -1.066192626953125, -0.94573974609375, -0.825286865234375, -0.704833984375, -0.584381103515625, -0.46392822265625, -0.343475341796875, -0.2230224609375, -0.102569580078125, 0.01788330078125, 0.138336181640625, 0.2587890625, 0.379241943359375, 0.49969482421875, 0.620147705078125, 0.7406005859375, 0.861053466796875, 0.98150634765625, 1.101959228515625, 1.222412109375, 1.342864990234375, 1.46331787109375, 1.583770751953125, 1.7042236328125, 1.824676513671875, 1.94512939453125, 2.065582275390625, 2.18603515625, 2.306488037109375, 2.42694091796875, 2.547393798828125, 2.6678466796875, 2.788299560546875, 2.90875244140625, 3.029205322265625, 3.149658203125, 3.270111083984375, 3.39056396484375, 3.511016845703125, 3.6314697265625, 3.751922607421875, 3.87237548828125, 3.992828369140625, 4.11328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 13.0, 13.0, 13.0, 11.0, 20.0, 38.0, 34.0, 64.0, 69.0, 90.0, 105.0, 95.0, 103.0, 69.0, 65.0, 49.0, 33.0, 27.0, 12.0, 10.0, 11.0, 4.0, 10.0, 1.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50422477722168e-05, -7.261987775564194e-05, -7.019750773906708e-05, -6.777513772249222e-05, -6.535276770591736e-05, -6.29303976893425e-05, -6.050802767276764e-05, -5.808565765619278e-05, -5.566328763961792e-05, -5.324091762304306e-05, -5.08185476064682e-05, -4.839617758989334e-05, -4.597380757331848e-05, -4.355143755674362e-05, -4.112906754016876e-05, -3.87066975235939e-05, -3.628432750701904e-05, -3.386195749044418e-05, -3.1439587473869324e-05, -2.9017217457294464e-05, -2.6594847440719604e-05, -2.4172477424144745e-05, -2.1750107407569885e-05, -1.9327737390995026e-05, -1.6905367374420166e-05, -1.4482997357845306e-05, -1.2060627341270447e-05, -9.638257324695587e-06, -7.2158873081207275e-06, -4.793517291545868e-06, -2.3711472749710083e-06, 5.122274160385132e-08, 2.473592758178711e-06, 4.8959627747535706e-06, 7.31833279132843e-06, 9.74070280790329e-06, 1.216307282447815e-05, 1.4585442841053009e-05, 1.700781285762787e-05, 1.9430182874202728e-05, 2.1852552890777588e-05, 2.4274922907352448e-05, 2.6697292923927307e-05, 2.9119662940502167e-05, 3.1542032957077026e-05, 3.3964402973651886e-05, 3.6386772990226746e-05, 3.8809143006801605e-05, 4.1231513023376465e-05, 4.3653883039951324e-05, 4.6076253056526184e-05, 4.8498623073101044e-05, 5.09209930896759e-05, 5.334336310625076e-05, 5.576573312282562e-05, 5.818810313940048e-05, 6.061047315597534e-05, 6.30328431725502e-05, 6.545521318912506e-05, 6.787758320569992e-05, 7.029995322227478e-05, 7.272232323884964e-05, 7.51446932554245e-05, 7.756706327199936e-05, 7.998943328857422e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 20.0, 16.0, 24.0, 29.0, 53.0, 85.0, 124.0, 159.0, 286.0, 398.0, 627.0, 930.0, 1470.0, 2428.0, 3819.0, 6291.0, 10784.0, 18099.0, 30478.0, 51743.0, 90466.0, 159165.0, 247139.0, 179415.0, 101323.0, 58183.0, 34172.0, 20071.0, 11947.0, 7200.0, 4382.0, 2647.0, 1642.0, 980.0, 645.0, 427.0, 272.0, 219.0, 116.0, 98.0, 55.0, 36.0, 27.0, 15.0, 18.0, 10.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9755859375, -0.9447174072265625, -0.913848876953125, -0.8829803466796875, -0.85211181640625, -0.8212432861328125, -0.790374755859375, -0.7595062255859375, -0.7286376953125, -0.6977691650390625, -0.666900634765625, -0.6360321044921875, -0.60516357421875, -0.5742950439453125, -0.543426513671875, -0.5125579833984375, -0.481689453125, -0.4508209228515625, -0.419952392578125, -0.3890838623046875, -0.35821533203125, -0.3273468017578125, -0.296478271484375, -0.2656097412109375, -0.2347412109375, -0.2038726806640625, -0.173004150390625, -0.1421356201171875, -0.11126708984375, -0.0803985595703125, -0.049530029296875, -0.0186614990234375, 0.01220703125, 0.0430755615234375, 0.073944091796875, 0.1048126220703125, 0.13568115234375, 0.1665496826171875, 0.197418212890625, 0.2282867431640625, 0.2591552734375, 0.2900238037109375, 0.320892333984375, 0.3517608642578125, 0.38262939453125, 0.4134979248046875, 0.444366455078125, 0.4752349853515625, 0.506103515625, 0.5369720458984375, 0.567840576171875, 0.5987091064453125, 0.62957763671875, 0.6604461669921875, 0.691314697265625, 0.7221832275390625, 0.7530517578125, 0.7839202880859375, 0.814788818359375, 0.8456573486328125, 0.87652587890625, 0.9073944091796875, 0.938262939453125, 0.9691314697265625, 1.0]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 5.0, 2.0, 4.0, 6.0, 7.0, 11.0, 13.0, 20.0, 30.0, 21.0, 32.0, 26.0, 45.0, 52.0, 61.0, 65.0, 65.0, 71.0, 74.0, 63.0, 55.0, 53.0, 47.0, 29.0, 34.0, 22.0, 16.0, 10.0, 15.0, 9.0, 9.0, 5.0, 6.0, 6.0, 1.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52734375, -0.5114707946777344, -0.49559783935546875, -0.4797248840332031, -0.4638519287109375, -0.4479789733886719, -0.43210601806640625, -0.4162330627441406, -0.400360107421875, -0.3844871520996094, -0.36861419677734375, -0.3527412414550781, -0.3368682861328125, -0.3209953308105469, -0.30512237548828125, -0.2892494201660156, -0.27337646484375, -0.2575035095214844, -0.24163055419921875, -0.22575759887695312, -0.2098846435546875, -0.19401168823242188, -0.17813873291015625, -0.16226577758789062, -0.146392822265625, -0.13051986694335938, -0.11464691162109375, -0.09877395629882812, -0.0829010009765625, -0.06702804565429688, -0.05115509033203125, -0.035282135009765625, -0.0194091796875, -0.003536224365234375, 0.01233673095703125, 0.028209686279296875, 0.0440826416015625, 0.059955596923828125, 0.07582855224609375, 0.09170150756835938, 0.107574462890625, 0.12344741821289062, 0.13932037353515625, 0.15519332885742188, 0.1710662841796875, 0.18693923950195312, 0.20281219482421875, 0.21868515014648438, 0.23455810546875, 0.2504310607910156, 0.26630401611328125, 0.2821769714355469, 0.2980499267578125, 0.3139228820800781, 0.32979583740234375, 0.3456687927246094, 0.361541748046875, 0.3774147033691406, 0.39328765869140625, 0.4091606140136719, 0.4250335693359375, 0.4409065246582031, 0.45677947998046875, 0.4726524353027344, 0.488525390625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 12.0, 8.0, 9.0, 12.0, 20.0, 21.0, 35.0, 35.0, 34.0, 37.0, 56.0, 58.0, 48.0, 45.0, 67.0, 66.0, 52.0, 54.0, 54.0, 51.0, 42.0, 31.0, 37.0, 29.0, 32.0, 15.0, 12.0, 9.0, 8.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-33.52090835571289, -32.65898513793945, -31.79706382751465, -30.935142517089844, -30.073219299316406, -29.2112979888916, -28.349376678466797, -27.48745346069336, -26.625530242919922, -25.763608932495117, -24.90168571472168, -24.039764404296875, -23.177841186523438, -22.315919876098633, -21.453998565673828, -20.59207534790039, -19.730154037475586, -18.86823272705078, -18.006309509277344, -17.14438819885254, -16.2824649810791, -15.420543670654297, -14.558621406555176, -13.696699142456055, -12.834776878356934, -11.972854614257812, -11.110932350158691, -10.24901008605957, -9.387088775634766, -8.525165557861328, -7.663244247436523, -6.801321983337402, -5.939401626586914, -5.077479362487793, -4.215557098388672, -3.353635311126709, -2.491713047027588, -1.6297907829284668, -0.7678689956665039, 0.09405326843261719, 0.9559755325317383, 1.8178976774215698, 2.6798198223114014, 3.5417418479919434, 4.4036641120910645, 5.2655863761901855, 6.127508163452148, 6.9894304275512695, 7.851352691650391, 8.713274955749512, 9.575197219848633, 10.437118530273438, 11.299041748046875, 12.16096305847168, 13.0228853225708, 13.884807586669922, 14.746729850769043, 15.608652114868164, 16.47057342529297, 17.332496643066406, 18.19441795349121, 19.05634117126465, 19.918262481689453, 20.78018569946289, 21.642107009887695]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 6.0, 6.0, 7.0, 13.0, 8.0, 17.0, 17.0, 19.0, 18.0, 20.0, 29.0, 36.0, 37.0, 31.0, 31.0, 26.0, 42.0, 40.0, 47.0, 48.0, 39.0, 29.0, 35.0, 43.0, 37.0, 37.0, 37.0, 27.0, 24.0, 25.0, 34.0, 15.0, 17.0, 21.0, 8.0, 10.0, 14.0, 8.0, 10.0, 8.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.819080352783203, -21.159732818603516, -20.500385284423828, -19.841035842895508, -19.18168830871582, -18.522340774536133, -17.862991333007812, -17.203643798828125, -16.544296264648438, -15.88494873046875, -15.225600242614746, -14.566251754760742, -13.906904220581055, -13.247556686401367, -12.588208198547363, -11.92885971069336, -11.269512176513672, -10.610164642333984, -9.95081615447998, -9.291467666625977, -8.632120132446289, -7.972772121429443, -7.313424110412598, -6.654076099395752, -5.994728088378906, -5.3353800773620605, -4.676032066345215, -4.016684055328369, -3.3573360443115234, -2.6979880332946777, -2.038640022277832, -1.3792920112609863, -0.7199459075927734, -0.060597896575927734, 0.598750114440918, 1.2580981254577637, 1.9174461364746094, 2.576794147491455, 3.236142158508301, 3.8954901695251465, 4.554838180541992, 5.214186191558838, 5.873534202575684, 6.532882213592529, 7.192230224609375, 7.851578235626221, 8.510926246643066, 9.17027473449707, 9.829622268676758, 10.488969802856445, 11.14831829071045, 11.807666778564453, 12.46701431274414, 13.126361846923828, 13.785710334777832, 14.445058822631836, 15.104406356811523, 15.763753890991211, 16.42310333251953, 17.08245086669922, 17.741798400878906, 18.401145935058594, 19.06049346923828, 19.7198429107666, 20.37919044494629]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 11.0, 18.0, 17.0, 33.0, 42.0, 56.0, 96.0, 183.0, 233.0, 442.0, 656.0, 1054.0, 1745.0, 2908.0, 5129.0, 8847.0, 15569.0, 27083.0, 47452.0, 80762.0, 124252.0, 164374.0, 173852.0, 146020.0, 100524.0, 61847.0, 35958.0, 20677.0, 11976.0, 6795.0, 3912.0, 2331.0, 1457.0, 853.0, 507.0, 322.0, 198.0, 144.0, 81.0, 53.0, 25.0, 22.0, 15.0, 9.0, 4.0, 9.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.9375, -22.17919921875, -21.4208984375, -20.66259765625, -19.904296875, -19.14599609375, -18.3876953125, -17.62939453125, -16.87109375, -16.11279296875, -15.3544921875, -14.59619140625, -13.837890625, -13.07958984375, -12.3212890625, -11.56298828125, -10.8046875, -10.04638671875, -9.2880859375, -8.52978515625, -7.771484375, -7.01318359375, -6.2548828125, -5.49658203125, -4.73828125, -3.97998046875, -3.2216796875, -2.46337890625, -1.705078125, -0.94677734375, -0.1884765625, 0.56982421875, 1.328125, 2.08642578125, 2.8447265625, 3.60302734375, 4.361328125, 5.11962890625, 5.8779296875, 6.63623046875, 7.39453125, 8.15283203125, 8.9111328125, 9.66943359375, 10.427734375, 11.18603515625, 11.9443359375, 12.70263671875, 13.4609375, 14.21923828125, 14.9775390625, 15.73583984375, 16.494140625, 17.25244140625, 18.0107421875, 18.76904296875, 19.52734375, 20.28564453125, 21.0439453125, 21.80224609375, 22.560546875, 23.31884765625, 24.0771484375, 24.83544921875, 25.59375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 5.0, 9.0, 7.0, 8.0, 16.0, 15.0, 18.0, 17.0, 30.0, 27.0, 21.0, 27.0, 39.0, 39.0, 39.0, 45.0, 46.0, 47.0, 45.0, 48.0, 37.0, 38.0, 45.0, 31.0, 37.0, 40.0, 24.0, 23.0, 26.0, 26.0, 20.0, 20.0, 15.0, 11.0, 11.0, 10.0, 8.0, 7.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.5625, -21.915283203125, -21.26806640625, -20.620849609375, -19.9736328125, -19.326416015625, -18.67919921875, -18.031982421875, -17.384765625, -16.737548828125, -16.09033203125, -15.443115234375, -14.7958984375, -14.148681640625, -13.50146484375, -12.854248046875, -12.20703125, -11.559814453125, -10.91259765625, -10.265380859375, -9.6181640625, -8.970947265625, -8.32373046875, -7.676513671875, -7.029296875, -6.382080078125, -5.73486328125, -5.087646484375, -4.4404296875, -3.793212890625, -3.14599609375, -2.498779296875, -1.8515625, -1.204345703125, -0.55712890625, 0.090087890625, 0.7373046875, 1.384521484375, 2.03173828125, 2.678955078125, 3.326171875, 3.973388671875, 4.62060546875, 5.267822265625, 5.9150390625, 6.562255859375, 7.20947265625, 7.856689453125, 8.50390625, 9.151123046875, 9.79833984375, 10.445556640625, 11.0927734375, 11.739990234375, 12.38720703125, 13.034423828125, 13.681640625, 14.328857421875, 14.97607421875, 15.623291015625, 16.2705078125, 16.917724609375, 17.56494140625, 18.212158203125, 18.859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 5.0, 7.0, 18.0, 14.0, 39.0, 50.0, 83.0, 116.0, 171.0, 289.0, 405.0, 592.0, 911.0, 1527.0, 2318.0, 3669.0, 5486.0, 8477.0, 13042.0, 20222.0, 30079.0, 45188.0, 64279.0, 86358.0, 108644.0, 124086.0, 124761.0, 111484.0, 89380.0, 67036.0, 47238.0, 32059.0, 21350.0, 13841.0, 8918.0, 5806.0, 3758.0, 2374.0, 1618.0, 967.0, 632.0, 438.0, 260.0, 202.0, 121.0, 87.0, 56.0, 31.0, 26.0, 14.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-19.578125, -18.967529296875, -18.35693359375, -17.746337890625, -17.1357421875, -16.525146484375, -15.91455078125, -15.303955078125, -14.693359375, -14.082763671875, -13.47216796875, -12.861572265625, -12.2509765625, -11.640380859375, -11.02978515625, -10.419189453125, -9.80859375, -9.197998046875, -8.58740234375, -7.976806640625, -7.3662109375, -6.755615234375, -6.14501953125, -5.534423828125, -4.923828125, -4.313232421875, -3.70263671875, -3.092041015625, -2.4814453125, -1.870849609375, -1.26025390625, -0.649658203125, -0.0390625, 0.571533203125, 1.18212890625, 1.792724609375, 2.4033203125, 3.013916015625, 3.62451171875, 4.235107421875, 4.845703125, 5.456298828125, 6.06689453125, 6.677490234375, 7.2880859375, 7.898681640625, 8.50927734375, 9.119873046875, 9.73046875, 10.341064453125, 10.95166015625, 11.562255859375, 12.1728515625, 12.783447265625, 13.39404296875, 14.004638671875, 14.615234375, 15.225830078125, 15.83642578125, 16.447021484375, 17.0576171875, 17.668212890625, 18.27880859375, 18.889404296875, 19.5]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 7.0, 9.0, 11.0, 11.0, 24.0, 21.0, 21.0, 28.0, 27.0, 35.0, 34.0, 33.0, 36.0, 36.0, 43.0, 50.0, 52.0, 40.0, 56.0, 35.0, 40.0, 31.0, 41.0, 28.0, 44.0, 27.0, 24.0, 21.0, 23.0, 16.0, 12.0, 12.0, 20.0, 12.0, 5.0, 8.0, 6.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.234375, -14.778564453125, -14.32275390625, -13.866943359375, -13.4111328125, -12.955322265625, -12.49951171875, -12.043701171875, -11.587890625, -11.132080078125, -10.67626953125, -10.220458984375, -9.7646484375, -9.308837890625, -8.85302734375, -8.397216796875, -7.94140625, -7.485595703125, -7.02978515625, -6.573974609375, -6.1181640625, -5.662353515625, -5.20654296875, -4.750732421875, -4.294921875, -3.839111328125, -3.38330078125, -2.927490234375, -2.4716796875, -2.015869140625, -1.56005859375, -1.104248046875, -0.6484375, -0.192626953125, 0.26318359375, 0.718994140625, 1.1748046875, 1.630615234375, 2.08642578125, 2.542236328125, 2.998046875, 3.453857421875, 3.90966796875, 4.365478515625, 4.8212890625, 5.277099609375, 5.73291015625, 6.188720703125, 6.64453125, 7.100341796875, 7.55615234375, 8.011962890625, 8.4677734375, 8.923583984375, 9.37939453125, 9.835205078125, 10.291015625, 10.746826171875, 11.20263671875, 11.658447265625, 12.1142578125, 12.570068359375, 13.02587890625, 13.481689453125, 13.9375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 15.0, 18.0, 22.0, 52.0, 71.0, 108.0, 184.0, 265.0, 418.0, 688.0, 1104.0, 1831.0, 3366.0, 5924.0, 10997.0, 20369.0, 37645.0, 68995.0, 116547.0, 169604.0, 193278.0, 164236.0, 110507.0, 64643.0, 35108.0, 19078.0, 10166.0, 5468.0, 3156.0, 1857.0, 1073.0, 633.0, 429.0, 243.0, 155.0, 101.0, 66.0, 51.0, 30.0, 21.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.54681396484375, -4.3748779296875, -4.20294189453125, -4.031005859375, -3.85906982421875, -3.6871337890625, -3.51519775390625, -3.34326171875, -3.17132568359375, -2.9993896484375, -2.82745361328125, -2.655517578125, -2.48358154296875, -2.3116455078125, -2.13970947265625, -1.9677734375, -1.79583740234375, -1.6239013671875, -1.45196533203125, -1.280029296875, -1.10809326171875, -0.9361572265625, -0.76422119140625, -0.59228515625, -0.42034912109375, -0.2484130859375, -0.07647705078125, 0.095458984375, 0.26739501953125, 0.4393310546875, 0.61126708984375, 0.783203125, 0.95513916015625, 1.1270751953125, 1.29901123046875, 1.470947265625, 1.64288330078125, 1.8148193359375, 1.98675537109375, 2.15869140625, 2.33062744140625, 2.5025634765625, 2.67449951171875, 2.846435546875, 3.01837158203125, 3.1903076171875, 3.36224365234375, 3.5341796875, 3.70611572265625, 3.8780517578125, 4.04998779296875, 4.221923828125, 4.39385986328125, 4.5657958984375, 4.73773193359375, 4.90966796875, 5.08160400390625, 5.2535400390625, 5.42547607421875, 5.597412109375, 5.76934814453125, 5.9412841796875, 6.11322021484375, 6.28515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 3.0, 3.0, 7.0, 7.0, 12.0, 13.0, 17.0, 21.0, 16.0, 21.0, 33.0, 36.0, 43.0, 48.0, 46.0, 64.0, 47.0, 42.0, 51.0, 54.0, 50.0, 44.0, 39.0, 45.0, 33.0, 35.0, 27.0, 24.0, 24.0, 16.0, 8.0, 8.0, 11.0, 11.0, 8.0, 5.0, 5.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003809928894042969, -0.0003685168921947479, -0.000356040894985199, -0.00034356489777565, -0.0003310889005661011, -0.0003186129033565521, -0.0003061369061470032, -0.0002936609089374542, -0.0002811849117279053, -0.0002687089145183563, -0.0002562329173088074, -0.00024375692009925842, -0.00023128092288970947, -0.00021880492568016052, -0.00020632892847061157, -0.00019385293126106262, -0.00018137693405151367, -0.00016890093684196472, -0.00015642493963241577, -0.00014394894242286682, -0.00013147294521331787, -0.00011899694800376892, -0.00010652095079421997, -9.404495358467102e-05, -8.156895637512207e-05, -6.909295916557312e-05, -5.661696195602417e-05, -4.414096474647522e-05, -3.166496753692627e-05, -1.918897032737732e-05, -6.712973117828369e-06, 5.763024091720581e-06, 1.823902130126953e-05, 3.071501851081848e-05, 4.319101572036743e-05, 5.566701292991638e-05, 6.814301013946533e-05, 8.061900734901428e-05, 9.309500455856323e-05, 0.00010557100176811218, 0.00011804699897766113, 0.00013052299618721008, 0.00014299899339675903, 0.00015547499060630798, 0.00016795098781585693, 0.00018042698502540588, 0.00019290298223495483, 0.00020537897944450378, 0.00021785497665405273, 0.00023033097386360168, 0.00024280697107315063, 0.0002552829682826996, 0.00026775896549224854, 0.0002802349627017975, 0.00029271095991134644, 0.0003051869571208954, 0.00031766295433044434, 0.0003301389515399933, 0.00034261494874954224, 0.0003550909459590912, 0.00036756694316864014, 0.0003800429403781891, 0.00039251893758773804, 0.000404994934797287, 0.00041747093200683594]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 8.0, 17.0, 23.0, 47.0, 68.0, 82.0, 149.0, 226.0, 380.0, 625.0, 996.0, 1580.0, 2650.0, 4260.0, 7270.0, 12118.0, 20653.0, 34633.0, 57115.0, 90245.0, 129186.0, 158455.0, 159502.0, 130694.0, 91912.0, 57905.0, 35256.0, 21186.0, 12504.0, 7478.0, 4495.0, 2632.0, 1581.0, 995.0, 623.0, 354.0, 247.0, 137.0, 96.0, 61.0, 43.0, 24.0, 14.0, 10.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.87109375, -4.72357177734375, -4.5760498046875, -4.42852783203125, -4.281005859375, -4.13348388671875, -3.9859619140625, -3.83843994140625, -3.69091796875, -3.54339599609375, -3.3958740234375, -3.24835205078125, -3.100830078125, -2.95330810546875, -2.8057861328125, -2.65826416015625, -2.5107421875, -2.36322021484375, -2.2156982421875, -2.06817626953125, -1.920654296875, -1.77313232421875, -1.6256103515625, -1.47808837890625, -1.33056640625, -1.18304443359375, -1.0355224609375, -0.88800048828125, -0.740478515625, -0.59295654296875, -0.4454345703125, -0.29791259765625, -0.150390625, -0.00286865234375, 0.1446533203125, 0.29217529296875, 0.439697265625, 0.58721923828125, 0.7347412109375, 0.88226318359375, 1.02978515625, 1.17730712890625, 1.3248291015625, 1.47235107421875, 1.619873046875, 1.76739501953125, 1.9149169921875, 2.06243896484375, 2.2099609375, 2.35748291015625, 2.5050048828125, 2.65252685546875, 2.800048828125, 2.94757080078125, 3.0950927734375, 3.24261474609375, 3.39013671875, 3.53765869140625, 3.6851806640625, 3.83270263671875, 3.980224609375, 4.12774658203125, 4.2752685546875, 4.42279052734375, 4.5703125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 9.0, 5.0, 6.0, 16.0, 27.0, 26.0, 46.0, 39.0, 60.0, 54.0, 60.0, 71.0, 73.0, 58.0, 75.0, 56.0, 51.0, 43.0, 40.0, 33.0, 35.0, 21.0, 28.0, 11.0, 10.0, 10.0, 7.0, 4.0, 0.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.613922119140625, -1.54620361328125, -1.478485107421875, -1.4107666015625, -1.343048095703125, -1.27532958984375, -1.207611083984375, -1.139892578125, -1.072174072265625, -1.00445556640625, -0.936737060546875, -0.8690185546875, -0.801300048828125, -0.73358154296875, -0.665863037109375, -0.59814453125, -0.530426025390625, -0.46270751953125, -0.394989013671875, -0.3272705078125, -0.259552001953125, -0.19183349609375, -0.124114990234375, -0.056396484375, 0.011322021484375, 0.07904052734375, 0.146759033203125, 0.2144775390625, 0.282196044921875, 0.34991455078125, 0.417633056640625, 0.4853515625, 0.553070068359375, 0.62078857421875, 0.688507080078125, 0.7562255859375, 0.823944091796875, 0.89166259765625, 0.959381103515625, 1.027099609375, 1.094818115234375, 1.16253662109375, 1.230255126953125, 1.2979736328125, 1.365692138671875, 1.43341064453125, 1.501129150390625, 1.56884765625, 1.636566162109375, 1.70428466796875, 1.772003173828125, 1.8397216796875, 1.907440185546875, 1.97515869140625, 2.042877197265625, 2.110595703125, 2.178314208984375, 2.24603271484375, 2.313751220703125, 2.3814697265625, 2.449188232421875, 2.51690673828125, 2.584625244140625, 2.65234375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 11.0, 19.0, 21.0, 18.0, 22.0, 19.0, 35.0, 34.0, 35.0, 43.0, 50.0, 69.0, 61.0, 59.0, 62.0, 56.0, 48.0, 56.0, 48.0, 50.0, 38.0, 24.0, 33.0, 14.0, 20.0, 20.0, 14.0, 3.0, 8.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.108938217163086, -28.323537826538086, -27.538135528564453, -26.752735137939453, -25.967334747314453, -25.18193244934082, -24.39653205871582, -23.611129760742188, -22.825729370117188, -22.040328979492188, -21.254926681518555, -20.469526290893555, -19.684123992919922, -18.898723602294922, -18.113323211669922, -17.327922821044922, -16.54252052307129, -15.757119178771973, -14.971717834472656, -14.186317443847656, -13.40091609954834, -12.615514755249023, -11.830114364624023, -11.044713020324707, -10.25931167602539, -9.473910331726074, -8.688508987426758, -7.903108596801758, -7.117707252502441, -6.332305908203125, -5.546905040740967, -4.761504173278809, -3.9761009216308594, -3.190699815750122, -2.4052987098693848, -1.6198976039886475, -0.8344964981079102, -0.04909539222717285, 0.7363057136535645, 1.5217065811157227, 2.307107925415039, 3.0925090312957764, 3.8779101371765137, 4.663311004638672, 5.448712348937988, 6.234113693237305, 7.019514560699463, 7.804915428161621, 8.590316772460938, 9.375718116760254, 10.16111946105957, 10.94651985168457, 11.731921195983887, 12.517322540283203, 13.302722930908203, 14.08812427520752, 14.873525619506836, 15.658926963806152, 16.44432830810547, 17.22972869873047, 18.01512908935547, 18.8005313873291, 19.5859317779541, 20.371334075927734, 21.156734466552734]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 8.0, 6.0, 7.0, 15.0, 12.0, 20.0, 17.0, 13.0, 26.0, 22.0, 22.0, 25.0, 28.0, 30.0, 29.0, 42.0, 39.0, 31.0, 38.0, 49.0, 42.0, 37.0, 38.0, 49.0, 33.0, 37.0, 32.0, 27.0, 30.0, 29.0, 24.0, 15.0, 21.0, 14.0, 12.0, 18.0, 7.0, 8.0, 11.0, 10.0, 6.0, 5.0, 6.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.1672420501709, -20.513273239135742, -19.85930633544922, -19.205337524414062, -18.551368713378906, -17.89739990234375, -17.243432998657227, -16.58946418762207, -15.93549633026123, -15.28152847290039, -14.627559661865234, -13.973591804504395, -13.319623947143555, -12.665655136108398, -12.011687278747559, -11.357719421386719, -10.703750610351562, -10.049782752990723, -9.395813941955566, -8.741846084594727, -8.08787727355957, -7.4339094161987305, -6.779941558837891, -6.125973224639893, -5.4720048904418945, -4.8180365562438965, -4.164068222045898, -3.5101003646850586, -2.8561320304870605, -2.2021636962890625, -1.5481956005096436, -0.8942275047302246, -0.24025726318359375, 0.41371095180511475, 1.0676791667938232, 1.7216473817825317, 2.3756155967712402, 3.0295839309692383, 3.6835520267486572, 4.337520122528076, 4.991488456726074, 5.645456790924072, 6.29942512512207, 6.95339298248291, 7.607361316680908, 8.261329650878906, 8.915297508239746, 9.569265365600586, 10.223234176635742, 10.877202033996582, 11.531170845031738, 12.185138702392578, 12.839107513427734, 13.493075370788574, 14.147043228149414, 14.80101203918457, 15.45497989654541, 16.10894775390625, 16.762916564941406, 17.416885375976562, 18.070852279663086, 18.724821090698242, 19.3787899017334, 20.032756805419922, 20.686725616455078]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 15.0, 23.0, 36.0, 55.0, 99.0, 149.0, 227.0, 418.0, 644.0, 1134.0, 1847.0, 3042.0, 5173.0, 8849.0, 15459.0, 26355.0, 46473.0, 81211.0, 144041.0, 255361.0, 436849.0, 655070.0, 769838.0, 670137.0, 452911.0, 269377.0, 151325.0, 84967.0, 48078.0, 27157.0, 15707.0, 8972.0, 5378.0, 3192.0, 1869.0, 1126.0, 635.0, 411.0, 252.0, 145.0, 94.0, 69.0, 25.0, 31.0, 21.0, 8.0, 6.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.078125, -16.5, -15.921875, -15.34375, -14.765625, -14.1875, -13.609375, -13.03125, -12.453125, -11.875, -11.296875, -10.71875, -10.140625, -9.5625, -8.984375, -8.40625, -7.828125, -7.25, -6.671875, -6.09375, -5.515625, -4.9375, -4.359375, -3.78125, -3.203125, -2.625, -2.046875, -1.46875, -0.890625, -0.3125, 0.265625, 0.84375, 1.421875, 2.0, 2.578125, 3.15625, 3.734375, 4.3125, 4.890625, 5.46875, 6.046875, 6.625, 7.203125, 7.78125, 8.359375, 8.9375, 9.515625, 10.09375, 10.671875, 11.25, 11.828125, 12.40625, 12.984375, 13.5625, 14.140625, 14.71875, 15.296875, 15.875, 16.453125, 17.03125, 17.609375, 18.1875, 18.765625, 19.34375]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 6.0, 6.0, 8.0, 5.0, 11.0, 16.0, 17.0, 15.0, 18.0, 23.0, 15.0, 28.0, 29.0, 32.0, 26.0, 47.0, 32.0, 37.0, 44.0, 40.0, 37.0, 46.0, 32.0, 43.0, 37.0, 35.0, 48.0, 45.0, 24.0, 23.0, 23.0, 31.0, 16.0, 14.0, 21.0, 16.0, 13.0, 8.0, 6.0, 9.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.4765625, -14.0130615234375, -13.549560546875, -13.0860595703125, -12.62255859375, -12.1590576171875, -11.695556640625, -11.2320556640625, -10.7685546875, -10.3050537109375, -9.841552734375, -9.3780517578125, -8.91455078125, -8.4510498046875, -7.987548828125, -7.5240478515625, -7.060546875, -6.5970458984375, -6.133544921875, -5.6700439453125, -5.20654296875, -4.7430419921875, -4.279541015625, -3.8160400390625, -3.3525390625, -2.8890380859375, -2.425537109375, -1.9620361328125, -1.49853515625, -1.0350341796875, -0.571533203125, -0.1080322265625, 0.35546875, 0.8189697265625, 1.282470703125, 1.7459716796875, 2.20947265625, 2.6729736328125, 3.136474609375, 3.5999755859375, 4.0634765625, 4.5269775390625, 4.990478515625, 5.4539794921875, 5.91748046875, 6.3809814453125, 6.844482421875, 7.3079833984375, 7.771484375, 8.2349853515625, 8.698486328125, 9.1619873046875, 9.62548828125, 10.0889892578125, 10.552490234375, 11.0159912109375, 11.4794921875, 11.9429931640625, 12.406494140625, 12.8699951171875, 13.33349609375, 13.7969970703125, 14.260498046875, 14.7239990234375, 15.1875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 7.0, 16.0, 20.0, 41.0, 58.0, 110.0, 147.0, 240.0, 365.0, 577.0, 821.0, 1244.0, 1925.0, 2824.0, 4431.0, 6733.0, 10522.0, 15827.0, 24410.0, 37043.0, 56023.0, 83943.0, 123164.0, 176347.0, 244645.0, 325140.0, 405761.0, 463161.0, 476740.0, 437160.0, 362299.0, 281769.0, 206253.0, 145995.0, 100054.0, 67897.0, 45277.0, 29568.0, 19718.0, 12753.0, 8261.0, 5262.0, 3503.0, 2199.0, 1407.0, 972.0, 580.0, 409.0, 253.0, 153.0, 102.0, 59.0, 35.0, 32.0, 15.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0], "bins": [-11.890625, -11.5098876953125, -11.129150390625, -10.7484130859375, -10.36767578125, -9.9869384765625, -9.606201171875, -9.2254638671875, -8.8447265625, -8.4639892578125, -8.083251953125, -7.7025146484375, -7.32177734375, -6.9410400390625, -6.560302734375, -6.1795654296875, -5.798828125, -5.4180908203125, -5.037353515625, -4.6566162109375, -4.27587890625, -3.8951416015625, -3.514404296875, -3.1336669921875, -2.7529296875, -2.3721923828125, -1.991455078125, -1.6107177734375, -1.22998046875, -0.8492431640625, -0.468505859375, -0.0877685546875, 0.29296875, 0.6737060546875, 1.054443359375, 1.4351806640625, 1.81591796875, 2.1966552734375, 2.577392578125, 2.9581298828125, 3.3388671875, 3.7196044921875, 4.100341796875, 4.4810791015625, 4.86181640625, 5.2425537109375, 5.623291015625, 6.0040283203125, 6.384765625, 6.7655029296875, 7.146240234375, 7.5269775390625, 7.90771484375, 8.2884521484375, 8.669189453125, 9.0499267578125, 9.4306640625, 9.8114013671875, 10.192138671875, 10.5728759765625, 10.95361328125, 11.3343505859375, 11.715087890625, 12.0958251953125, 12.4765625]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 10.0, 9.0, 11.0, 11.0, 4.0, 12.0, 13.0, 21.0, 32.0, 24.0, 34.0, 48.0, 69.0, 71.0, 86.0, 114.0, 132.0, 137.0, 163.0, 170.0, 203.0, 214.0, 222.0, 241.0, 218.0, 221.0, 215.0, 224.0, 168.0, 179.0, 140.0, 117.0, 114.0, 102.0, 69.0, 62.0, 48.0, 42.0, 28.0, 21.0, 15.0, 18.0, 4.0, 7.0, 9.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3203125, -7.0950927734375, -6.869873046875, -6.6446533203125, -6.41943359375, -6.1942138671875, -5.968994140625, -5.7437744140625, -5.5185546875, -5.2933349609375, -5.068115234375, -4.8428955078125, -4.61767578125, -4.3924560546875, -4.167236328125, -3.9420166015625, -3.716796875, -3.4915771484375, -3.266357421875, -3.0411376953125, -2.81591796875, -2.5906982421875, -2.365478515625, -2.1402587890625, -1.9150390625, -1.6898193359375, -1.464599609375, -1.2393798828125, -1.01416015625, -0.7889404296875, -0.563720703125, -0.3385009765625, -0.11328125, 0.1119384765625, 0.337158203125, 0.5623779296875, 0.78759765625, 1.0128173828125, 1.238037109375, 1.4632568359375, 1.6884765625, 1.9136962890625, 2.138916015625, 2.3641357421875, 2.58935546875, 2.8145751953125, 3.039794921875, 3.2650146484375, 3.490234375, 3.7154541015625, 3.940673828125, 4.1658935546875, 4.39111328125, 4.6163330078125, 4.841552734375, 5.0667724609375, 5.2919921875, 5.5172119140625, 5.742431640625, 5.9676513671875, 6.19287109375, 6.4180908203125, 6.643310546875, 6.8685302734375, 7.09375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 4.0, 12.0, 12.0, 23.0, 18.0, 28.0, 31.0, 49.0, 65.0, 49.0, 52.0, 58.0, 58.0, 73.0, 66.0, 69.0, 58.0, 47.0, 36.0, 48.0, 35.0, 25.0, 21.0, 12.0, 10.0, 11.0, 13.0, 4.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0], "bins": [-28.861404418945312, -28.17311668395996, -27.48482894897461, -26.796541213989258, -26.108253479003906, -25.419965744018555, -24.731678009033203, -24.043392181396484, -23.3551025390625, -22.66681480407715, -21.978527069091797, -21.290239334106445, -20.601951599121094, -19.913663864135742, -19.22537612915039, -18.537090301513672, -17.84880256652832, -17.16051483154297, -16.472227096557617, -15.783939361572266, -15.095651626586914, -14.407363891601562, -13.719077110290527, -13.030789375305176, -12.342501640319824, -11.654213905334473, -10.965926170349121, -10.277639389038086, -9.589351654052734, -8.901063919067383, -8.212776184082031, -7.52448844909668, -6.836199760437012, -6.14791202545166, -5.459624290466309, -4.771337032318115, -4.083049297332764, -3.394761562347412, -2.7064743041992188, -2.018186569213867, -1.3298988342285156, -0.6416112184524536, 0.0466763973236084, 0.7349638938903809, 1.4232516288757324, 2.111539363861084, 2.7998266220092773, 3.488114356994629, 4.1764020919799805, 4.864689826965332, 5.552977561950684, 6.241264820098877, 6.9295525550842285, 7.61784029006958, 8.306127548217773, 8.994415283203125, 9.682703018188477, 10.370990753173828, 11.05927848815918, 11.747566223144531, 12.435853958129883, 13.124141693115234, 13.81242847442627, 14.500716209411621, 15.189003944396973]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 5.0, 11.0, 9.0, 9.0, 24.0, 23.0, 23.0, 27.0, 35.0, 37.0, 24.0, 28.0, 35.0, 35.0, 49.0, 34.0, 40.0, 44.0, 41.0, 33.0, 40.0, 43.0, 43.0, 40.0, 36.0, 25.0, 27.0, 29.0, 23.0, 17.0, 16.0, 14.0, 18.0, 8.0, 5.0, 6.0, 10.0, 6.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.344175338745117, -16.79852294921875, -16.252872467041016, -15.707220077514648, -15.161567687988281, -14.61591625213623, -14.07026481628418, -13.524612426757812, -12.978960990905762, -12.433309555053711, -11.887657165527344, -11.342005729675293, -10.796354293823242, -10.250701904296875, -9.705050468444824, -9.159399032592773, -8.613746643066406, -8.068095207214355, -7.522442817687988, -6.9767913818359375, -6.4311394691467285, -5.8854875564575195, -5.339836120605469, -4.79418420791626, -4.248532295227051, -3.702880382537842, -3.157228708267212, -2.611577033996582, -2.065925121307373, -1.520273208618164, -0.9746215343475342, -0.4289698600769043, 0.11668205261230469, 0.6623338460922241, 1.2079856395721436, 1.753637433052063, 2.2992892265319824, 2.8449411392211914, 3.3905928134918213, 3.936244487762451, 4.48189640045166, 5.027548313140869, 5.573200225830078, 6.118851661682129, 6.664503574371338, 7.210155487060547, 7.755806922912598, 8.301458358764648, 8.847110748291016, 9.392762184143066, 9.938414573669434, 10.484066009521484, 11.029718399047852, 11.575369834899902, 12.121021270751953, 12.66667366027832, 13.212325096130371, 13.757976531982422, 14.303628921508789, 14.84928035736084, 15.39493179321289, 15.940584182739258, 16.486236572265625, 17.03188705444336, 17.577539443969727]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 13.0, 8.0, 21.0, 15.0, 41.0, 51.0, 66.0, 123.0, 153.0, 232.0, 368.0, 511.0, 822.0, 1259.0, 1845.0, 2848.0, 4253.0, 6450.0, 9905.0, 14836.0, 23213.0, 35464.0, 54410.0, 81281.0, 118559.0, 158632.0, 160228.0, 123265.0, 85307.0, 57006.0, 37340.0, 24260.0, 15763.0, 10302.0, 6653.0, 4477.0, 2905.0, 1878.0, 1265.0, 841.0, 564.0, 377.0, 237.0, 161.0, 107.0, 83.0, 65.0, 31.0, 26.0, 10.0, 8.0, 7.0, 4.0, 7.0, 4.0, 1.0, 3.0], "bins": [-3.248046875, -3.1497802734375, -3.051513671875, -2.9532470703125, -2.85498046875, -2.7567138671875, -2.658447265625, -2.5601806640625, -2.4619140625, -2.3636474609375, -2.265380859375, -2.1671142578125, -2.06884765625, -1.9705810546875, -1.872314453125, -1.7740478515625, -1.67578125, -1.5775146484375, -1.479248046875, -1.3809814453125, -1.28271484375, -1.1844482421875, -1.086181640625, -0.9879150390625, -0.8896484375, -0.7913818359375, -0.693115234375, -0.5948486328125, -0.49658203125, -0.3983154296875, -0.300048828125, -0.2017822265625, -0.103515625, -0.0052490234375, 0.093017578125, 0.1912841796875, 0.28955078125, 0.3878173828125, 0.486083984375, 0.5843505859375, 0.6826171875, 0.7808837890625, 0.879150390625, 0.9774169921875, 1.07568359375, 1.1739501953125, 1.272216796875, 1.3704833984375, 1.46875, 1.5670166015625, 1.665283203125, 1.7635498046875, 1.86181640625, 1.9600830078125, 2.058349609375, 2.1566162109375, 2.2548828125, 2.3531494140625, 2.451416015625, 2.5496826171875, 2.64794921875, 2.7462158203125, 2.844482421875, 2.9427490234375, 3.041015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 8.0, 6.0, 12.0, 6.0, 12.0, 15.0, 19.0, 22.0, 20.0, 26.0, 27.0, 30.0, 36.0, 29.0, 37.0, 36.0, 37.0, 41.0, 39.0, 51.0, 36.0, 41.0, 34.0, 37.0, 36.0, 39.0, 34.0, 35.0, 36.0, 18.0, 22.0, 23.0, 15.0, 17.0, 12.0, 13.0, 7.0, 7.0, 9.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.234375, -16.691162109375, -16.14794921875, -15.604736328125, -15.0615234375, -14.518310546875, -13.97509765625, -13.431884765625, -12.888671875, -12.345458984375, -11.80224609375, -11.259033203125, -10.7158203125, -10.172607421875, -9.62939453125, -9.086181640625, -8.54296875, -7.999755859375, -7.45654296875, -6.913330078125, -6.3701171875, -5.826904296875, -5.28369140625, -4.740478515625, -4.197265625, -3.654052734375, -3.11083984375, -2.567626953125, -2.0244140625, -1.481201171875, -0.93798828125, -0.394775390625, 0.1484375, 0.691650390625, 1.23486328125, 1.778076171875, 2.3212890625, 2.864501953125, 3.40771484375, 3.950927734375, 4.494140625, 5.037353515625, 5.58056640625, 6.123779296875, 6.6669921875, 7.210205078125, 7.75341796875, 8.296630859375, 8.83984375, 9.383056640625, 9.92626953125, 10.469482421875, 11.0126953125, 11.555908203125, 12.09912109375, 12.642333984375, 13.185546875, 13.728759765625, 14.27197265625, 14.815185546875, 15.3583984375, 15.901611328125, 16.44482421875, 16.988037109375, 17.53125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 10.0, 2.0, 8.0, 7.0, 14.0, 16.0, 21.0, 31.0, 47.0, 52.0, 81.0, 82.0, 126.0, 160.0, 203.0, 323.0, 409.0, 606.0, 872.0, 1443.0, 2670.0, 5029.0, 10684.0, 24860.0, 71037.0, 869219.0, 32552.0, 13588.0, 6134.0, 3121.0, 1725.0, 1013.0, 654.0, 455.0, 331.0, 231.0, 166.0, 128.0, 96.0, 73.0, 69.0, 54.0, 34.0, 40.0, 20.0, 9.0, 5.0, 7.0, 4.0, 8.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.34375, -9.052978515625, -8.76220703125, -8.471435546875, -8.1806640625, -7.889892578125, -7.59912109375, -7.308349609375, -7.017578125, -6.726806640625, -6.43603515625, -6.145263671875, -5.8544921875, -5.563720703125, -5.27294921875, -4.982177734375, -4.69140625, -4.400634765625, -4.10986328125, -3.819091796875, -3.5283203125, -3.237548828125, -2.94677734375, -2.656005859375, -2.365234375, -2.074462890625, -1.78369140625, -1.492919921875, -1.2021484375, -0.911376953125, -0.62060546875, -0.329833984375, -0.0390625, 0.251708984375, 0.54248046875, 0.833251953125, 1.1240234375, 1.414794921875, 1.70556640625, 1.996337890625, 2.287109375, 2.577880859375, 2.86865234375, 3.159423828125, 3.4501953125, 3.740966796875, 4.03173828125, 4.322509765625, 4.61328125, 4.904052734375, 5.19482421875, 5.485595703125, 5.7763671875, 6.067138671875, 6.35791015625, 6.648681640625, 6.939453125, 7.230224609375, 7.52099609375, 7.811767578125, 8.1025390625, 8.393310546875, 8.68408203125, 8.974853515625, 9.265625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 10.0, 8.0, 5.0, 8.0, 10.0, 16.0, 27.0, 17.0, 29.0, 34.0, 28.0, 40.0, 42.0, 43.0, 42.0, 46.0, 36.0, 46.0, 39.0, 46.0, 34.0, 56.0, 39.0, 29.0, 41.0, 39.0, 32.0, 25.0, 19.0, 24.0, 17.0, 12.0, 14.0, 11.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7109375, -14.277587890625, -13.84423828125, -13.410888671875, -12.9775390625, -12.544189453125, -12.11083984375, -11.677490234375, -11.244140625, -10.810791015625, -10.37744140625, -9.944091796875, -9.5107421875, -9.077392578125, -8.64404296875, -8.210693359375, -7.77734375, -7.343994140625, -6.91064453125, -6.477294921875, -6.0439453125, -5.610595703125, -5.17724609375, -4.743896484375, -4.310546875, -3.877197265625, -3.44384765625, -3.010498046875, -2.5771484375, -2.143798828125, -1.71044921875, -1.277099609375, -0.84375, -0.410400390625, 0.02294921875, 0.456298828125, 0.8896484375, 1.322998046875, 1.75634765625, 2.189697265625, 2.623046875, 3.056396484375, 3.48974609375, 3.923095703125, 4.3564453125, 4.789794921875, 5.22314453125, 5.656494140625, 6.08984375, 6.523193359375, 6.95654296875, 7.389892578125, 7.8232421875, 8.256591796875, 8.68994140625, 9.123291015625, 9.556640625, 9.989990234375, 10.42333984375, 10.856689453125, 11.2900390625, 11.723388671875, 12.15673828125, 12.590087890625, 13.0234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 7.0, 16.0, 22.0, 43.0, 40.0, 53.0, 80.0, 106.0, 163.0, 281.0, 393.0, 711.0, 1631.0, 3433.0, 10692.0, 90013.0, 920125.0, 12912.0, 4002.0, 1697.0, 793.0, 469.0, 276.0, 172.0, 129.0, 73.0, 61.0, 37.0, 28.0, 17.0, 18.0, 18.0, 12.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.337554931640625, -4.20635986328125, -4.075164794921875, -3.9439697265625, -3.812774658203125, -3.68157958984375, -3.550384521484375, -3.419189453125, -3.287994384765625, -3.15679931640625, -3.025604248046875, -2.8944091796875, -2.763214111328125, -2.63201904296875, -2.500823974609375, -2.36962890625, -2.238433837890625, -2.10723876953125, -1.976043701171875, -1.8448486328125, -1.713653564453125, -1.58245849609375, -1.451263427734375, -1.320068359375, -1.188873291015625, -1.05767822265625, -0.926483154296875, -0.7952880859375, -0.664093017578125, -0.53289794921875, -0.401702880859375, -0.2705078125, -0.139312744140625, -0.00811767578125, 0.123077392578125, 0.2542724609375, 0.385467529296875, 0.51666259765625, 0.647857666015625, 0.779052734375, 0.910247802734375, 1.04144287109375, 1.172637939453125, 1.3038330078125, 1.435028076171875, 1.56622314453125, 1.697418212890625, 1.82861328125, 1.959808349609375, 2.09100341796875, 2.222198486328125, 2.3533935546875, 2.484588623046875, 2.61578369140625, 2.746978759765625, 2.878173828125, 3.009368896484375, 3.14056396484375, 3.271759033203125, 3.4029541015625, 3.534149169921875, 3.66534423828125, 3.796539306640625, 3.927734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 9.0, 6.0, 1.0, 9.0, 4.0, 10.0, 20.0, 17.0, 22.0, 19.0, 21.0, 32.0, 27.0, 44.0, 69.0, 56.0, 66.0, 61.0, 74.0, 58.0, 53.0, 55.0, 43.0, 48.0, 34.0, 28.0, 35.0, 18.0, 11.0, 8.0, 9.0, 6.0, 6.0, 4.0, 9.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.574920654296875e-05, -2.4971552193164825e-05, -2.41938978433609e-05, -2.3416243493556976e-05, -2.2638589143753052e-05, -2.1860934793949127e-05, -2.1083280444145203e-05, -2.0305626094341278e-05, -1.9527971744537354e-05, -1.875031739473343e-05, -1.7972663044929504e-05, -1.719500869512558e-05, -1.6417354345321655e-05, -1.563969999551773e-05, -1.4862045645713806e-05, -1.4084391295909882e-05, -1.3306736946105957e-05, -1.2529082596302032e-05, -1.1751428246498108e-05, -1.0973773896694183e-05, -1.0196119546890259e-05, -9.418465197086334e-06, -8.64081084728241e-06, -7.863156497478485e-06, -7.0855021476745605e-06, -6.307847797870636e-06, -5.5301934480667114e-06, -4.752539098262787e-06, -3.974884748458862e-06, -3.1972303986549377e-06, -2.419576048851013e-06, -1.6419216990470886e-06, -8.642673492431641e-07, -8.66129994392395e-08, 6.910413503646851e-07, 1.4686957001686096e-06, 2.246350049972534e-06, 3.0240043997764587e-06, 3.8016587495803833e-06, 4.579313099384308e-06, 5.356967449188232e-06, 6.134621798992157e-06, 6.9122761487960815e-06, 7.689930498600006e-06, 8.46758484840393e-06, 9.245239198207855e-06, 1.002289354801178e-05, 1.0800547897815704e-05, 1.1578202247619629e-05, 1.2355856597423553e-05, 1.3133510947227478e-05, 1.3911165297031403e-05, 1.4688819646835327e-05, 1.5466473996639252e-05, 1.6244128346443176e-05, 1.70217826962471e-05, 1.7799437046051025e-05, 1.857709139585495e-05, 1.9354745745658875e-05, 2.01324000954628e-05, 2.0910054445266724e-05, 2.1687708795070648e-05, 2.2465363144874573e-05, 2.3243017494678497e-05, 2.4020671844482422e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 16.0, 28.0, 37.0, 52.0, 71.0, 112.0, 181.0, 312.0, 432.0, 663.0, 1168.0, 1736.0, 2904.0, 4995.0, 8753.0, 15812.0, 30171.0, 63757.0, 149076.0, 376570.0, 219337.0, 86438.0, 39355.0, 20069.0, 10886.0, 6163.0, 3640.0, 2134.0, 1310.0, 833.0, 496.0, 369.0, 220.0, 158.0, 91.0, 64.0, 31.0, 30.0, 24.0, 9.0, 15.0, 5.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0859375, -1.0493621826171875, -1.012786865234375, -0.9762115478515625, -0.93963623046875, -0.9030609130859375, -0.866485595703125, -0.8299102783203125, -0.7933349609375, -0.7567596435546875, -0.720184326171875, -0.6836090087890625, -0.64703369140625, -0.6104583740234375, -0.573883056640625, -0.5373077392578125, -0.500732421875, -0.4641571044921875, -0.427581787109375, -0.3910064697265625, -0.35443115234375, -0.3178558349609375, -0.281280517578125, -0.2447052001953125, -0.2081298828125, -0.1715545654296875, -0.134979248046875, -0.0984039306640625, -0.06182861328125, -0.0252532958984375, 0.011322021484375, 0.0478973388671875, 0.08447265625, 0.1210479736328125, 0.157623291015625, 0.1941986083984375, 0.23077392578125, 0.2673492431640625, 0.303924560546875, 0.3404998779296875, 0.3770751953125, 0.4136505126953125, 0.450225830078125, 0.4868011474609375, 0.52337646484375, 0.5599517822265625, 0.596527099609375, 0.6331024169921875, 0.669677734375, 0.7062530517578125, 0.742828369140625, 0.7794036865234375, 0.81597900390625, 0.8525543212890625, 0.889129638671875, 0.9257049560546875, 0.9622802734375, 0.9988555908203125, 1.035430908203125, 1.0720062255859375, 1.10858154296875, 1.1451568603515625, 1.181732177734375, 1.2183074951171875, 1.2548828125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 6.0, 7.0, 6.0, 7.0, 17.0, 7.0, 16.0, 14.0, 22.0, 25.0, 42.0, 60.0, 71.0, 82.0, 80.0, 89.0, 94.0, 79.0, 58.0, 53.0, 36.0, 26.0, 17.0, 17.0, 13.0, 7.0, 8.0, 8.0, 8.0, 7.0, 6.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.424560546875, -0.4090080261230469, -0.39345550537109375, -0.3779029846191406, -0.3623504638671875, -0.3467979431152344, -0.33124542236328125, -0.3156929016113281, -0.300140380859375, -0.2845878601074219, -0.26903533935546875, -0.2534828186035156, -0.2379302978515625, -0.22237777709960938, -0.20682525634765625, -0.19127273559570312, -0.17572021484375, -0.16016769409179688, -0.14461517333984375, -0.12906265258789062, -0.1135101318359375, -0.09795761108398438, -0.08240509033203125, -0.06685256958007812, -0.051300048828125, -0.035747528076171875, -0.02019500732421875, -0.004642486572265625, 0.0109100341796875, 0.026462554931640625, 0.04201507568359375, 0.057567596435546875, 0.0731201171875, 0.08867263793945312, 0.10422515869140625, 0.11977767944335938, 0.1353302001953125, 0.15088272094726562, 0.16643524169921875, 0.18198776245117188, 0.197540283203125, 0.21309280395507812, 0.22864532470703125, 0.24419784545898438, 0.2597503662109375, 0.2753028869628906, 0.29085540771484375, 0.3064079284667969, 0.32196044921875, 0.3375129699707031, 0.35306549072265625, 0.3686180114746094, 0.3841705322265625, 0.3997230529785156, 0.41527557373046875, 0.4308280944824219, 0.446380615234375, 0.4619331359863281, 0.47748565673828125, 0.4930381774902344, 0.5085906982421875, 0.5241432189941406, 0.5396957397460938, 0.5552482604980469, 0.57080078125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 18.0, 17.0, 30.0, 31.0, 40.0, 62.0, 48.0, 51.0, 64.0, 52.0, 60.0, 74.0, 70.0, 55.0, 51.0, 42.0, 43.0, 41.0, 28.0, 24.0, 17.0, 12.0, 8.0, 12.0, 9.0, 2.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-27.527267456054688, -26.856971740722656, -26.186676025390625, -25.516380310058594, -24.846084594726562, -24.1757869720459, -23.505491256713867, -22.835195541381836, -22.164899826049805, -21.494604110717773, -20.824308395385742, -20.15401268005371, -19.483715057373047, -18.813419342041016, -18.143123626708984, -17.472827911376953, -16.802532196044922, -16.13223648071289, -15.46194076538086, -14.791644096374512, -14.12134838104248, -13.45105266571045, -12.780755996704102, -12.11046028137207, -11.440164566040039, -10.769868850708008, -10.099573135375977, -9.429276466369629, -8.758980751037598, -8.088685035705566, -7.418388843536377, -6.7480926513671875, -6.07779598236084, -5.407500267028809, -4.737204074859619, -4.06690788269043, -3.3966121673583984, -2.726316213607788, -2.0560202598571777, -1.3857240676879883, -0.715428352355957, -0.04513239860534668, 0.6251635551452637, 1.295459508895874, 1.9657554626464844, 2.6360514163970947, 3.306347370147705, 3.9766435623168945, 4.646939277648926, 5.317234992980957, 5.9875311851501465, 6.657827377319336, 7.328123092651367, 7.998418807983398, 8.66871452331543, 9.339011192321777, 10.009306907653809, 10.67960262298584, 11.349899291992188, 12.020195007324219, 12.69049072265625, 13.360786437988281, 14.031082153320312, 14.70137882232666, 15.371674537658691]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 7.0, 6.0, 8.0, 12.0, 14.0, 25.0, 18.0, 26.0, 25.0, 39.0, 33.0, 27.0, 24.0, 30.0, 51.0, 42.0, 31.0, 44.0, 40.0, 40.0, 37.0, 36.0, 48.0, 40.0, 42.0, 35.0, 21.0, 30.0, 27.0, 22.0, 16.0, 18.0, 10.0, 21.0, 6.0, 6.0, 8.0, 6.0, 8.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.94837188720703, -16.411834716796875, -15.875295639038086, -15.33875846862793, -14.802220344543457, -14.265682220458984, -13.729144096374512, -13.192605972290039, -12.656068801879883, -12.11953067779541, -11.582992553710938, -11.046455383300781, -10.509917259216309, -9.973379135131836, -9.436841011047363, -8.90030288696289, -8.363764762878418, -7.827226638793945, -7.290688991546631, -6.754150867462158, -6.217613220214844, -5.681075096130371, -5.144536972045898, -4.607998847961426, -4.071461200714111, -3.5349233150482178, -2.998385429382324, -2.4618473052978516, -1.925309419631958, -1.3887715339660645, -0.8522334098815918, -0.31569552421569824, 0.2208423614501953, 0.7573803067207336, 1.293918251991272, 1.830456256866455, 2.3669941425323486, 2.903532028198242, 3.440070152282715, 3.9766080379486084, 4.513145923614502, 5.049684047698975, 5.586221694946289, 6.122759819030762, 6.659297943115234, 7.195835590362549, 7.7323737144470215, 8.268911361694336, 8.805449485778809, 9.341987609863281, 9.878525733947754, 10.415063858032227, 10.951601028442383, 11.488139152526855, 12.024677276611328, 12.5612154006958, 13.097753524780273, 13.634291648864746, 14.170829772949219, 14.707366943359375, 15.243905067443848, 15.78044319152832, 16.31698226928711, 16.853519439697266, 17.390056610107422]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 9.0, 5.0, 4.0, 12.0, 22.0, 27.0, 50.0, 83.0, 112.0, 173.0, 292.0, 462.0, 674.0, 1076.0, 1603.0, 2676.0, 4376.0, 7120.0, 11773.0, 19334.0, 31951.0, 51332.0, 77723.0, 109007.0, 135455.0, 145307.0, 134368.0, 107962.0, 76015.0, 49693.0, 31422.0, 18910.0, 11487.0, 6769.0, 4241.0, 2599.0, 1626.0, 973.0, 671.0, 409.0, 276.0, 179.0, 115.0, 62.0, 47.0, 27.0, 20.0, 19.0, 9.0, 0.0, 5.0, 0.0, 3.0, 3.0, 1.0], "bins": [-16.71875, -16.2337646484375, -15.748779296875, -15.2637939453125, -14.77880859375, -14.2938232421875, -13.808837890625, -13.3238525390625, -12.8388671875, -12.3538818359375, -11.868896484375, -11.3839111328125, -10.89892578125, -10.4139404296875, -9.928955078125, -9.4439697265625, -8.958984375, -8.4739990234375, -7.989013671875, -7.5040283203125, -7.01904296875, -6.5340576171875, -6.049072265625, -5.5640869140625, -5.0791015625, -4.5941162109375, -4.109130859375, -3.6241455078125, -3.13916015625, -2.6541748046875, -2.169189453125, -1.6842041015625, -1.19921875, -0.7142333984375, -0.229248046875, 0.2557373046875, 0.74072265625, 1.2257080078125, 1.710693359375, 2.1956787109375, 2.6806640625, 3.1656494140625, 3.650634765625, 4.1356201171875, 4.62060546875, 5.1055908203125, 5.590576171875, 6.0755615234375, 6.560546875, 7.0455322265625, 7.530517578125, 8.0155029296875, 8.50048828125, 8.9854736328125, 9.470458984375, 9.9554443359375, 10.4404296875, 10.9254150390625, 11.410400390625, 11.8953857421875, 12.38037109375, 12.8653564453125, 13.350341796875, 13.8353271484375, 14.3203125]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 12.0, 20.0, 18.0, 30.0, 25.0, 28.0, 37.0, 34.0, 33.0, 32.0, 42.0, 39.0, 33.0, 43.0, 25.0, 39.0, 36.0, 45.0, 29.0, 42.0, 41.0, 31.0, 40.0, 20.0, 23.0, 28.0, 25.0, 20.0, 13.0, 13.0, 11.0, 8.0, 10.0, 4.0, 11.0, 2.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.09375, -15.591064453125, -15.08837890625, -14.585693359375, -14.0830078125, -13.580322265625, -13.07763671875, -12.574951171875, -12.072265625, -11.569580078125, -11.06689453125, -10.564208984375, -10.0615234375, -9.558837890625, -9.05615234375, -8.553466796875, -8.05078125, -7.548095703125, -7.04541015625, -6.542724609375, -6.0400390625, -5.537353515625, -5.03466796875, -4.531982421875, -4.029296875, -3.526611328125, -3.02392578125, -2.521240234375, -2.0185546875, -1.515869140625, -1.01318359375, -0.510498046875, -0.0078125, 0.494873046875, 0.99755859375, 1.500244140625, 2.0029296875, 2.505615234375, 3.00830078125, 3.510986328125, 4.013671875, 4.516357421875, 5.01904296875, 5.521728515625, 6.0244140625, 6.527099609375, 7.02978515625, 7.532470703125, 8.03515625, 8.537841796875, 9.04052734375, 9.543212890625, 10.0458984375, 10.548583984375, 11.05126953125, 11.553955078125, 12.056640625, 12.559326171875, 13.06201171875, 13.564697265625, 14.0673828125, 14.570068359375, 15.07275390625, 15.575439453125, 16.078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 10.0, 9.0, 13.0, 36.0, 40.0, 84.0, 132.0, 178.0, 313.0, 479.0, 768.0, 1122.0, 1737.0, 2769.0, 4256.0, 6676.0, 10552.0, 16157.0, 24669.0, 37280.0, 55287.0, 78153.0, 102655.0, 121563.0, 129294.0, 120495.0, 100360.0, 75723.0, 54123.0, 36156.0, 23886.0, 15539.0, 10063.0, 6468.0, 4194.0, 2604.0, 1668.0, 1107.0, 758.0, 455.0, 283.0, 159.0, 102.0, 58.0, 44.0, 27.0, 23.0, 14.0, 8.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5234375, -12.0833740234375, -11.643310546875, -11.2032470703125, -10.76318359375, -10.3231201171875, -9.883056640625, -9.4429931640625, -9.0029296875, -8.5628662109375, -8.122802734375, -7.6827392578125, -7.24267578125, -6.8026123046875, -6.362548828125, -5.9224853515625, -5.482421875, -5.0423583984375, -4.602294921875, -4.1622314453125, -3.72216796875, -3.2821044921875, -2.842041015625, -2.4019775390625, -1.9619140625, -1.5218505859375, -1.081787109375, -0.6417236328125, -0.20166015625, 0.2384033203125, 0.678466796875, 1.1185302734375, 1.55859375, 1.9986572265625, 2.438720703125, 2.8787841796875, 3.31884765625, 3.7589111328125, 4.198974609375, 4.6390380859375, 5.0791015625, 5.5191650390625, 5.959228515625, 6.3992919921875, 6.83935546875, 7.2794189453125, 7.719482421875, 8.1595458984375, 8.599609375, 9.0396728515625, 9.479736328125, 9.9197998046875, 10.35986328125, 10.7999267578125, 11.239990234375, 11.6800537109375, 12.1201171875, 12.5601806640625, 13.000244140625, 13.4403076171875, 13.88037109375, 14.3204345703125, 14.760498046875, 15.2005615234375, 15.640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 6.0, 5.0, 10.0, 4.0, 7.0, 13.0, 14.0, 24.0, 23.0, 21.0, 32.0, 27.0, 33.0, 30.0, 46.0, 34.0, 39.0, 42.0, 37.0, 51.0, 48.0, 36.0, 34.0, 35.0, 35.0, 30.0, 29.0, 35.0, 39.0, 19.0, 20.0, 21.0, 23.0, 22.0, 12.0, 14.0, 7.0, 10.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0], "bins": [-11.75, -11.40087890625, -11.0517578125, -10.70263671875, -10.353515625, -10.00439453125, -9.6552734375, -9.30615234375, -8.95703125, -8.60791015625, -8.2587890625, -7.90966796875, -7.560546875, -7.21142578125, -6.8623046875, -6.51318359375, -6.1640625, -5.81494140625, -5.4658203125, -5.11669921875, -4.767578125, -4.41845703125, -4.0693359375, -3.72021484375, -3.37109375, -3.02197265625, -2.6728515625, -2.32373046875, -1.974609375, -1.62548828125, -1.2763671875, -0.92724609375, -0.578125, -0.22900390625, 0.1201171875, 0.46923828125, 0.818359375, 1.16748046875, 1.5166015625, 1.86572265625, 2.21484375, 2.56396484375, 2.9130859375, 3.26220703125, 3.611328125, 3.96044921875, 4.3095703125, 4.65869140625, 5.0078125, 5.35693359375, 5.7060546875, 6.05517578125, 6.404296875, 6.75341796875, 7.1025390625, 7.45166015625, 7.80078125, 8.14990234375, 8.4990234375, 8.84814453125, 9.197265625, 9.54638671875, 9.8955078125, 10.24462890625, 10.59375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 12.0, 19.0, 28.0, 42.0, 46.0, 74.0, 114.0, 166.0, 278.0, 438.0, 605.0, 964.0, 1454.0, 2172.0, 3292.0, 5184.0, 8001.0, 12405.0, 18921.0, 28756.0, 43168.0, 62300.0, 85070.0, 109493.0, 125826.0, 127503.0, 114088.0, 92007.0, 67413.0, 47067.0, 31447.0, 21003.0, 13733.0, 8768.0, 5817.0, 3675.0, 2478.0, 1639.0, 1042.0, 678.0, 489.0, 280.0, 215.0, 127.0, 92.0, 57.0, 35.0, 20.0, 22.0, 9.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.15625, -3.0579833984375, -2.959716796875, -2.8614501953125, -2.76318359375, -2.6649169921875, -2.566650390625, -2.4683837890625, -2.3701171875, -2.2718505859375, -2.173583984375, -2.0753173828125, -1.97705078125, -1.8787841796875, -1.780517578125, -1.6822509765625, -1.583984375, -1.4857177734375, -1.387451171875, -1.2891845703125, -1.19091796875, -1.0926513671875, -0.994384765625, -0.8961181640625, -0.7978515625, -0.6995849609375, -0.601318359375, -0.5030517578125, -0.40478515625, -0.3065185546875, -0.208251953125, -0.1099853515625, -0.01171875, 0.0865478515625, 0.184814453125, 0.2830810546875, 0.38134765625, 0.4796142578125, 0.577880859375, 0.6761474609375, 0.7744140625, 0.8726806640625, 0.970947265625, 1.0692138671875, 1.16748046875, 1.2657470703125, 1.364013671875, 1.4622802734375, 1.560546875, 1.6588134765625, 1.757080078125, 1.8553466796875, 1.95361328125, 2.0518798828125, 2.150146484375, 2.2484130859375, 2.3466796875, 2.4449462890625, 2.543212890625, 2.6414794921875, 2.73974609375, 2.8380126953125, 2.936279296875, 3.0345458984375, 3.1328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 9.0, 9.0, 14.0, 15.0, 23.0, 24.0, 25.0, 27.0, 38.0, 43.0, 35.0, 42.0, 37.0, 41.0, 39.0, 49.0, 52.0, 48.0, 38.0, 42.0, 39.0, 37.0, 26.0, 32.0, 25.0, 25.0, 20.0, 21.0, 18.0, 12.0, 13.0, 8.0, 13.0, 9.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0003399848937988281, -0.0003300197422504425, -0.0003200545907020569, -0.00031008943915367126, -0.00030012428760528564, -0.0002901591360569, -0.0002801939845085144, -0.0002702288329601288, -0.00026026368141174316, -0.00025029852986335754, -0.00024033337831497192, -0.0002303682267665863, -0.00022040307521820068, -0.00021043792366981506, -0.00020047277212142944, -0.00019050762057304382, -0.0001805424690246582, -0.00017057731747627258, -0.00016061216592788696, -0.00015064701437950134, -0.00014068186283111572, -0.0001307167112827301, -0.00012075155973434448, -0.00011078640818595886, -0.00010082125663757324, -9.085610508918762e-05, -8.0890953540802e-05, -7.092580199241638e-05, -6.096065044403076e-05, -5.099549889564514e-05, -4.103034734725952e-05, -3.10651957988739e-05, -2.110004425048828e-05, -1.1134892702102661e-05, -1.169741153717041e-06, 8.795410394668579e-06, 1.87605619430542e-05, 2.872571349143982e-05, 3.869086503982544e-05, 4.865601658821106e-05, 5.862116813659668e-05, 6.85863196849823e-05, 7.855147123336792e-05, 8.851662278175354e-05, 9.848177433013916e-05, 0.00010844692587852478, 0.0001184120774269104, 0.00012837722897529602, 0.00013834238052368164, 0.00014830753207206726, 0.00015827268362045288, 0.0001682378351688385, 0.00017820298671722412, 0.00018816813826560974, 0.00019813328981399536, 0.00020809844136238098, 0.0002180635929107666, 0.00022802874445915222, 0.00023799389600753784, 0.00024795904755592346, 0.0002579241991043091, 0.0002678893506526947, 0.0002778545022010803, 0.00028781965374946594, 0.00029778480529785156]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 10.0, 10.0, 22.0, 33.0, 54.0, 76.0, 156.0, 209.0, 341.0, 463.0, 782.0, 1149.0, 1882.0, 3068.0, 4887.0, 7701.0, 12180.0, 19339.0, 30172.0, 45352.0, 65505.0, 89005.0, 111255.0, 126429.0, 126897.0, 112727.0, 90685.0, 66856.0, 46383.0, 30343.0, 19823.0, 12969.0, 8122.0, 5074.0, 3123.0, 1968.0, 1286.0, 797.0, 509.0, 332.0, 187.0, 130.0, 87.0, 64.0, 46.0, 17.0, 13.0, 16.0, 2.0, 7.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.072265625, -2.969970703125, -2.86767578125, -2.765380859375, -2.6630859375, -2.560791015625, -2.45849609375, -2.356201171875, -2.25390625, -2.151611328125, -2.04931640625, -1.947021484375, -1.8447265625, -1.742431640625, -1.64013671875, -1.537841796875, -1.435546875, -1.333251953125, -1.23095703125, -1.128662109375, -1.0263671875, -0.924072265625, -0.82177734375, -0.719482421875, -0.6171875, -0.514892578125, -0.41259765625, -0.310302734375, -0.2080078125, -0.105712890625, -0.00341796875, 0.098876953125, 0.201171875, 0.303466796875, 0.40576171875, 0.508056640625, 0.6103515625, 0.712646484375, 0.81494140625, 0.917236328125, 1.01953125, 1.121826171875, 1.22412109375, 1.326416015625, 1.4287109375, 1.531005859375, 1.63330078125, 1.735595703125, 1.837890625, 1.940185546875, 2.04248046875, 2.144775390625, 2.2470703125, 2.349365234375, 2.45166015625, 2.553955078125, 2.65625, 2.758544921875, 2.86083984375, 2.963134765625, 3.0654296875, 3.167724609375, 3.27001953125, 3.372314453125, 3.474609375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 8.0, 10.0, 9.0, 14.0, 18.0, 15.0, 21.0, 19.0, 35.0, 38.0, 43.0, 52.0, 56.0, 51.0, 65.0, 62.0, 44.0, 49.0, 48.0, 50.0, 48.0, 51.0, 29.0, 30.0, 26.0, 22.0, 23.0, 14.0, 15.0, 6.0, 8.0, 0.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.6157379150390625, -1.559600830078125, -1.5034637451171875, -1.44732666015625, -1.3911895751953125, -1.335052490234375, -1.2789154052734375, -1.2227783203125, -1.1666412353515625, -1.110504150390625, -1.0543670654296875, -0.99822998046875, -0.9420928955078125, -0.885955810546875, -0.8298187255859375, -0.773681640625, -0.7175445556640625, -0.661407470703125, -0.6052703857421875, -0.54913330078125, -0.4929962158203125, -0.436859130859375, -0.3807220458984375, -0.3245849609375, -0.2684478759765625, -0.212310791015625, -0.1561737060546875, -0.10003662109375, -0.0438995361328125, 0.012237548828125, 0.0683746337890625, 0.12451171875, 0.1806488037109375, 0.236785888671875, 0.2929229736328125, 0.34906005859375, 0.4051971435546875, 0.461334228515625, 0.5174713134765625, 0.5736083984375, 0.6297454833984375, 0.685882568359375, 0.7420196533203125, 0.79815673828125, 0.8542938232421875, 0.910430908203125, 0.9665679931640625, 1.022705078125, 1.0788421630859375, 1.134979248046875, 1.1911163330078125, 1.24725341796875, 1.3033905029296875, 1.359527587890625, 1.4156646728515625, 1.4718017578125, 1.5279388427734375, 1.584075927734375, 1.6402130126953125, 1.69635009765625, 1.7524871826171875, 1.808624267578125, 1.8647613525390625, 1.9208984375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 6.0, 13.0, 18.0, 22.0, 25.0, 28.0, 37.0, 39.0, 44.0, 56.0, 52.0, 65.0, 41.0, 73.0, 66.0, 67.0, 52.0, 48.0, 32.0, 29.0, 29.0, 32.0, 18.0, 24.0, 15.0, 14.0, 8.0, 8.0, 6.0, 3.0, 3.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-22.756816864013672, -22.167016983032227, -21.57721519470215, -20.987415313720703, -20.397613525390625, -19.80781364440918, -19.2180118560791, -18.628211975097656, -18.038410186767578, -17.448610305786133, -16.858808517456055, -16.26900863647461, -15.679206848144531, -15.089406967163086, -14.499606132507324, -13.909805297851562, -13.320005416870117, -12.730204582214355, -12.140403747558594, -11.550602912902832, -10.96080207824707, -10.371002197265625, -9.781201362609863, -9.191400527954102, -8.60159969329834, -8.011798858642578, -7.421998023986816, -6.832197666168213, -6.242396831512451, -5.6525959968566895, -5.062795639038086, -4.472994804382324, -3.8831958770751953, -3.2933950424194336, -2.703594446182251, -2.1137938499450684, -1.5239930152893066, -0.9341921806335449, -0.3443915843963623, 0.2454090118408203, 0.835209846496582, 1.4250105619430542, 2.0148112773895264, 2.604611873626709, 3.1944127082824707, 3.7842135429382324, 4.374013900756836, 4.963814735412598, 5.553615570068359, 6.143416404724121, 6.733217239379883, 7.323017597198486, 7.912818431854248, 8.502618789672852, 9.092419624328613, 9.682220458984375, 10.272021293640137, 10.861822128295898, 11.45162296295166, 12.041423797607422, 12.631223678588867, 13.221025466918945, 13.81082534790039, 14.400626182556152, 14.990427017211914]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 8.0, 4.0, 9.0, 9.0, 14.0, 15.0, 18.0, 21.0, 22.0, 24.0, 23.0, 27.0, 30.0, 28.0, 46.0, 27.0, 43.0, 29.0, 47.0, 38.0, 38.0, 42.0, 30.0, 31.0, 40.0, 26.0, 24.0, 33.0, 34.0, 33.0, 23.0, 19.0, 22.0, 18.0, 15.0, 12.0, 14.0, 10.0, 10.0, 3.0, 7.0, 3.0, 4.0, 5.0, 5.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.034360885620117, -15.506206512451172, -14.978053092956543, -14.449899673461914, -13.921745300292969, -13.393590927124023, -12.865437507629395, -12.337284088134766, -11.80912971496582, -11.280975341796875, -10.752821922302246, -10.224668502807617, -9.696514129638672, -9.168359756469727, -8.640206336975098, -8.112052917480469, -7.583898544311523, -7.055744647979736, -6.527590751647949, -5.999436855316162, -5.471282958984375, -4.943129062652588, -4.414975166320801, -3.8868212699890137, -3.3586673736572266, -2.8305134773254395, -2.3023595809936523, -1.7742056846618652, -1.2460517883300781, -0.717897891998291, -0.1897439956665039, 0.3384099006652832, 0.8665637969970703, 1.3947176933288574, 1.9228715896606445, 2.4510254859924316, 2.9791793823242188, 3.507333278656006, 4.035487174987793, 4.56364107131958, 5.091794967651367, 5.619948863983154, 6.148102760314941, 6.6762566566467285, 7.204410552978516, 7.732564449310303, 8.26071834564209, 8.788871765136719, 9.317026138305664, 9.84518051147461, 10.373333930969238, 10.901487350463867, 11.429641723632812, 11.957796096801758, 12.485949516296387, 13.014102935791016, 13.542257308959961, 14.070411682128906, 14.598565101623535, 15.126718521118164, 15.65487289428711, 16.183027267456055, 16.711181640625, 17.239334106445312, 17.767488479614258]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 11.0, 8.0, 14.0, 21.0, 30.0, 53.0, 98.0, 154.0, 238.0, 376.0, 625.0, 982.0, 1464.0, 2464.0, 3905.0, 6419.0, 10538.0, 16949.0, 27872.0, 46007.0, 75811.0, 124776.0, 203870.0, 320333.0, 469743.0, 603160.0, 639572.0, 552049.0, 403279.0, 263844.0, 163962.0, 99339.0, 60853.0, 36315.0, 22232.0, 13777.0, 8508.0, 5283.0, 3354.0, 2059.0, 1362.0, 894.0, 614.0, 367.0, 245.0, 179.0, 99.0, 54.0, 43.0, 30.0, 22.0, 15.0, 10.0, 3.0, 2.0, 4.0, 0.0, 4.0], "bins": [-12.9765625, -12.57470703125, -12.1728515625, -11.77099609375, -11.369140625, -10.96728515625, -10.5654296875, -10.16357421875, -9.76171875, -9.35986328125, -8.9580078125, -8.55615234375, -8.154296875, -7.75244140625, -7.3505859375, -6.94873046875, -6.546875, -6.14501953125, -5.7431640625, -5.34130859375, -4.939453125, -4.53759765625, -4.1357421875, -3.73388671875, -3.33203125, -2.93017578125, -2.5283203125, -2.12646484375, -1.724609375, -1.32275390625, -0.9208984375, -0.51904296875, -0.1171875, 0.28466796875, 0.6865234375, 1.08837890625, 1.490234375, 1.89208984375, 2.2939453125, 2.69580078125, 3.09765625, 3.49951171875, 3.9013671875, 4.30322265625, 4.705078125, 5.10693359375, 5.5087890625, 5.91064453125, 6.3125, 6.71435546875, 7.1162109375, 7.51806640625, 7.919921875, 8.32177734375, 8.7236328125, 9.12548828125, 9.52734375, 9.92919921875, 10.3310546875, 10.73291015625, 11.134765625, 11.53662109375, 11.9384765625, 12.34033203125, 12.7421875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 9.0, 5.0, 6.0, 6.0, 11.0, 8.0, 10.0, 8.0, 13.0, 14.0, 20.0, 20.0, 31.0, 28.0, 41.0, 31.0, 36.0, 30.0, 29.0, 43.0, 40.0, 54.0, 45.0, 49.0, 34.0, 36.0, 33.0, 37.0, 27.0, 25.0, 38.0, 32.0, 23.0, 21.0, 30.0, 13.0, 17.0, 10.0, 7.0, 11.0, 8.0, 6.0, 2.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0377197265625, -11.630126953125, -11.2225341796875, -10.81494140625, -10.4073486328125, -9.999755859375, -9.5921630859375, -9.1845703125, -8.7769775390625, -8.369384765625, -7.9617919921875, -7.55419921875, -7.1466064453125, -6.739013671875, -6.3314208984375, -5.923828125, -5.5162353515625, -5.108642578125, -4.7010498046875, -4.29345703125, -3.8858642578125, -3.478271484375, -3.0706787109375, -2.6630859375, -2.2554931640625, -1.847900390625, -1.4403076171875, -1.03271484375, -0.6251220703125, -0.217529296875, 0.1900634765625, 0.59765625, 1.0052490234375, 1.412841796875, 1.8204345703125, 2.22802734375, 2.6356201171875, 3.043212890625, 3.4508056640625, 3.8583984375, 4.2659912109375, 4.673583984375, 5.0811767578125, 5.48876953125, 5.8963623046875, 6.303955078125, 6.7115478515625, 7.119140625, 7.5267333984375, 7.934326171875, 8.3419189453125, 8.74951171875, 9.1571044921875, 9.564697265625, 9.9722900390625, 10.3798828125, 10.7874755859375, 11.195068359375, 11.6026611328125, 12.01025390625, 12.4178466796875, 12.825439453125, 13.2330322265625, 13.640625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 9.0, 7.0, 30.0, 23.0, 43.0, 64.0, 109.0, 171.0, 234.0, 364.0, 618.0, 913.0, 1512.0, 2402.0, 3873.0, 6371.0, 10112.0, 15989.0, 26361.0, 41700.0, 65244.0, 101679.0, 152273.0, 221742.0, 302827.0, 388768.0, 459167.0, 491591.0, 470515.0, 404453.0, 320326.0, 236419.0, 164116.0, 110222.0, 72325.0, 45981.0, 28813.0, 17818.0, 11191.0, 6727.0, 4207.0, 2585.0, 1587.0, 990.0, 701.0, 401.0, 250.0, 178.0, 115.0, 60.0, 45.0, 22.0, 16.0, 16.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.8125, -9.4918212890625, -9.171142578125, -8.8504638671875, -8.52978515625, -8.2091064453125, -7.888427734375, -7.5677490234375, -7.2470703125, -6.9263916015625, -6.605712890625, -6.2850341796875, -5.96435546875, -5.6436767578125, -5.322998046875, -5.0023193359375, -4.681640625, -4.3609619140625, -4.040283203125, -3.7196044921875, -3.39892578125, -3.0782470703125, -2.757568359375, -2.4368896484375, -2.1162109375, -1.7955322265625, -1.474853515625, -1.1541748046875, -0.83349609375, -0.5128173828125, -0.192138671875, 0.1285400390625, 0.44921875, 0.7698974609375, 1.090576171875, 1.4112548828125, 1.73193359375, 2.0526123046875, 2.373291015625, 2.6939697265625, 3.0146484375, 3.3353271484375, 3.656005859375, 3.9766845703125, 4.29736328125, 4.6180419921875, 4.938720703125, 5.2593994140625, 5.580078125, 5.9007568359375, 6.221435546875, 6.5421142578125, 6.86279296875, 7.1834716796875, 7.504150390625, 7.8248291015625, 8.1455078125, 8.4661865234375, 8.786865234375, 9.1075439453125, 9.42822265625, 9.7489013671875, 10.069580078125, 10.3902587890625, 10.7109375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 12.0, 5.0, 7.0, 14.0, 19.0, 30.0, 32.0, 34.0, 50.0, 63.0, 48.0, 80.0, 82.0, 114.0, 106.0, 146.0, 171.0, 210.0, 187.0, 194.0, 209.0, 213.0, 226.0, 221.0, 192.0, 207.0, 197.0, 150.0, 143.0, 119.0, 118.0, 84.0, 72.0, 70.0, 68.0, 34.0, 31.0, 22.0, 22.0, 20.0, 17.0, 7.0, 4.0, 7.0, 3.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.40625, -6.22210693359375, -6.0379638671875, -5.85382080078125, -5.669677734375, -5.48553466796875, -5.3013916015625, -5.11724853515625, -4.93310546875, -4.74896240234375, -4.5648193359375, -4.38067626953125, -4.196533203125, -4.01239013671875, -3.8282470703125, -3.64410400390625, -3.4599609375, -3.27581787109375, -3.0916748046875, -2.90753173828125, -2.723388671875, -2.53924560546875, -2.3551025390625, -2.17095947265625, -1.98681640625, -1.80267333984375, -1.6185302734375, -1.43438720703125, -1.250244140625, -1.06610107421875, -0.8819580078125, -0.69781494140625, -0.513671875, -0.32952880859375, -0.1453857421875, 0.03875732421875, 0.222900390625, 0.40704345703125, 0.5911865234375, 0.77532958984375, 0.95947265625, 1.14361572265625, 1.3277587890625, 1.51190185546875, 1.696044921875, 1.88018798828125, 2.0643310546875, 2.24847412109375, 2.4326171875, 2.61676025390625, 2.8009033203125, 2.98504638671875, 3.169189453125, 3.35333251953125, 3.5374755859375, 3.72161865234375, 3.90576171875, 4.08990478515625, 4.2740478515625, 4.45819091796875, 4.642333984375, 4.82647705078125, 5.0106201171875, 5.19476318359375, 5.37890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 8.0, 6.0, 6.0, 11.0, 13.0, 11.0, 24.0, 28.0, 20.0, 30.0, 36.0, 25.0, 31.0, 40.0, 44.0, 40.0, 49.0, 50.0, 53.0, 47.0, 46.0, 40.0, 39.0, 46.0, 40.0, 40.0, 27.0, 35.0, 19.0, 14.0, 13.0, 12.0, 6.0, 10.0, 6.0, 6.0, 9.0, 4.0, 1.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.15737247467041, -11.751374244689941, -11.345376014709473, -10.939377784729004, -10.533379554748535, -10.127381324768066, -9.721382141113281, -9.315383911132812, -8.909385681152344, -8.503387451171875, -8.097389221191406, -7.6913909912109375, -7.285392761230469, -6.87939453125, -6.473395824432373, -6.067397594451904, -5.661399841308594, -5.255401611328125, -4.849403381347656, -4.4434051513671875, -4.037406921386719, -3.631408452987671, -3.225409984588623, -2.8194117546081543, -2.4134135246276855, -2.007415294647217, -1.6014169454574585, -1.1954185962677002, -0.7894203662872314, -0.3834221363067627, 0.022576332092285156, 0.4285745620727539, 0.8345727920532227, 1.2405710220336914, 1.6465693712234497, 2.052567720413208, 2.4585659503936768, 2.8645641803741455, 3.2705626487731934, 3.676560878753662, 4.082559108734131, 4.4885573387146, 4.894555568695068, 5.300554275512695, 5.706552505493164, 6.112550735473633, 6.518548965454102, 6.92454719543457, 7.330545425415039, 7.736543655395508, 8.142541885375977, 8.548540115356445, 8.954538345336914, 9.360536575317383, 9.766534805297852, 10.17253303527832, 10.578531265258789, 10.984529495239258, 11.390527725219727, 11.796525955200195, 12.202524185180664, 12.608522415161133, 13.014520645141602, 13.42051887512207, 13.826518058776855]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 14.0, 13.0, 19.0, 17.0, 16.0, 21.0, 25.0, 29.0, 23.0, 28.0, 23.0, 37.0, 49.0, 36.0, 46.0, 45.0, 49.0, 30.0, 49.0, 41.0, 42.0, 39.0, 24.0, 36.0, 35.0, 27.0, 32.0, 33.0, 19.0, 11.0, 11.0, 18.0, 12.0, 8.0, 9.0, 7.0, 4.0, 5.0, 1.0, 6.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.665420532226562, -16.176895141601562, -15.688370704650879, -15.199845314025879, -14.711319923400879, -14.222795486450195, -13.734270095825195, -13.245744705200195, -12.757219314575195, -12.268693923950195, -11.780169486999512, -11.291644096374512, -10.803118705749512, -10.314594268798828, -9.826068878173828, -9.337543487548828, -8.849018096923828, -8.360492706298828, -7.871967792510986, -7.3834428787231445, -6.8949174880981445, -6.406392574310303, -5.917867660522461, -5.429342269897461, -4.940817832946777, -4.4522929191589355, -3.9637675285339355, -3.4752426147460938, -2.9867172241210938, -2.498192310333252, -2.009667158126831, -1.5211420059204102, -1.0326166152954102, -0.5440914630889893, -0.055566370487213135, 0.432958722114563, 0.9214838743209839, 1.4100089073181152, 1.8985340595245361, 2.387059211730957, 2.875584363937378, 3.364109516143799, 3.8526346683502197, 4.341159820556641, 4.829684734344482, 5.318209648132324, 5.806735038757324, 6.295260429382324, 6.783785343170166, 7.272310256958008, 7.760835647583008, 8.249361038208008, 8.737885475158691, 9.226410865783691, 9.714936256408691, 10.203460693359375, 10.691986083984375, 11.180511474609375, 11.669035911560059, 12.157561302185059, 12.646086692810059, 13.134611129760742, 13.623136520385742, 14.111661911010742, 14.600187301635742]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 9.0, 8.0, 17.0, 12.0, 35.0, 40.0, 66.0, 77.0, 126.0, 206.0, 284.0, 435.0, 692.0, 1026.0, 1693.0, 2556.0, 4058.0, 6698.0, 10700.0, 16810.0, 26669.0, 42161.0, 65510.0, 98287.0, 140848.0, 169706.0, 150923.0, 108279.0, 72413.0, 46922.0, 30198.0, 19048.0, 11784.0, 7329.0, 4643.0, 2884.0, 1909.0, 1160.0, 800.0, 516.0, 340.0, 213.0, 159.0, 92.0, 60.0, 53.0, 33.0, 24.0, 16.0, 9.0, 13.0, 7.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-2.501953125, -2.425262451171875, -2.34857177734375, -2.271881103515625, -2.1951904296875, -2.118499755859375, -2.04180908203125, -1.965118408203125, -1.888427734375, -1.811737060546875, -1.73504638671875, -1.658355712890625, -1.5816650390625, -1.504974365234375, -1.42828369140625, -1.351593017578125, -1.27490234375, -1.198211669921875, -1.12152099609375, -1.044830322265625, -0.9681396484375, -0.891448974609375, -0.81475830078125, -0.738067626953125, -0.661376953125, -0.584686279296875, -0.50799560546875, -0.431304931640625, -0.3546142578125, -0.277923583984375, -0.20123291015625, -0.124542236328125, -0.0478515625, 0.028839111328125, 0.10552978515625, 0.182220458984375, 0.2589111328125, 0.335601806640625, 0.41229248046875, 0.488983154296875, 0.565673828125, 0.642364501953125, 0.71905517578125, 0.795745849609375, 0.8724365234375, 0.949127197265625, 1.02581787109375, 1.102508544921875, 1.17919921875, 1.255889892578125, 1.33258056640625, 1.409271240234375, 1.4859619140625, 1.562652587890625, 1.63934326171875, 1.716033935546875, 1.792724609375, 1.869415283203125, 1.94610595703125, 2.022796630859375, 2.0994873046875, 2.176177978515625, 2.25286865234375, 2.329559326171875, 2.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 4.0, 6.0, 17.0, 21.0, 17.0, 18.0, 24.0, 27.0, 25.0, 28.0, 28.0, 38.0, 38.0, 34.0, 46.0, 39.0, 46.0, 47.0, 26.0, 51.0, 52.0, 32.0, 39.0, 36.0, 38.0, 37.0, 30.0, 30.0, 17.0, 15.0, 12.0, 9.0, 15.0, 10.0, 8.0, 3.0, 9.0, 3.0, 6.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.171875, -16.6766357421875, -16.181396484375, -15.6861572265625, -15.19091796875, -14.6956787109375, -14.200439453125, -13.7052001953125, -13.2099609375, -12.7147216796875, -12.219482421875, -11.7242431640625, -11.22900390625, -10.7337646484375, -10.238525390625, -9.7432861328125, -9.248046875, -8.7528076171875, -8.257568359375, -7.7623291015625, -7.26708984375, -6.7718505859375, -6.276611328125, -5.7813720703125, -5.2861328125, -4.7908935546875, -4.295654296875, -3.8004150390625, -3.30517578125, -2.8099365234375, -2.314697265625, -1.8194580078125, -1.32421875, -0.8289794921875, -0.333740234375, 0.1614990234375, 0.65673828125, 1.1519775390625, 1.647216796875, 2.1424560546875, 2.6376953125, 3.1329345703125, 3.628173828125, 4.1234130859375, 4.61865234375, 5.1138916015625, 5.609130859375, 6.1043701171875, 6.599609375, 7.0948486328125, 7.590087890625, 8.0853271484375, 8.58056640625, 9.0758056640625, 9.571044921875, 10.0662841796875, 10.5615234375, 11.0567626953125, 11.552001953125, 12.0472412109375, 12.54248046875, 13.0377197265625, 13.532958984375, 14.0281982421875, 14.5234375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 20.0, 17.0, 19.0, 31.0, 38.0, 61.0, 61.0, 109.0, 137.0, 191.0, 301.0, 350.0, 502.0, 798.0, 1375.0, 2519.0, 5351.0, 12104.0, 29833.0, 870187.0, 78539.0, 24999.0, 10399.0, 4645.0, 2232.0, 1250.0, 759.0, 499.0, 364.0, 257.0, 165.0, 112.0, 79.0, 64.0, 48.0, 39.0, 24.0, 27.0, 13.0, 12.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.87890625, -7.63201904296875, -7.3851318359375, -7.13824462890625, -6.891357421875, -6.64447021484375, -6.3975830078125, -6.15069580078125, -5.90380859375, -5.65692138671875, -5.4100341796875, -5.16314697265625, -4.916259765625, -4.66937255859375, -4.4224853515625, -4.17559814453125, -3.9287109375, -3.68182373046875, -3.4349365234375, -3.18804931640625, -2.941162109375, -2.69427490234375, -2.4473876953125, -2.20050048828125, -1.95361328125, -1.70672607421875, -1.4598388671875, -1.21295166015625, -0.966064453125, -0.71917724609375, -0.4722900390625, -0.22540283203125, 0.021484375, 0.26837158203125, 0.5152587890625, 0.76214599609375, 1.009033203125, 1.25592041015625, 1.5028076171875, 1.74969482421875, 1.99658203125, 2.24346923828125, 2.4903564453125, 2.73724365234375, 2.984130859375, 3.23101806640625, 3.4779052734375, 3.72479248046875, 3.9716796875, 4.21856689453125, 4.4654541015625, 4.71234130859375, 4.959228515625, 5.20611572265625, 5.4530029296875, 5.69989013671875, 5.94677734375, 6.19366455078125, 6.4405517578125, 6.68743896484375, 6.934326171875, 7.18121337890625, 7.4281005859375, 7.67498779296875, 7.921875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 12.0, 18.0, 14.0, 16.0, 24.0, 22.0, 24.0, 26.0, 37.0, 42.0, 40.0, 46.0, 46.0, 49.0, 49.0, 36.0, 44.0, 34.0, 33.0, 40.0, 37.0, 38.0, 32.0, 22.0, 20.0, 27.0, 31.0, 20.0, 13.0, 9.0, 13.0, 15.0, 11.0, 8.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.40478515625, -10.0595703125, -9.71435546875, -9.369140625, -9.02392578125, -8.6787109375, -8.33349609375, -7.98828125, -7.64306640625, -7.2978515625, -6.95263671875, -6.607421875, -6.26220703125, -5.9169921875, -5.57177734375, -5.2265625, -4.88134765625, -4.5361328125, -4.19091796875, -3.845703125, -3.50048828125, -3.1552734375, -2.81005859375, -2.46484375, -2.11962890625, -1.7744140625, -1.42919921875, -1.083984375, -0.73876953125, -0.3935546875, -0.04833984375, 0.296875, 0.64208984375, 0.9873046875, 1.33251953125, 1.677734375, 2.02294921875, 2.3681640625, 2.71337890625, 3.05859375, 3.40380859375, 3.7490234375, 4.09423828125, 4.439453125, 4.78466796875, 5.1298828125, 5.47509765625, 5.8203125, 6.16552734375, 6.5107421875, 6.85595703125, 7.201171875, 7.54638671875, 7.8916015625, 8.23681640625, 8.58203125, 8.92724609375, 9.2724609375, 9.61767578125, 9.962890625, 10.30810546875, 10.6533203125, 10.99853515625, 11.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 10.0, 18.0, 31.0, 23.0, 40.0, 58.0, 90.0, 99.0, 155.0, 225.0, 332.0, 505.0, 767.0, 1461.0, 2815.0, 6685.0, 20603.0, 930662.0, 61614.0, 12449.0, 4656.0, 2081.0, 1158.0, 581.0, 443.0, 282.0, 190.0, 147.0, 91.0, 65.0, 62.0, 36.0, 25.0, 23.0, 16.0, 9.0, 8.0, 7.0, 2.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.451171875, -2.374114990234375, -2.29705810546875, -2.220001220703125, -2.1429443359375, -2.065887451171875, -1.98883056640625, -1.911773681640625, -1.834716796875, -1.757659912109375, -1.68060302734375, -1.603546142578125, -1.5264892578125, -1.449432373046875, -1.37237548828125, -1.295318603515625, -1.21826171875, -1.141204833984375, -1.06414794921875, -0.987091064453125, -0.9100341796875, -0.832977294921875, -0.75592041015625, -0.678863525390625, -0.601806640625, -0.524749755859375, -0.44769287109375, -0.370635986328125, -0.2935791015625, -0.216522216796875, -0.13946533203125, -0.062408447265625, 0.0146484375, 0.091705322265625, 0.16876220703125, 0.245819091796875, 0.3228759765625, 0.399932861328125, 0.47698974609375, 0.554046630859375, 0.631103515625, 0.708160400390625, 0.78521728515625, 0.862274169921875, 0.9393310546875, 1.016387939453125, 1.09344482421875, 1.170501708984375, 1.24755859375, 1.324615478515625, 1.40167236328125, 1.478729248046875, 1.5557861328125, 1.632843017578125, 1.70989990234375, 1.786956787109375, 1.864013671875, 1.941070556640625, 2.01812744140625, 2.095184326171875, 2.1722412109375, 2.249298095703125, 2.32635498046875, 2.403411865234375, 2.48046875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 10.0, 11.0, 8.0, 10.0, 14.0, 16.0, 24.0, 15.0, 26.0, 39.0, 27.0, 44.0, 34.0, 51.0, 54.0, 58.0, 51.0, 69.0, 50.0, 41.0, 38.0, 46.0, 45.0, 28.0, 34.0, 21.0, 25.0, 20.0, 14.0, 13.0, 13.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 6.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3887882232666016e-05, -1.3459473848342896e-05, -1.3031065464019775e-05, -1.2602657079696655e-05, -1.2174248695373535e-05, -1.1745840311050415e-05, -1.1317431926727295e-05, -1.0889023542404175e-05, -1.0460615158081055e-05, -1.0032206773757935e-05, -9.603798389434814e-06, -9.175390005111694e-06, -8.746981620788574e-06, -8.318573236465454e-06, -7.890164852142334e-06, -7.461756467819214e-06, -7.033348083496094e-06, -6.604939699172974e-06, -6.1765313148498535e-06, -5.748122930526733e-06, -5.319714546203613e-06, -4.891306161880493e-06, -4.462897777557373e-06, -4.034489393234253e-06, -3.606081008911133e-06, -3.1776726245880127e-06, -2.7492642402648926e-06, -2.3208558559417725e-06, -1.8924474716186523e-06, -1.4640390872955322e-06, -1.0356307029724121e-06, -6.07222318649292e-07, -1.7881393432617188e-07, 2.4959444999694824e-07, 6.780028343200684e-07, 1.1064112186431885e-06, 1.5348196029663086e-06, 1.9632279872894287e-06, 2.391636371612549e-06, 2.820044755935669e-06, 3.248453140258789e-06, 3.676861524581909e-06, 4.105269908905029e-06, 4.533678293228149e-06, 4.9620866775512695e-06, 5.39049506187439e-06, 5.81890344619751e-06, 6.24731183052063e-06, 6.67572021484375e-06, 7.10412859916687e-06, 7.53253698348999e-06, 7.96094536781311e-06, 8.38935375213623e-06, 8.81776213645935e-06, 9.24617052078247e-06, 9.67457890510559e-06, 1.0102987289428711e-05, 1.0531395673751831e-05, 1.0959804058074951e-05, 1.1388212442398071e-05, 1.1816620826721191e-05, 1.2245029211044312e-05, 1.2673437595367432e-05, 1.3101845979690552e-05, 1.3530254364013672e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 17.0, 15.0, 14.0, 27.0, 55.0, 69.0, 109.0, 130.0, 201.0, 296.0, 462.0, 740.0, 1075.0, 1419.0, 2236.0, 3307.0, 4888.0, 7310.0, 10794.0, 15925.0, 24399.0, 37233.0, 59305.0, 98802.0, 195931.0, 257535.0, 124393.0, 71178.0, 44543.0, 28811.0, 18983.0, 12346.0, 8504.0, 5638.0, 3892.0, 2589.0, 1736.0, 1143.0, 796.0, 559.0, 375.0, 231.0, 176.0, 112.0, 87.0, 54.0, 42.0, 28.0, 15.0, 9.0, 7.0, 5.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.6796875, -0.659210205078125, -0.63873291015625, -0.618255615234375, -0.5977783203125, -0.577301025390625, -0.55682373046875, -0.536346435546875, -0.515869140625, -0.495391845703125, -0.47491455078125, -0.454437255859375, -0.4339599609375, -0.413482666015625, -0.39300537109375, -0.372528076171875, -0.35205078125, -0.331573486328125, -0.31109619140625, -0.290618896484375, -0.2701416015625, -0.249664306640625, -0.22918701171875, -0.208709716796875, -0.188232421875, -0.167755126953125, -0.14727783203125, -0.126800537109375, -0.1063232421875, -0.085845947265625, -0.06536865234375, -0.044891357421875, -0.0244140625, -0.003936767578125, 0.01654052734375, 0.037017822265625, 0.0574951171875, 0.077972412109375, 0.09844970703125, 0.118927001953125, 0.139404296875, 0.159881591796875, 0.18035888671875, 0.200836181640625, 0.2213134765625, 0.241790771484375, 0.26226806640625, 0.282745361328125, 0.30322265625, 0.323699951171875, 0.34417724609375, 0.364654541015625, 0.3851318359375, 0.405609130859375, 0.42608642578125, 0.446563720703125, 0.467041015625, 0.487518310546875, 0.50799560546875, 0.528472900390625, 0.5489501953125, 0.569427490234375, 0.58990478515625, 0.610382080078125, 0.630859375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 2.0, 2.0, 7.0, 12.0, 14.0, 23.0, 20.0, 15.0, 11.0, 19.0, 19.0, 31.0, 34.0, 33.0, 41.0, 38.0, 36.0, 35.0, 50.0, 41.0, 39.0, 49.0, 40.0, 43.0, 45.0, 45.0, 20.0, 27.0, 22.0, 35.0, 20.0, 19.0, 19.0, 14.0, 22.0, 11.0, 6.0, 7.0, 5.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.405517578125, -0.39243316650390625, -0.3793487548828125, -0.36626434326171875, -0.353179931640625, -0.34009552001953125, -0.3270111083984375, -0.31392669677734375, -0.30084228515625, -0.28775787353515625, -0.2746734619140625, -0.26158905029296875, -0.248504638671875, -0.23542022705078125, -0.2223358154296875, -0.20925140380859375, -0.1961669921875, -0.18308258056640625, -0.1699981689453125, -0.15691375732421875, -0.143829345703125, -0.13074493408203125, -0.1176605224609375, -0.10457611083984375, -0.09149169921875, -0.07840728759765625, -0.0653228759765625, -0.05223846435546875, -0.039154052734375, -0.02606964111328125, -0.0129852294921875, 9.918212890625e-05, 0.01318359375, 0.02626800537109375, 0.0393524169921875, 0.05243682861328125, 0.065521240234375, 0.07860565185546875, 0.0916900634765625, 0.10477447509765625, 0.11785888671875, 0.13094329833984375, 0.1440277099609375, 0.15711212158203125, 0.170196533203125, 0.18328094482421875, 0.1963653564453125, 0.20944976806640625, 0.2225341796875, 0.23561859130859375, 0.2487030029296875, 0.26178741455078125, 0.274871826171875, 0.28795623779296875, 0.3010406494140625, 0.31412506103515625, 0.32720947265625, 0.34029388427734375, 0.3533782958984375, 0.36646270751953125, 0.379547119140625, 0.39263153076171875, 0.4057159423828125, 0.41880035400390625, 0.431884765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 7.0, 9.0, 8.0, 11.0, 13.0, 18.0, 15.0, 36.0, 24.0, 25.0, 37.0, 35.0, 38.0, 41.0, 48.0, 44.0, 43.0, 61.0, 50.0, 45.0, 43.0, 40.0, 42.0, 47.0, 28.0, 39.0, 29.0, 24.0, 21.0, 11.0, 8.0, 8.0, 10.0, 6.0, 8.0, 8.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.899259567260742, -11.485990524291992, -11.072721481323242, -10.659452438354492, -10.246183395385742, -9.832914352416992, -9.419645309448242, -9.006376266479492, -8.593107223510742, -8.179838180541992, -7.766569137573242, -7.353300094604492, -6.940031051635742, -6.526762008666992, -6.113492965698242, -5.700223922729492, -5.286954879760742, -4.873685836791992, -4.460416793823242, -4.047147750854492, -3.633878707885742, -3.220609664916992, -2.807340621948242, -2.394071578979492, -1.9808025360107422, -1.5675334930419922, -1.1542644500732422, -0.7409954071044922, -0.3277263641357422, 0.08554267883300781, 0.4988117218017578, 0.9120807647705078, 1.3253498077392578, 1.7386188507080078, 2.151887893676758, 2.565156936645508, 2.978425979614258, 3.391695022583008, 3.804964065551758, 4.218233108520508, 4.631502151489258, 5.044771194458008, 5.458040237426758, 5.871309280395508, 6.284578323364258, 6.697847366333008, 7.111116409301758, 7.524385452270508, 7.937654495239258, 8.350923538208008, 8.764192581176758, 9.177461624145508, 9.590730667114258, 10.003999710083008, 10.417268753051758, 10.830537796020508, 11.243806838989258, 11.657075881958008, 12.070344924926758, 12.483613967895508, 12.896883010864258, 13.310152053833008, 13.723421096801758, 14.136690139770508, 14.549959182739258]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 7.0, 12.0, 17.0, 17.0, 17.0, 20.0, 16.0, 32.0, 17.0, 31.0, 27.0, 26.0, 36.0, 48.0, 37.0, 44.0, 50.0, 41.0, 39.0, 46.0, 35.0, 47.0, 33.0, 34.0, 34.0, 30.0, 30.0, 31.0, 31.0, 20.0, 10.0, 14.0, 17.0, 12.0, 7.0, 9.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.59904670715332, -16.11166000366211, -15.624272346496582, -15.136884689331055, -14.649497032165527, -14.162109375, -13.674722671508789, -13.187335014343262, -12.699947357177734, -12.212559700012207, -11.725172996520996, -11.237785339355469, -10.750397682189941, -10.263010025024414, -9.775623321533203, -9.288235664367676, -8.800848960876465, -8.313461303710938, -7.826074123382568, -7.338686943054199, -6.851299285888672, -6.363912105560303, -5.876524925231934, -5.389137268066406, -4.901750087738037, -4.414362907409668, -3.9269752502441406, -3.4395880699157715, -2.9522006511688232, -2.464813232421875, -1.9774260520935059, -1.4900386333465576, -1.0026521682739258, -0.5152648091316223, -0.027877449989318848, 0.45950984954833984, 0.9468972682952881, 1.4342846870422363, 1.9216718673706055, 2.4090592861175537, 2.896446704864502, 3.38383412361145, 3.8712215423583984, 4.358608722686768, 4.845995903015137, 5.333383560180664, 5.820770740509033, 6.308157920837402, 6.79554557800293, 7.282932758331299, 7.770320415496826, 8.257707595825195, 8.745095252990723, 9.23248291015625, 9.719869613647461, 10.207257270812988, 10.694644927978516, 11.182032585144043, 11.669419288635254, 12.156806945800781, 12.644194602966309, 13.131582260131836, 13.618968963623047, 14.106356620788574, 14.593743324279785]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 9.0, 7.0, 7.0, 4.0, 25.0, 32.0, 37.0, 56.0, 90.0, 141.0, 215.0, 340.0, 523.0, 830.0, 1293.0, 1989.0, 3141.0, 4944.0, 7581.0, 12239.0, 19162.0, 29691.0, 45379.0, 65287.0, 89385.0, 111155.0, 126119.0, 126629.0, 113163.0, 90993.0, 66911.0, 46173.0, 30722.0, 19719.0, 12523.0, 7992.0, 5112.0, 3232.0, 2055.0, 1291.0, 836.0, 473.0, 371.0, 263.0, 153.0, 85.0, 66.0, 50.0, 30.0, 16.0, 11.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.40625, -10.0709228515625, -9.735595703125, -9.4002685546875, -9.06494140625, -8.7296142578125, -8.394287109375, -8.0589599609375, -7.7236328125, -7.3883056640625, -7.052978515625, -6.7176513671875, -6.38232421875, -6.0469970703125, -5.711669921875, -5.3763427734375, -5.041015625, -4.7056884765625, -4.370361328125, -4.0350341796875, -3.69970703125, -3.3643798828125, -3.029052734375, -2.6937255859375, -2.3583984375, -2.0230712890625, -1.687744140625, -1.3524169921875, -1.01708984375, -0.6817626953125, -0.346435546875, -0.0111083984375, 0.32421875, 0.6595458984375, 0.994873046875, 1.3302001953125, 1.66552734375, 2.0008544921875, 2.336181640625, 2.6715087890625, 3.0068359375, 3.3421630859375, 3.677490234375, 4.0128173828125, 4.34814453125, 4.6834716796875, 5.018798828125, 5.3541259765625, 5.689453125, 6.0247802734375, 6.360107421875, 6.6954345703125, 7.03076171875, 7.3660888671875, 7.701416015625, 8.0367431640625, 8.3720703125, 8.7073974609375, 9.042724609375, 9.3780517578125, 9.71337890625, 10.0487060546875, 10.384033203125, 10.7193603515625, 11.0546875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 5.0, 9.0, 6.0, 8.0, 20.0, 21.0, 16.0, 14.0, 22.0, 23.0, 29.0, 24.0, 30.0, 35.0, 35.0, 42.0, 43.0, 33.0, 47.0, 32.0, 49.0, 44.0, 40.0, 34.0, 33.0, 40.0, 27.0, 26.0, 27.0, 28.0, 18.0, 25.0, 21.0, 12.0, 18.0, 14.0, 10.0, 7.0, 8.0, 4.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-14.578125, -14.13427734375, -13.6904296875, -13.24658203125, -12.802734375, -12.35888671875, -11.9150390625, -11.47119140625, -11.02734375, -10.58349609375, -10.1396484375, -9.69580078125, -9.251953125, -8.80810546875, -8.3642578125, -7.92041015625, -7.4765625, -7.03271484375, -6.5888671875, -6.14501953125, -5.701171875, -5.25732421875, -4.8134765625, -4.36962890625, -3.92578125, -3.48193359375, -3.0380859375, -2.59423828125, -2.150390625, -1.70654296875, -1.2626953125, -0.81884765625, -0.375, 0.06884765625, 0.5126953125, 0.95654296875, 1.400390625, 1.84423828125, 2.2880859375, 2.73193359375, 3.17578125, 3.61962890625, 4.0634765625, 4.50732421875, 4.951171875, 5.39501953125, 5.8388671875, 6.28271484375, 6.7265625, 7.17041015625, 7.6142578125, 8.05810546875, 8.501953125, 8.94580078125, 9.3896484375, 9.83349609375, 10.27734375, 10.72119140625, 11.1650390625, 11.60888671875, 12.052734375, 12.49658203125, 12.9404296875, 13.38427734375, 13.828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 16.0, 19.0, 32.0, 36.0, 74.0, 129.0, 168.0, 268.0, 413.0, 704.0, 1060.0, 1633.0, 2517.0, 4167.0, 6568.0, 10058.0, 15967.0, 24823.0, 37371.0, 55383.0, 77923.0, 101771.0, 120611.0, 127506.0, 120506.0, 100925.0, 77742.0, 55352.0, 37153.0, 24391.0, 15684.0, 10165.0, 6282.0, 4006.0, 2598.0, 1634.0, 1053.0, 669.0, 401.0, 279.0, 177.0, 103.0, 74.0, 50.0, 29.0, 20.0, 15.0, 9.0, 4.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-11.15625, -10.8128662109375, -10.469482421875, -10.1260986328125, -9.78271484375, -9.4393310546875, -9.095947265625, -8.7525634765625, -8.4091796875, -8.0657958984375, -7.722412109375, -7.3790283203125, -7.03564453125, -6.6922607421875, -6.348876953125, -6.0054931640625, -5.662109375, -5.3187255859375, -4.975341796875, -4.6319580078125, -4.28857421875, -3.9451904296875, -3.601806640625, -3.2584228515625, -2.9150390625, -2.5716552734375, -2.228271484375, -1.8848876953125, -1.54150390625, -1.1981201171875, -0.854736328125, -0.5113525390625, -0.16796875, 0.1754150390625, 0.518798828125, 0.8621826171875, 1.20556640625, 1.5489501953125, 1.892333984375, 2.2357177734375, 2.5791015625, 2.9224853515625, 3.265869140625, 3.6092529296875, 3.95263671875, 4.2960205078125, 4.639404296875, 4.9827880859375, 5.326171875, 5.6695556640625, 6.012939453125, 6.3563232421875, 6.69970703125, 7.0430908203125, 7.386474609375, 7.7298583984375, 8.0732421875, 8.4166259765625, 8.760009765625, 9.1033935546875, 9.44677734375, 9.7901611328125, 10.133544921875, 10.4769287109375, 10.8203125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 4.0, 9.0, 6.0, 14.0, 9.0, 22.0, 21.0, 11.0, 21.0, 26.0, 31.0, 32.0, 32.0, 41.0, 37.0, 40.0, 39.0, 49.0, 44.0, 38.0, 41.0, 27.0, 38.0, 31.0, 40.0, 31.0, 26.0, 29.0, 30.0, 25.0, 29.0, 16.0, 21.0, 9.0, 11.0, 17.0, 6.0, 11.0, 9.0, 8.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.5546875, -9.2633056640625, -8.971923828125, -8.6805419921875, -8.38916015625, -8.0977783203125, -7.806396484375, -7.5150146484375, -7.2236328125, -6.9322509765625, -6.640869140625, -6.3494873046875, -6.05810546875, -5.7667236328125, -5.475341796875, -5.1839599609375, -4.892578125, -4.6011962890625, -4.309814453125, -4.0184326171875, -3.72705078125, -3.4356689453125, -3.144287109375, -2.8529052734375, -2.5615234375, -2.2701416015625, -1.978759765625, -1.6873779296875, -1.39599609375, -1.1046142578125, -0.813232421875, -0.5218505859375, -0.23046875, 0.0609130859375, 0.352294921875, 0.6436767578125, 0.93505859375, 1.2264404296875, 1.517822265625, 1.8092041015625, 2.1005859375, 2.3919677734375, 2.683349609375, 2.9747314453125, 3.26611328125, 3.5574951171875, 3.848876953125, 4.1402587890625, 4.431640625, 4.7230224609375, 5.014404296875, 5.3057861328125, 5.59716796875, 5.8885498046875, 6.179931640625, 6.4713134765625, 6.7626953125, 7.0540771484375, 7.345458984375, 7.6368408203125, 7.92822265625, 8.2196044921875, 8.510986328125, 8.8023681640625, 9.09375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 19.0, 13.0, 26.0, 29.0, 34.0, 50.0, 87.0, 120.0, 231.0, 358.0, 544.0, 938.0, 1463.0, 2439.0, 4100.0, 7152.0, 12354.0, 20954.0, 35352.0, 58086.0, 88537.0, 122550.0, 149611.0, 152742.0, 131324.0, 96992.0, 64933.0, 39814.0, 23921.0, 13806.0, 8153.0, 4805.0, 2722.0, 1562.0, 1015.0, 616.0, 409.0, 240.0, 135.0, 99.0, 57.0, 45.0, 32.0, 17.0, 11.0, 11.0, 13.0, 8.0, 5.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.283203125, -3.177703857421875, -3.07220458984375, -2.966705322265625, -2.8612060546875, -2.755706787109375, -2.65020751953125, -2.544708251953125, -2.439208984375, -2.333709716796875, -2.22821044921875, -2.122711181640625, -2.0172119140625, -1.911712646484375, -1.80621337890625, -1.700714111328125, -1.59521484375, -1.489715576171875, -1.38421630859375, -1.278717041015625, -1.1732177734375, -1.067718505859375, -0.96221923828125, -0.856719970703125, -0.751220703125, -0.645721435546875, -0.54022216796875, -0.434722900390625, -0.3292236328125, -0.223724365234375, -0.11822509765625, -0.012725830078125, 0.0927734375, 0.198272705078125, 0.30377197265625, 0.409271240234375, 0.5147705078125, 0.620269775390625, 0.72576904296875, 0.831268310546875, 0.936767578125, 1.042266845703125, 1.14776611328125, 1.253265380859375, 1.3587646484375, 1.464263916015625, 1.56976318359375, 1.675262451171875, 1.78076171875, 1.886260986328125, 1.99176025390625, 2.097259521484375, 2.2027587890625, 2.308258056640625, 2.41375732421875, 2.519256591796875, 2.624755859375, 2.730255126953125, 2.83575439453125, 2.941253662109375, 3.0467529296875, 3.152252197265625, 3.25775146484375, 3.363250732421875, 3.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 4.0, 5.0, 8.0, 9.0, 5.0, 13.0, 8.0, 9.0, 7.0, 14.0, 15.0, 9.0, 15.0, 26.0, 31.0, 35.0, 36.0, 39.0, 41.0, 33.0, 45.0, 47.0, 34.0, 40.0, 49.0, 37.0, 31.0, 40.0, 27.0, 25.0, 41.0, 28.0, 34.0, 25.0, 18.0, 14.0, 10.0, 18.0, 9.0, 5.0, 12.0, 12.0, 9.0, 7.0, 5.0, 8.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024199485778808594, -0.0002345200628042221, -0.00022704526782035828, -0.00021957047283649445, -0.00021209567785263062, -0.00020462088286876678, -0.00019714608788490295, -0.00018967129290103912, -0.0001821964979171753, -0.00017472170293331146, -0.00016724690794944763, -0.0001597721129655838, -0.00015229731798171997, -0.00014482252299785614, -0.0001373477280139923, -0.00012987293303012848, -0.00012239813804626465, -0.00011492334306240082, -0.00010744854807853699, -9.997375309467316e-05, -9.249895811080933e-05, -8.50241631269455e-05, -7.754936814308167e-05, -7.007457315921783e-05, -6.2599778175354e-05, -5.512498319149017e-05, -4.765018820762634e-05, -4.017539322376251e-05, -3.270059823989868e-05, -2.522580325603485e-05, -1.775100827217102e-05, -1.027621328830719e-05, -2.8014183044433594e-06, 4.673376679420471e-06, 1.2148171663284302e-05, 1.9622966647148132e-05, 2.7097761631011963e-05, 3.4572556614875793e-05, 4.2047351598739624e-05, 4.9522146582603455e-05, 5.6996941566467285e-05, 6.447173655033112e-05, 7.194653153419495e-05, 7.942132651805878e-05, 8.689612150192261e-05, 9.437091648578644e-05, 0.00010184571146965027, 0.0001093205064535141, 0.00011679530143737793, 0.00012427009642124176, 0.0001317448914051056, 0.00013921968638896942, 0.00014669448137283325, 0.00015416927635669708, 0.0001616440713405609, 0.00016911886632442474, 0.00017659366130828857, 0.0001840684562921524, 0.00019154325127601624, 0.00019901804625988007, 0.0002064928412437439, 0.00021396763622760773, 0.00022144243121147156, 0.0002289172261953354, 0.00023639202117919922]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 18.0, 14.0, 25.0, 30.0, 38.0, 67.0, 96.0, 123.0, 244.0, 320.0, 499.0, 685.0, 1006.0, 1493.0, 2307.0, 3551.0, 5420.0, 8301.0, 12780.0, 19488.0, 30000.0, 44669.0, 63759.0, 86098.0, 108364.0, 123725.0, 124372.0, 111305.0, 90613.0, 67940.0, 47844.0, 31854.0, 21296.0, 13773.0, 9057.0, 5900.0, 3895.0, 2523.0, 1645.0, 1070.0, 751.0, 523.0, 314.0, 239.0, 163.0, 128.0, 78.0, 44.0, 38.0, 24.0, 15.0, 13.0, 4.0, 3.0, 3.0, 2.0], "bins": [-3.119140625, -3.02764892578125, -2.9361572265625, -2.84466552734375, -2.753173828125, -2.66168212890625, -2.5701904296875, -2.47869873046875, -2.38720703125, -2.29571533203125, -2.2042236328125, -2.11273193359375, -2.021240234375, -1.92974853515625, -1.8382568359375, -1.74676513671875, -1.6552734375, -1.56378173828125, -1.4722900390625, -1.38079833984375, -1.289306640625, -1.19781494140625, -1.1063232421875, -1.01483154296875, -0.92333984375, -0.83184814453125, -0.7403564453125, -0.64886474609375, -0.557373046875, -0.46588134765625, -0.3743896484375, -0.28289794921875, -0.19140625, -0.09991455078125, -0.0084228515625, 0.08306884765625, 0.174560546875, 0.26605224609375, 0.3575439453125, 0.44903564453125, 0.54052734375, 0.63201904296875, 0.7235107421875, 0.81500244140625, 0.906494140625, 0.99798583984375, 1.0894775390625, 1.18096923828125, 1.2724609375, 1.36395263671875, 1.4554443359375, 1.54693603515625, 1.638427734375, 1.72991943359375, 1.8214111328125, 1.91290283203125, 2.00439453125, 2.09588623046875, 2.1873779296875, 2.27886962890625, 2.370361328125, 2.46185302734375, 2.5533447265625, 2.64483642578125, 2.736328125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 9.0, 18.0, 18.0, 22.0, 32.0, 34.0, 39.0, 50.0, 50.0, 58.0, 63.0, 63.0, 63.0, 56.0, 61.0, 53.0, 49.0, 42.0, 37.0, 33.0, 27.0, 19.0, 15.0, 12.0, 6.0, 11.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.009765625, -1.949005126953125, -1.88824462890625, -1.827484130859375, -1.7667236328125, -1.705963134765625, -1.64520263671875, -1.584442138671875, -1.523681640625, -1.462921142578125, -1.40216064453125, -1.341400146484375, -1.2806396484375, -1.219879150390625, -1.15911865234375, -1.098358154296875, -1.03759765625, -0.976837158203125, -0.91607666015625, -0.855316162109375, -0.7945556640625, -0.733795166015625, -0.67303466796875, -0.612274169921875, -0.551513671875, -0.490753173828125, -0.42999267578125, -0.369232177734375, -0.3084716796875, -0.247711181640625, -0.18695068359375, -0.126190185546875, -0.0654296875, -0.004669189453125, 0.05609130859375, 0.116851806640625, 0.1776123046875, 0.238372802734375, 0.29913330078125, 0.359893798828125, 0.420654296875, 0.481414794921875, 0.54217529296875, 0.602935791015625, 0.6636962890625, 0.724456787109375, 0.78521728515625, 0.845977783203125, 0.90673828125, 0.967498779296875, 1.02825927734375, 1.089019775390625, 1.1497802734375, 1.210540771484375, 1.27130126953125, 1.332061767578125, 1.392822265625, 1.453582763671875, 1.51434326171875, 1.575103759765625, 1.6358642578125, 1.696624755859375, 1.75738525390625, 1.818145751953125, 1.87890625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 6.0, 8.0, 9.0, 6.0, 14.0, 16.0, 17.0, 23.0, 23.0, 25.0, 29.0, 41.0, 27.0, 57.0, 33.0, 45.0, 56.0, 48.0, 55.0, 49.0, 46.0, 41.0, 44.0, 44.0, 32.0, 36.0, 28.0, 24.0, 20.0, 16.0, 14.0, 11.0, 11.0, 9.0, 4.0, 9.0, 9.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.851200103759766, -12.450047492980957, -12.048893928527832, -11.647741317749023, -11.246587753295898, -10.84543514251709, -10.444282531738281, -10.043128967285156, -9.641975402832031, -9.240822792053223, -8.839669227600098, -8.438516616821289, -8.037363052368164, -7.6362104415893555, -7.235057353973389, -6.833904266357422, -6.432751655578613, -6.0315985679626465, -5.63044548034668, -5.229292869567871, -4.828139305114746, -4.4269866943359375, -4.025833606719971, -3.624680519104004, -3.223527431488037, -2.8223743438720703, -2.4212212562561035, -2.020068407058716, -1.618915319442749, -1.2177622318267822, -0.8166093826293945, -0.41545629501342773, -0.014302253723144531, 0.3868507742881775, 0.7880038022994995, 1.1891567707061768, 1.5903098583221436, 1.9914629459381104, 2.392615795135498, 2.793768882751465, 3.1949219703674316, 3.5960750579833984, 3.9972281455993652, 4.398381233215332, 4.799533843994141, 5.200687408447266, 5.601840019226074, 6.002993106842041, 6.404146194458008, 6.805299282073975, 7.206452369689941, 7.60760498046875, 8.008758544921875, 8.409911155700684, 8.811063766479492, 9.212217330932617, 9.613370895385742, 10.01452350616455, 10.415677070617676, 10.816829681396484, 11.21798324584961, 11.619135856628418, 12.020288467407227, 12.421442031860352, 12.82259464263916]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 1.0, 4.0, 8.0, 8.0, 14.0, 13.0, 25.0, 19.0, 15.0, 28.0, 37.0, 28.0, 33.0, 32.0, 43.0, 40.0, 45.0, 33.0, 50.0, 36.0, 42.0, 33.0, 37.0, 40.0, 27.0, 37.0, 36.0, 30.0, 31.0, 30.0, 27.0, 21.0, 20.0, 11.0, 13.0, 13.0, 9.0, 6.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-17.322124481201172, -16.834665298461914, -16.34720802307129, -15.859748840332031, -15.372289657592773, -14.884831428527832, -14.39737319946289, -13.909914016723633, -13.422454833984375, -12.934996604919434, -12.447537422180176, -11.960079193115234, -11.472620010375977, -10.985161781311035, -10.497703552246094, -10.010244369506836, -9.522786140441895, -9.035327911376953, -8.547868728637695, -8.060410499572754, -7.572951316833496, -7.085493087768555, -6.598034381866455, -6.1105756759643555, -5.623116970062256, -5.135658264160156, -4.648199558258057, -4.160740852355957, -3.6732823848724365, -3.185823678970337, -2.6983652114868164, -2.210906505584717, -1.7234468460083008, -1.2359881401062012, -0.7485295534133911, -0.26107096672058105, 0.22638773918151855, 0.7138464450836182, 1.2013049125671387, 1.6887636184692383, 2.176222324371338, 2.6636810302734375, 3.151139736175537, 3.6385982036590576, 4.126056671142578, 4.613515853881836, 5.100974082946777, 5.588432788848877, 6.075891494750977, 6.563350200653076, 7.050808906555176, 7.538267135620117, 8.025726318359375, 8.513184547424316, 9.000642776489258, 9.488101959228516, 9.975561141967773, 10.463019371032715, 10.950478553771973, 11.437936782836914, 11.925395965576172, 12.412854194641113, 12.900312423706055, 13.387771606445312, 13.875229835510254]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 7.0, 14.0, 15.0, 28.0, 41.0, 75.0, 96.0, 183.0, 257.0, 413.0, 630.0, 1045.0, 1686.0, 2672.0, 4093.0, 6544.0, 10608.0, 16948.0, 27083.0, 43835.0, 69306.0, 110514.0, 173618.0, 265412.0, 385346.0, 504839.0, 579075.0, 560832.0, 464283.0, 338622.0, 228706.0, 148166.0, 93145.0, 58053.0, 36946.0, 22830.0, 14109.0, 8901.0, 5600.0, 3524.0, 2244.0, 1489.0, 890.0, 554.0, 354.0, 275.0, 131.0, 81.0, 68.0, 39.0, 28.0, 19.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.7734375, -9.4564208984375, -9.139404296875, -8.8223876953125, -8.50537109375, -8.1883544921875, -7.871337890625, -7.5543212890625, -7.2373046875, -6.9202880859375, -6.603271484375, -6.2862548828125, -5.96923828125, -5.6522216796875, -5.335205078125, -5.0181884765625, -4.701171875, -4.3841552734375, -4.067138671875, -3.7501220703125, -3.43310546875, -3.1160888671875, -2.799072265625, -2.4820556640625, -2.1650390625, -1.8480224609375, -1.531005859375, -1.2139892578125, -0.89697265625, -0.5799560546875, -0.262939453125, 0.0540771484375, 0.37109375, 0.6881103515625, 1.005126953125, 1.3221435546875, 1.63916015625, 1.9561767578125, 2.273193359375, 2.5902099609375, 2.9072265625, 3.2242431640625, 3.541259765625, 3.8582763671875, 4.17529296875, 4.4923095703125, 4.809326171875, 5.1263427734375, 5.443359375, 5.7603759765625, 6.077392578125, 6.3944091796875, 6.71142578125, 7.0284423828125, 7.345458984375, 7.6624755859375, 7.9794921875, 8.2965087890625, 8.613525390625, 8.9305419921875, 9.24755859375, 9.5645751953125, 9.881591796875, 10.1986083984375, 10.515625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 5.0, 9.0, 11.0, 11.0, 17.0, 8.0, 19.0, 17.0, 31.0, 24.0, 32.0, 36.0, 35.0, 22.0, 40.0, 38.0, 45.0, 40.0, 31.0, 32.0, 39.0, 37.0, 35.0, 41.0, 39.0, 33.0, 30.0, 31.0, 31.0, 27.0, 33.0, 16.0, 15.0, 17.0, 13.0, 16.0, 10.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-11.8515625, -11.510498046875, -11.16943359375, -10.828369140625, -10.4873046875, -10.146240234375, -9.80517578125, -9.464111328125, -9.123046875, -8.781982421875, -8.44091796875, -8.099853515625, -7.7587890625, -7.417724609375, -7.07666015625, -6.735595703125, -6.39453125, -6.053466796875, -5.71240234375, -5.371337890625, -5.0302734375, -4.689208984375, -4.34814453125, -4.007080078125, -3.666015625, -3.324951171875, -2.98388671875, -2.642822265625, -2.3017578125, -1.960693359375, -1.61962890625, -1.278564453125, -0.9375, -0.596435546875, -0.25537109375, 0.085693359375, 0.4267578125, 0.767822265625, 1.10888671875, 1.449951171875, 1.791015625, 2.132080078125, 2.47314453125, 2.814208984375, 3.1552734375, 3.496337890625, 3.83740234375, 4.178466796875, 4.51953125, 4.860595703125, 5.20166015625, 5.542724609375, 5.8837890625, 6.224853515625, 6.56591796875, 6.906982421875, 7.248046875, 7.589111328125, 7.93017578125, 8.271240234375, 8.6123046875, 8.953369140625, 9.29443359375, 9.635498046875, 9.9765625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 2.0, 5.0, 9.0, 14.0, 27.0, 26.0, 68.0, 110.0, 155.0, 224.0, 378.0, 626.0, 940.0, 1552.0, 2487.0, 4008.0, 6395.0, 10358.0, 16422.0, 25896.0, 40713.0, 62393.0, 93121.0, 137983.0, 194011.0, 263355.0, 336598.0, 401879.0, 442589.0, 447184.0, 413568.0, 352200.0, 281125.0, 210597.0, 150512.0, 103481.0, 69156.0, 45628.0, 29262.0, 18447.0, 11721.0, 7185.0, 4543.0, 2722.0, 1788.0, 1063.0, 625.0, 413.0, 259.0, 188.0, 107.0, 62.0, 36.0, 31.0, 28.0, 4.0, 4.0, 2.0, 2.0, 2.0, 4.0], "bins": [-8.109375, -7.85693359375, -7.6044921875, -7.35205078125, -7.099609375, -6.84716796875, -6.5947265625, -6.34228515625, -6.08984375, -5.83740234375, -5.5849609375, -5.33251953125, -5.080078125, -4.82763671875, -4.5751953125, -4.32275390625, -4.0703125, -3.81787109375, -3.5654296875, -3.31298828125, -3.060546875, -2.80810546875, -2.5556640625, -2.30322265625, -2.05078125, -1.79833984375, -1.5458984375, -1.29345703125, -1.041015625, -0.78857421875, -0.5361328125, -0.28369140625, -0.03125, 0.22119140625, 0.4736328125, 0.72607421875, 0.978515625, 1.23095703125, 1.4833984375, 1.73583984375, 1.98828125, 2.24072265625, 2.4931640625, 2.74560546875, 2.998046875, 3.25048828125, 3.5029296875, 3.75537109375, 4.0078125, 4.26025390625, 4.5126953125, 4.76513671875, 5.017578125, 5.27001953125, 5.5224609375, 5.77490234375, 6.02734375, 6.27978515625, 6.5322265625, 6.78466796875, 7.037109375, 7.28955078125, 7.5419921875, 7.79443359375, 8.046875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 4.0, 11.0, 20.0, 17.0, 26.0, 47.0, 38.0, 52.0, 77.0, 73.0, 118.0, 138.0, 160.0, 141.0, 175.0, 184.0, 213.0, 238.0, 212.0, 207.0, 218.0, 242.0, 187.0, 181.0, 172.0, 151.0, 128.0, 108.0, 93.0, 100.0, 70.0, 57.0, 52.0, 35.0, 23.0, 16.0, 20.0, 17.0, 16.0, 10.0, 5.0, 8.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30859375, -5.14263916015625, -4.9766845703125, -4.81072998046875, -4.644775390625, -4.47882080078125, -4.3128662109375, -4.14691162109375, -3.98095703125, -3.81500244140625, -3.6490478515625, -3.48309326171875, -3.317138671875, -3.15118408203125, -2.9852294921875, -2.81927490234375, -2.6533203125, -2.48736572265625, -2.3214111328125, -2.15545654296875, -1.989501953125, -1.82354736328125, -1.6575927734375, -1.49163818359375, -1.32568359375, -1.15972900390625, -0.9937744140625, -0.82781982421875, -0.661865234375, -0.49591064453125, -0.3299560546875, -0.16400146484375, 0.001953125, 0.16790771484375, 0.3338623046875, 0.49981689453125, 0.665771484375, 0.83172607421875, 0.9976806640625, 1.16363525390625, 1.32958984375, 1.49554443359375, 1.6614990234375, 1.82745361328125, 1.993408203125, 2.15936279296875, 2.3253173828125, 2.49127197265625, 2.6572265625, 2.82318115234375, 2.9891357421875, 3.15509033203125, 3.321044921875, 3.48699951171875, 3.6529541015625, 3.81890869140625, 3.98486328125, 4.15081787109375, 4.3167724609375, 4.48272705078125, 4.648681640625, 4.81463623046875, 4.9805908203125, 5.14654541015625, 5.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 8.0, 7.0, 8.0, 14.0, 16.0, 16.0, 30.0, 23.0, 30.0, 39.0, 42.0, 53.0, 51.0, 49.0, 55.0, 39.0, 36.0, 58.0, 39.0, 48.0, 45.0, 39.0, 35.0, 33.0, 21.0, 34.0, 15.0, 24.0, 18.0, 12.0, 11.0, 8.0, 11.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.844474792480469, -9.487083435058594, -9.129693031311035, -8.77230167388916, -8.414911270141602, -8.057519912719727, -7.700128555297852, -7.342737674713135, -6.985346794128418, -6.627955913543701, -6.270565032958984, -5.913173675537109, -5.555782794952393, -5.198391914367676, -4.841000556945801, -4.483609676361084, -4.126218795776367, -3.7688279151916504, -3.4114367961883545, -3.0540456771850586, -2.696654796600342, -2.339263916015625, -1.981872797012329, -1.6244816780090332, -1.2670907974243164, -0.9096997976303101, -0.5523087978363037, -0.19491779804229736, 0.16247320175170898, 0.5198642015457153, 0.8772552013397217, 1.2346463203430176, 1.592036247253418, 1.9494272470474243, 2.3068182468414307, 2.6642093658447266, 3.0216002464294434, 3.37899112701416, 3.736382246017456, 4.093773365020752, 4.451164245605469, 4.8085551261901855, 5.165946006774902, 5.523337364196777, 5.880728244781494, 6.238119125366211, 6.595510482788086, 6.952901363372803, 7.3102922439575195, 7.667683124542236, 8.025074005126953, 8.382465362548828, 8.739856719970703, 9.097247123718262, 9.454638481140137, 9.812028884887695, 10.16942024230957, 10.526811599731445, 10.884202003479004, 11.241593360900879, 11.598983764648438, 11.956375122070312, 12.313766479492188, 12.671157836914062, 13.028548240661621]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 12.0, 5.0, 11.0, 8.0, 17.0, 12.0, 19.0, 25.0, 33.0, 22.0, 39.0, 30.0, 38.0, 48.0, 33.0, 37.0, 47.0, 45.0, 44.0, 42.0, 42.0, 45.0, 44.0, 44.0, 34.0, 32.0, 28.0, 18.0, 29.0, 22.0, 18.0, 16.0, 13.0, 10.0, 12.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.543310165405273, -13.10470199584961, -12.666092872619629, -12.227484703063965, -11.788875579833984, -11.35026741027832, -10.91165828704834, -10.473050117492676, -10.034440994262695, -9.595832824707031, -9.15722370147705, -8.718615531921387, -8.280006408691406, -7.841398239135742, -7.402789115905762, -6.964180946350098, -6.525572299957275, -6.086963653564453, -5.648355007171631, -5.209746360778809, -4.771137714385986, -4.332529067993164, -3.893920660018921, -3.4553120136260986, -3.0167033672332764, -2.578094720840454, -2.139486074447632, -1.7008775472640991, -1.2622689008712769, -0.8236603736877441, -0.3850517272949219, 0.05355691909790039, 0.49216556549072266, 0.9307742118835449, 1.3693828582763672, 1.8079913854599, 2.2466001510620117, 2.685208559036255, 3.123817205429077, 3.5624258518218994, 4.001034736633301, 4.439643383026123, 4.878252029418945, 5.316860675811768, 5.75546932220459, 6.194077491760254, 6.632686614990234, 7.071294784545898, 7.509903430938721, 7.948512077331543, 8.387120246887207, 8.825729370117188, 9.264337539672852, 9.702946662902832, 10.141554832458496, 10.580163955688477, 11.01877212524414, 11.457380294799805, 11.895989418029785, 12.33459758758545, 12.77320671081543, 13.211814880371094, 13.650424003601074, 14.089032173156738, 14.527641296386719]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 10.0, 16.0, 20.0, 21.0, 47.0, 69.0, 125.0, 175.0, 293.0, 472.0, 688.0, 1111.0, 1769.0, 2814.0, 4396.0, 7144.0, 11543.0, 18734.0, 31080.0, 51637.0, 86223.0, 140315.0, 203372.0, 184195.0, 118899.0, 72499.0, 43137.0, 25839.0, 15759.0, 9921.0, 6001.0, 3722.0, 2391.0, 1477.0, 942.0, 618.0, 418.0, 222.0, 163.0, 99.0, 68.0, 40.0, 22.0, 21.0, 14.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.732421875, -2.651641845703125, -2.57086181640625, -2.490081787109375, -2.4093017578125, -2.328521728515625, -2.24774169921875, -2.166961669921875, -2.086181640625, -2.005401611328125, -1.92462158203125, -1.843841552734375, -1.7630615234375, -1.682281494140625, -1.60150146484375, -1.520721435546875, -1.43994140625, -1.359161376953125, -1.27838134765625, -1.197601318359375, -1.1168212890625, -1.036041259765625, -0.95526123046875, -0.874481201171875, -0.793701171875, -0.712921142578125, -0.63214111328125, -0.551361083984375, -0.4705810546875, -0.389801025390625, -0.30902099609375, -0.228240966796875, -0.1474609375, -0.066680908203125, 0.01409912109375, 0.094879150390625, 0.1756591796875, 0.256439208984375, 0.33721923828125, 0.417999267578125, 0.498779296875, 0.579559326171875, 0.66033935546875, 0.741119384765625, 0.8218994140625, 0.902679443359375, 0.98345947265625, 1.064239501953125, 1.14501953125, 1.225799560546875, 1.30657958984375, 1.387359619140625, 1.4681396484375, 1.548919677734375, 1.62969970703125, 1.710479736328125, 1.791259765625, 1.872039794921875, 1.95281982421875, 2.033599853515625, 2.1143798828125, 2.195159912109375, 2.27593994140625, 2.356719970703125, 2.4375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 1.0, 3.0, 14.0, 10.0, 13.0, 11.0, 16.0, 14.0, 21.0, 29.0, 33.0, 36.0, 27.0, 47.0, 28.0, 35.0, 48.0, 43.0, 48.0, 38.0, 48.0, 47.0, 48.0, 45.0, 50.0, 32.0, 23.0, 28.0, 28.0, 27.0, 27.0, 20.0, 14.0, 11.0, 9.0, 4.0, 8.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.40625, -14.9561767578125, -14.506103515625, -14.0560302734375, -13.60595703125, -13.1558837890625, -12.705810546875, -12.2557373046875, -11.8056640625, -11.3555908203125, -10.905517578125, -10.4554443359375, -10.00537109375, -9.5552978515625, -9.105224609375, -8.6551513671875, -8.205078125, -7.7550048828125, -7.304931640625, -6.8548583984375, -6.40478515625, -5.9547119140625, -5.504638671875, -5.0545654296875, -4.6044921875, -4.1544189453125, -3.704345703125, -3.2542724609375, -2.80419921875, -2.3541259765625, -1.904052734375, -1.4539794921875, -1.00390625, -0.5538330078125, -0.103759765625, 0.3463134765625, 0.79638671875, 1.2464599609375, 1.696533203125, 2.1466064453125, 2.5966796875, 3.0467529296875, 3.496826171875, 3.9468994140625, 4.39697265625, 4.8470458984375, 5.297119140625, 5.7471923828125, 6.197265625, 6.6473388671875, 7.097412109375, 7.5474853515625, 7.99755859375, 8.4476318359375, 8.897705078125, 9.3477783203125, 9.7978515625, 10.2479248046875, 10.697998046875, 11.1480712890625, 11.59814453125, 12.0482177734375, 12.498291015625, 12.9483642578125, 13.3984375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 4.0, 1.0, 5.0, 5.0, 10.0, 12.0, 10.0, 14.0, 24.0, 16.0, 36.0, 56.0, 64.0, 83.0, 97.0, 139.0, 189.0, 275.0, 398.0, 561.0, 868.0, 1440.0, 2647.0, 5663.0, 13415.0, 36854.0, 893808.0, 57094.0, 18759.0, 7556.0, 3379.0, 1772.0, 1031.0, 632.0, 466.0, 301.0, 250.0, 144.0, 116.0, 98.0, 65.0, 58.0, 46.0, 24.0, 17.0, 12.0, 7.0, 9.0, 10.0, 3.0, 7.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.765625, -7.5205078125, -7.275390625, -7.0302734375, -6.78515625, -6.5400390625, -6.294921875, -6.0498046875, -5.8046875, -5.5595703125, -5.314453125, -5.0693359375, -4.82421875, -4.5791015625, -4.333984375, -4.0888671875, -3.84375, -3.5986328125, -3.353515625, -3.1083984375, -2.86328125, -2.6181640625, -2.373046875, -2.1279296875, -1.8828125, -1.6376953125, -1.392578125, -1.1474609375, -0.90234375, -0.6572265625, -0.412109375, -0.1669921875, 0.078125, 0.3232421875, 0.568359375, 0.8134765625, 1.05859375, 1.3037109375, 1.548828125, 1.7939453125, 2.0390625, 2.2841796875, 2.529296875, 2.7744140625, 3.01953125, 3.2646484375, 3.509765625, 3.7548828125, 4.0, 4.2451171875, 4.490234375, 4.7353515625, 4.98046875, 5.2255859375, 5.470703125, 5.7158203125, 5.9609375, 6.2060546875, 6.451171875, 6.6962890625, 6.94140625, 7.1865234375, 7.431640625, 7.6767578125, 7.921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 10.0, 6.0, 9.0, 7.0, 5.0, 9.0, 15.0, 25.0, 13.0, 23.0, 35.0, 27.0, 24.0, 28.0, 25.0, 31.0, 48.0, 48.0, 48.0, 42.0, 44.0, 42.0, 41.0, 30.0, 34.0, 42.0, 29.0, 34.0, 22.0, 24.0, 19.0, 30.0, 23.0, 21.0, 15.0, 8.0, 10.0, 11.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.65625, -8.3865966796875, -8.116943359375, -7.8472900390625, -7.57763671875, -7.3079833984375, -7.038330078125, -6.7686767578125, -6.4990234375, -6.2293701171875, -5.959716796875, -5.6900634765625, -5.42041015625, -5.1507568359375, -4.881103515625, -4.6114501953125, -4.341796875, -4.0721435546875, -3.802490234375, -3.5328369140625, -3.26318359375, -2.9935302734375, -2.723876953125, -2.4542236328125, -2.1845703125, -1.9149169921875, -1.645263671875, -1.3756103515625, -1.10595703125, -0.8363037109375, -0.566650390625, -0.2969970703125, -0.02734375, 0.2423095703125, 0.511962890625, 0.7816162109375, 1.05126953125, 1.3209228515625, 1.590576171875, 1.8602294921875, 2.1298828125, 2.3995361328125, 2.669189453125, 2.9388427734375, 3.20849609375, 3.4781494140625, 3.747802734375, 4.0174560546875, 4.287109375, 4.5567626953125, 4.826416015625, 5.0960693359375, 5.36572265625, 5.6353759765625, 5.905029296875, 6.1746826171875, 6.4443359375, 6.7139892578125, 6.983642578125, 7.2532958984375, 7.52294921875, 7.7926025390625, 8.062255859375, 8.3319091796875, 8.6015625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 5.0, 6.0, 11.0, 12.0, 17.0, 31.0, 33.0, 41.0, 82.0, 72.0, 140.0, 184.0, 313.0, 456.0, 748.0, 1362.0, 2683.0, 6529.0, 22429.0, 945301.0, 49276.0, 10531.0, 3825.0, 1773.0, 949.0, 588.0, 371.0, 225.0, 163.0, 109.0, 78.0, 47.0, 47.0, 31.0, 19.0, 12.0, 18.0, 10.0, 8.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6142578125, -1.5599365234375, -1.505615234375, -1.4512939453125, -1.39697265625, -1.3426513671875, -1.288330078125, -1.2340087890625, -1.1796875, -1.1253662109375, -1.071044921875, -1.0167236328125, -0.96240234375, -0.9080810546875, -0.853759765625, -0.7994384765625, -0.7451171875, -0.6907958984375, -0.636474609375, -0.5821533203125, -0.52783203125, -0.4735107421875, -0.419189453125, -0.3648681640625, -0.310546875, -0.2562255859375, -0.201904296875, -0.1475830078125, -0.09326171875, -0.0389404296875, 0.015380859375, 0.0697021484375, 0.1240234375, 0.1783447265625, 0.232666015625, 0.2869873046875, 0.34130859375, 0.3956298828125, 0.449951171875, 0.5042724609375, 0.55859375, 0.6129150390625, 0.667236328125, 0.7215576171875, 0.77587890625, 0.8302001953125, 0.884521484375, 0.9388427734375, 0.9931640625, 1.0474853515625, 1.101806640625, 1.1561279296875, 1.21044921875, 1.2647705078125, 1.319091796875, 1.3734130859375, 1.427734375, 1.4820556640625, 1.536376953125, 1.5906982421875, 1.64501953125, 1.6993408203125, 1.753662109375, 1.8079833984375, 1.8623046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 13.0, 10.0, 12.0, 13.0, 24.0, 25.0, 22.0, 34.0, 38.0, 47.0, 50.0, 42.0, 47.0, 67.0, 46.0, 41.0, 68.0, 48.0, 49.0, 47.0, 36.0, 29.0, 33.0, 21.0, 18.0, 23.0, 14.0, 14.0, 14.0, 14.0, 4.0, 11.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.3113021850585938e-05, -1.2735836207866669e-05, -1.23586505651474e-05, -1.1981464922428131e-05, -1.1604279279708862e-05, -1.1227093636989594e-05, -1.0849907994270325e-05, -1.0472722351551056e-05, -1.0095536708831787e-05, -9.718351066112518e-06, -9.34116542339325e-06, -8.96397978067398e-06, -8.586794137954712e-06, -8.209608495235443e-06, -7.832422852516174e-06, -7.4552372097969055e-06, -7.078051567077637e-06, -6.700865924358368e-06, -6.323680281639099e-06, -5.94649463891983e-06, -5.5693089962005615e-06, -5.192123353481293e-06, -4.814937710762024e-06, -4.437752068042755e-06, -4.060566425323486e-06, -3.6833807826042175e-06, -3.3061951398849487e-06, -2.92900949716568e-06, -2.551823854446411e-06, -2.1746382117271423e-06, -1.7974525690078735e-06, -1.4202669262886047e-06, -1.043081283569336e-06, -6.658956408500671e-07, -2.8870999813079834e-07, 8.847564458847046e-08, 4.6566128730773926e-07, 8.428469300270081e-07, 1.2200325727462769e-06, 1.5972182154655457e-06, 1.9744038581848145e-06, 2.3515895009040833e-06, 2.728775143623352e-06, 3.105960786342621e-06, 3.4831464290618896e-06, 3.8603320717811584e-06, 4.237517714500427e-06, 4.614703357219696e-06, 4.991888999938965e-06, 5.369074642658234e-06, 5.7462602853775024e-06, 6.123445928096771e-06, 6.50063157081604e-06, 6.877817213535309e-06, 7.255002856254578e-06, 7.632188498973846e-06, 8.009374141693115e-06, 8.386559784412384e-06, 8.763745427131653e-06, 9.140931069850922e-06, 9.51811671257019e-06, 9.89530235528946e-06, 1.0272487998008728e-05, 1.0649673640727997e-05, 1.1026859283447266e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 14.0, 17.0, 19.0, 40.0, 52.0, 95.0, 161.0, 208.0, 339.0, 566.0, 960.0, 1544.0, 2641.0, 4495.0, 7561.0, 12934.0, 22403.0, 39599.0, 74781.0, 160250.0, 352895.0, 182984.0, 82050.0, 43642.0, 24109.0, 13975.0, 8128.0, 4887.0, 2793.0, 1747.0, 1005.0, 608.0, 372.0, 250.0, 154.0, 84.0, 57.0, 39.0, 24.0, 28.0, 11.0, 6.0, 11.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.57568359375, -0.5574493408203125, -0.539215087890625, -0.5209808349609375, -0.50274658203125, -0.4845123291015625, -0.466278076171875, -0.4480438232421875, -0.4298095703125, -0.4115753173828125, -0.393341064453125, -0.3751068115234375, -0.35687255859375, -0.3386383056640625, -0.320404052734375, -0.3021697998046875, -0.283935546875, -0.2657012939453125, -0.247467041015625, -0.2292327880859375, -0.21099853515625, -0.1927642822265625, -0.174530029296875, -0.1562957763671875, -0.1380615234375, -0.1198272705078125, -0.101593017578125, -0.0833587646484375, -0.06512451171875, -0.0468902587890625, -0.028656005859375, -0.0104217529296875, 0.0078125, 0.0260467529296875, 0.044281005859375, 0.0625152587890625, 0.08074951171875, 0.0989837646484375, 0.117218017578125, 0.1354522705078125, 0.1536865234375, 0.1719207763671875, 0.190155029296875, 0.2083892822265625, 0.22662353515625, 0.2448577880859375, 0.263092041015625, 0.2813262939453125, 0.299560546875, 0.3177947998046875, 0.336029052734375, 0.3542633056640625, 0.37249755859375, 0.3907318115234375, 0.408966064453125, 0.4272003173828125, 0.4454345703125, 0.4636688232421875, 0.481903076171875, 0.5001373291015625, 0.51837158203125, 0.5366058349609375, 0.554840087890625, 0.5730743408203125, 0.59130859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 3.0, 5.0, 7.0, 6.0, 8.0, 17.0, 18.0, 14.0, 22.0, 20.0, 29.0, 27.0, 38.0, 40.0, 37.0, 39.0, 48.0, 40.0, 57.0, 53.0, 55.0, 54.0, 56.0, 42.0, 46.0, 31.0, 38.0, 22.0, 30.0, 24.0, 7.0, 15.0, 13.0, 13.0, 10.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.367919921875, -0.35793304443359375, -0.3479461669921875, -0.33795928955078125, -0.327972412109375, -0.31798553466796875, -0.3079986572265625, -0.29801177978515625, -0.28802490234375, -0.27803802490234375, -0.2680511474609375, -0.25806427001953125, -0.248077392578125, -0.23809051513671875, -0.2281036376953125, -0.21811676025390625, -0.2081298828125, -0.19814300537109375, -0.1881561279296875, -0.17816925048828125, -0.168182373046875, -0.15819549560546875, -0.1482086181640625, -0.13822174072265625, -0.12823486328125, -0.11824798583984375, -0.1082611083984375, -0.09827423095703125, -0.088287353515625, -0.07830047607421875, -0.0683135986328125, -0.05832672119140625, -0.04833984375, -0.03835296630859375, -0.0283660888671875, -0.01837921142578125, -0.008392333984375, 0.00159454345703125, 0.0115814208984375, 0.02156829833984375, 0.03155517578125, 0.04154205322265625, 0.0515289306640625, 0.06151580810546875, 0.071502685546875, 0.08148956298828125, 0.0914764404296875, 0.10146331787109375, 0.1114501953125, 0.12143707275390625, 0.1314239501953125, 0.14141082763671875, 0.151397705078125, 0.16138458251953125, 0.1713714599609375, 0.18135833740234375, 0.19134521484375, 0.20133209228515625, 0.2113189697265625, 0.22130584716796875, 0.231292724609375, 0.24127960205078125, 0.2512664794921875, 0.26125335693359375, 0.271240234375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 9.0, 7.0, 6.0, 8.0, 13.0, 23.0, 15.0, 30.0, 26.0, 28.0, 44.0, 43.0, 46.0, 47.0, 49.0, 50.0, 45.0, 42.0, 46.0, 47.0, 51.0, 42.0, 41.0, 32.0, 27.0, 26.0, 29.0, 28.0, 18.0, 18.0, 15.0, 6.0, 14.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.62267017364502, -9.2692289352417, -8.915787696838379, -8.562346458435059, -8.208904266357422, -7.85546350479126, -7.502021789550781, -7.148580551147461, -6.795139312744141, -6.44169807434082, -6.0882568359375, -5.7348151206970215, -5.381373882293701, -5.027932643890381, -4.674490928649902, -4.321049690246582, -3.9676084518432617, -3.6141672134399414, -3.260725736618042, -2.9072842597961426, -2.5538430213928223, -2.200401782989502, -1.8469603061676025, -1.4935188293457031, -1.1400775909423828, -0.786636233329773, -0.4331948757171631, -0.07975351810455322, 0.27368783950805664, 0.6271291971206665, 0.9805705547332764, 1.3340120315551758, 1.6874523162841797, 2.0408935546875, 2.3943350315093994, 2.747776508331299, 3.101217746734619, 3.4546589851379395, 3.808100461959839, 4.161541938781738, 4.514983177185059, 4.868424415588379, 5.221865653991699, 5.575307369232178, 5.928748607635498, 6.282189846038818, 6.635631561279297, 6.989072799682617, 7.3425140380859375, 7.695955276489258, 8.049396514892578, 8.402837753295898, 8.756278991699219, 9.109721183776855, 9.463162422180176, 9.816603660583496, 10.170044898986816, 10.523486137390137, 10.876927375793457, 11.230368614196777, 11.583810806274414, 11.937252044677734, 12.290693283081055, 12.644134521484375, 12.997575759887695]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 8.0, 11.0, 4.0, 13.0, 12.0, 13.0, 16.0, 15.0, 30.0, 31.0, 28.0, 35.0, 32.0, 39.0, 42.0, 34.0, 39.0, 49.0, 43.0, 42.0, 45.0, 44.0, 40.0, 42.0, 43.0, 38.0, 27.0, 32.0, 16.0, 28.0, 18.0, 18.0, 19.0, 13.0, 10.0, 12.0, 4.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.330594062805176, -12.897187232971191, -12.463780403137207, -12.030372619628906, -11.596965789794922, -11.163558959960938, -10.730152130126953, -10.296745300292969, -9.863338470458984, -9.429931640625, -8.996524810791016, -8.563117980957031, -8.12971019744873, -7.696303367614746, -7.262896537780762, -6.829489707946777, -6.396081924438477, -5.962675094604492, -5.52926778793335, -5.095860958099365, -4.662453651428223, -4.229046821594238, -3.795639991760254, -3.3622329235076904, -2.928825855255127, -2.4954187870025635, -2.06201171875, -1.6286048889160156, -1.1951978206634521, -0.7617907524108887, -0.3283839225769043, 0.10502314567565918, 0.5384302139282227, 0.9718372225761414, 1.40524423122406, 1.838651180267334, 2.2720582485198975, 2.705465316772461, 3.1388721466064453, 3.572279214859009, 4.005686283111572, 4.439093112945557, 4.872500419616699, 5.305907249450684, 5.739314079284668, 6.1727213859558105, 6.606128215789795, 7.0395355224609375, 7.472942352294922, 7.906349182128906, 8.33975601196289, 8.773162841796875, 9.206570625305176, 9.63997745513916, 10.073384284973145, 10.506791114807129, 10.94019889831543, 11.373605728149414, 11.807012557983398, 12.240419387817383, 12.673827171325684, 13.107234001159668, 13.540640830993652, 13.974047660827637, 14.407454490661621]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 5.0, 16.0, 40.0, 45.0, 59.0, 96.0, 152.0, 227.0, 385.0, 667.0, 955.0, 1637.0, 2792.0, 4650.0, 7459.0, 12433.0, 20787.0, 34527.0, 54061.0, 80160.0, 109541.0, 132070.0, 140615.0, 129961.0, 105171.0, 76659.0, 51513.0, 32296.0, 19748.0, 11809.0, 7120.0, 4188.0, 2538.0, 1557.0, 986.0, 583.0, 386.0, 248.0, 134.0, 102.0, 55.0, 39.0, 29.0, 16.0, 9.0, 13.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.453125, -10.130859375, -9.80859375, -9.486328125, -9.1640625, -8.841796875, -8.51953125, -8.197265625, -7.875, -7.552734375, -7.23046875, -6.908203125, -6.5859375, -6.263671875, -5.94140625, -5.619140625, -5.296875, -4.974609375, -4.65234375, -4.330078125, -4.0078125, -3.685546875, -3.36328125, -3.041015625, -2.71875, -2.396484375, -2.07421875, -1.751953125, -1.4296875, -1.107421875, -0.78515625, -0.462890625, -0.140625, 0.181640625, 0.50390625, 0.826171875, 1.1484375, 1.470703125, 1.79296875, 2.115234375, 2.4375, 2.759765625, 3.08203125, 3.404296875, 3.7265625, 4.048828125, 4.37109375, 4.693359375, 5.015625, 5.337890625, 5.66015625, 5.982421875, 6.3046875, 6.626953125, 6.94921875, 7.271484375, 7.59375, 7.916015625, 8.23828125, 8.560546875, 8.8828125, 9.205078125, 9.52734375, 9.849609375, 10.171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 9.0, 10.0, 8.0, 9.0, 17.0, 12.0, 14.0, 12.0, 30.0, 35.0, 25.0, 23.0, 25.0, 37.0, 34.0, 37.0, 42.0, 36.0, 44.0, 47.0, 42.0, 42.0, 46.0, 38.0, 40.0, 41.0, 30.0, 36.0, 30.0, 18.0, 17.0, 23.0, 10.0, 10.0, 13.0, 8.0, 10.0, 9.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.48388671875, -12.0849609375, -11.68603515625, -11.287109375, -10.88818359375, -10.4892578125, -10.09033203125, -9.69140625, -9.29248046875, -8.8935546875, -8.49462890625, -8.095703125, -7.69677734375, -7.2978515625, -6.89892578125, -6.5, -6.10107421875, -5.7021484375, -5.30322265625, -4.904296875, -4.50537109375, -4.1064453125, -3.70751953125, -3.30859375, -2.90966796875, -2.5107421875, -2.11181640625, -1.712890625, -1.31396484375, -0.9150390625, -0.51611328125, -0.1171875, 0.28173828125, 0.6806640625, 1.07958984375, 1.478515625, 1.87744140625, 2.2763671875, 2.67529296875, 3.07421875, 3.47314453125, 3.8720703125, 4.27099609375, 4.669921875, 5.06884765625, 5.4677734375, 5.86669921875, 6.265625, 6.66455078125, 7.0634765625, 7.46240234375, 7.861328125, 8.26025390625, 8.6591796875, 9.05810546875, 9.45703125, 9.85595703125, 10.2548828125, 10.65380859375, 11.052734375, 11.45166015625, 11.8505859375, 12.24951171875, 12.6484375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 32.0, 37.0, 52.0, 71.0, 123.0, 192.0, 294.0, 509.0, 786.0, 1241.0, 2112.0, 3422.0, 5399.0, 8812.0, 14613.0, 23472.0, 36676.0, 54177.0, 76879.0, 101085.0, 120328.0, 127710.0, 121907.0, 105005.0, 80935.0, 57687.0, 38806.0, 25404.0, 15651.0, 9753.0, 5896.0, 3708.0, 2234.0, 1335.0, 790.0, 522.0, 326.0, 196.0, 126.0, 86.0, 53.0, 34.0, 17.0, 13.0, 10.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0], "bins": [-9.4453125, -9.1553955078125, -8.865478515625, -8.5755615234375, -8.28564453125, -7.9957275390625, -7.705810546875, -7.4158935546875, -7.1259765625, -6.8360595703125, -6.546142578125, -6.2562255859375, -5.96630859375, -5.6763916015625, -5.386474609375, -5.0965576171875, -4.806640625, -4.5167236328125, -4.226806640625, -3.9368896484375, -3.64697265625, -3.3570556640625, -3.067138671875, -2.7772216796875, -2.4873046875, -2.1973876953125, -1.907470703125, -1.6175537109375, -1.32763671875, -1.0377197265625, -0.747802734375, -0.4578857421875, -0.16796875, 0.1219482421875, 0.411865234375, 0.7017822265625, 0.99169921875, 1.2816162109375, 1.571533203125, 1.8614501953125, 2.1513671875, 2.4412841796875, 2.731201171875, 3.0211181640625, 3.31103515625, 3.6009521484375, 3.890869140625, 4.1807861328125, 4.470703125, 4.7606201171875, 5.050537109375, 5.3404541015625, 5.63037109375, 5.9202880859375, 6.210205078125, 6.5001220703125, 6.7900390625, 7.0799560546875, 7.369873046875, 7.6597900390625, 7.94970703125, 8.2396240234375, 8.529541015625, 8.8194580078125, 9.109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 9.0, 7.0, 10.0, 19.0, 21.0, 29.0, 36.0, 33.0, 30.0, 25.0, 33.0, 34.0, 46.0, 42.0, 43.0, 49.0, 41.0, 48.0, 39.0, 36.0, 33.0, 38.0, 34.0, 21.0, 43.0, 33.0, 25.0, 20.0, 14.0, 12.0, 15.0, 8.0, 14.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.74609375, -7.49420166015625, -7.2423095703125, -6.99041748046875, -6.738525390625, -6.48663330078125, -6.2347412109375, -5.98284912109375, -5.73095703125, -5.47906494140625, -5.2271728515625, -4.97528076171875, -4.723388671875, -4.47149658203125, -4.2196044921875, -3.96771240234375, -3.7158203125, -3.46392822265625, -3.2120361328125, -2.96014404296875, -2.708251953125, -2.45635986328125, -2.2044677734375, -1.95257568359375, -1.70068359375, -1.44879150390625, -1.1968994140625, -0.94500732421875, -0.693115234375, -0.44122314453125, -0.1893310546875, 0.06256103515625, 0.314453125, 0.56634521484375, 0.8182373046875, 1.07012939453125, 1.322021484375, 1.57391357421875, 1.8258056640625, 2.07769775390625, 2.32958984375, 2.58148193359375, 2.8333740234375, 3.08526611328125, 3.337158203125, 3.58905029296875, 3.8409423828125, 4.09283447265625, 4.3447265625, 4.59661865234375, 4.8485107421875, 5.10040283203125, 5.352294921875, 5.60418701171875, 5.8560791015625, 6.10797119140625, 6.35986328125, 6.61175537109375, 6.8636474609375, 7.11553955078125, 7.367431640625, 7.61932373046875, 7.8712158203125, 8.12310791015625, 8.375]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 0.0, 5.0, 7.0, 13.0, 25.0, 32.0, 57.0, 81.0, 115.0, 204.0, 314.0, 462.0, 737.0, 1087.0, 1938.0, 3064.0, 5100.0, 8205.0, 13531.0, 22193.0, 35666.0, 54625.0, 80499.0, 108107.0, 130071.0, 137712.0, 127219.0, 103339.0, 76600.0, 51491.0, 33241.0, 20683.0, 12527.0, 7572.0, 4588.0, 2772.0, 1689.0, 1090.0, 671.0, 402.0, 300.0, 169.0, 124.0, 77.0, 58.0, 40.0, 26.0, 10.0, 10.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.324462890625, -2.24267578125, -2.160888671875, -2.0791015625, -1.997314453125, -1.91552734375, -1.833740234375, -1.751953125, -1.670166015625, -1.58837890625, -1.506591796875, -1.4248046875, -1.343017578125, -1.26123046875, -1.179443359375, -1.09765625, -1.015869140625, -0.93408203125, -0.852294921875, -0.7705078125, -0.688720703125, -0.60693359375, -0.525146484375, -0.443359375, -0.361572265625, -0.27978515625, -0.197998046875, -0.1162109375, -0.034423828125, 0.04736328125, 0.129150390625, 0.2109375, 0.292724609375, 0.37451171875, 0.456298828125, 0.5380859375, 0.619873046875, 0.70166015625, 0.783447265625, 0.865234375, 0.947021484375, 1.02880859375, 1.110595703125, 1.1923828125, 1.274169921875, 1.35595703125, 1.437744140625, 1.51953125, 1.601318359375, 1.68310546875, 1.764892578125, 1.8466796875, 1.928466796875, 2.01025390625, 2.092041015625, 2.173828125, 2.255615234375, 2.33740234375, 2.419189453125, 2.5009765625, 2.582763671875, 2.66455078125, 2.746337890625, 2.828125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 1.0, 7.0, 6.0, 11.0, 12.0, 9.0, 9.0, 15.0, 18.0, 30.0, 29.0, 37.0, 33.0, 32.0, 39.0, 49.0, 57.0, 52.0, 54.0, 46.0, 64.0, 52.0, 50.0, 50.0, 39.0, 26.0, 48.0, 15.0, 24.0, 18.0, 17.0, 12.0, 10.0, 7.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00029778480529785156, -0.0002890639007091522, -0.0002803429961204529, -0.00027162209153175354, -0.0002629011869430542, -0.00025418028235435486, -0.0002454593777656555, -0.00023673847317695618, -0.00022801756858825684, -0.0002192966639995575, -0.00021057575941085815, -0.0002018548548221588, -0.00019313395023345947, -0.00018441304564476013, -0.0001756921410560608, -0.00016697123646736145, -0.0001582503318786621, -0.00014952942728996277, -0.00014080852270126343, -0.0001320876181125641, -0.00012336671352386475, -0.0001146458089351654, -0.00010592490434646606, -9.720399975776672e-05, -8.848309516906738e-05, -7.976219058036804e-05, -7.10412859916687e-05, -6.232038140296936e-05, -5.359947681427002e-05, -4.487857222557068e-05, -3.615766763687134e-05, -2.7436763048171997e-05, -1.8715858459472656e-05, -9.994953870773315e-06, -1.2740492820739746e-06, 7.446855306625366e-06, 1.6167759895324707e-05, 2.4888664484024048e-05, 3.360956907272339e-05, 4.233047366142273e-05, 5.105137825012207e-05, 5.977228283882141e-05, 6.849318742752075e-05, 7.721409201622009e-05, 8.593499660491943e-05, 9.465590119361877e-05, 0.00010337680578231812, 0.00011209771037101746, 0.0001208186149597168, 0.00012953951954841614, 0.00013826042413711548, 0.00014698132872581482, 0.00015570223331451416, 0.0001644231379032135, 0.00017314404249191284, 0.00018186494708061218, 0.00019058585166931152, 0.00019930675625801086, 0.0002080276608467102, 0.00021674856543540955, 0.0002254694700241089, 0.00023419037461280823, 0.00024291127920150757, 0.0002516321837902069, 0.00026035308837890625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 16.0, 30.0, 32.0, 46.0, 61.0, 104.0, 169.0, 248.0, 380.0, 592.0, 913.0, 1442.0, 2386.0, 3941.0, 6398.0, 11126.0, 18591.0, 31059.0, 49011.0, 75856.0, 107639.0, 136353.0, 147956.0, 137762.0, 109490.0, 77160.0, 50676.0, 31457.0, 18830.0, 11446.0, 6733.0, 4076.0, 2418.0, 1524.0, 932.0, 568.0, 412.0, 247.0, 136.0, 107.0, 79.0, 58.0, 25.0, 29.0, 12.0, 5.0, 6.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0], "bins": [-3.134765625, -3.041259765625, -2.94775390625, -2.854248046875, -2.7607421875, -2.667236328125, -2.57373046875, -2.480224609375, -2.38671875, -2.293212890625, -2.19970703125, -2.106201171875, -2.0126953125, -1.919189453125, -1.82568359375, -1.732177734375, -1.638671875, -1.545166015625, -1.45166015625, -1.358154296875, -1.2646484375, -1.171142578125, -1.07763671875, -0.984130859375, -0.890625, -0.797119140625, -0.70361328125, -0.610107421875, -0.5166015625, -0.423095703125, -0.32958984375, -0.236083984375, -0.142578125, -0.049072265625, 0.04443359375, 0.137939453125, 0.2314453125, 0.324951171875, 0.41845703125, 0.511962890625, 0.60546875, 0.698974609375, 0.79248046875, 0.885986328125, 0.9794921875, 1.072998046875, 1.16650390625, 1.260009765625, 1.353515625, 1.447021484375, 1.54052734375, 1.634033203125, 1.7275390625, 1.821044921875, 1.91455078125, 2.008056640625, 2.1015625, 2.195068359375, 2.28857421875, 2.382080078125, 2.4755859375, 2.569091796875, 2.66259765625, 2.756103515625, 2.849609375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 2.0, 4.0, 5.0, 4.0, 10.0, 4.0, 12.0, 13.0, 16.0, 26.0, 24.0, 38.0, 39.0, 31.0, 38.0, 57.0, 57.0, 49.0, 57.0, 57.0, 55.0, 43.0, 51.0, 45.0, 37.0, 39.0, 26.0, 36.0, 27.0, 15.0, 22.0, 16.0, 12.0, 11.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.33203125, -1.2878570556640625, -1.243682861328125, -1.1995086669921875, -1.15533447265625, -1.1111602783203125, -1.066986083984375, -1.0228118896484375, -0.9786376953125, -0.9344635009765625, -0.890289306640625, -0.8461151123046875, -0.80194091796875, -0.7577667236328125, -0.713592529296875, -0.6694183349609375, -0.625244140625, -0.5810699462890625, -0.536895751953125, -0.4927215576171875, -0.44854736328125, -0.4043731689453125, -0.360198974609375, -0.3160247802734375, -0.2718505859375, -0.2276763916015625, -0.183502197265625, -0.1393280029296875, -0.09515380859375, -0.0509796142578125, -0.006805419921875, 0.0373687744140625, 0.08154296875, 0.1257171630859375, 0.169891357421875, 0.2140655517578125, 0.25823974609375, 0.3024139404296875, 0.346588134765625, 0.3907623291015625, 0.4349365234375, 0.4791107177734375, 0.523284912109375, 0.5674591064453125, 0.61163330078125, 0.6558074951171875, 0.699981689453125, 0.7441558837890625, 0.788330078125, 0.8325042724609375, 0.876678466796875, 0.9208526611328125, 0.96502685546875, 1.0092010498046875, 1.053375244140625, 1.0975494384765625, 1.1417236328125, 1.1858978271484375, 1.230072021484375, 1.2742462158203125, 1.31842041015625, 1.3625946044921875, 1.406768798828125, 1.4509429931640625, 1.4951171875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 1.0, 5.0, 5.0, 5.0, 16.0, 10.0, 13.0, 25.0, 22.0, 26.0, 28.0, 19.0, 29.0, 50.0, 35.0, 40.0, 48.0, 48.0, 52.0, 42.0, 47.0, 46.0, 29.0, 44.0, 43.0, 33.0, 27.0, 28.0, 27.0, 22.0, 24.0, 21.0, 14.0, 26.0, 9.0, 4.0, 7.0, 5.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.57022762298584, -8.250162124633789, -7.930095672607422, -7.610029697418213, -7.289963722229004, -6.969898223876953, -6.649832248687744, -6.329766273498535, -6.009700298309326, -5.689634323120117, -5.369568347930908, -5.049502372741699, -4.729436874389648, -4.409370422363281, -4.0893049240112305, -3.7692389488220215, -3.4491729736328125, -3.1291069984436035, -2.8090410232543945, -2.4889752864837646, -2.1689093112945557, -1.8488433361053467, -1.5287774801254272, -1.2087116241455078, -0.8886456489562988, -0.5685797333717346, -0.2485138177871704, 0.0715520977973938, 0.391618013381958, 0.711683988571167, 1.0317498445510864, 1.3518157005310059, 1.6718807220458984, 1.9919466972351074, 2.3120126724243164, 2.6320784091949463, 2.9521443843841553, 3.2722103595733643, 3.592276096343994, 3.912342071533203, 4.232408046722412, 4.552474021911621, 4.87253999710083, 5.192605972290039, 5.51267147064209, 5.832737922668457, 6.152803421020508, 6.472869396209717, 6.792935371398926, 7.113001346588135, 7.433067321777344, 7.753133296966553, 8.073199272155762, 8.393264770507812, 8.71333122253418, 9.03339672088623, 9.353462219238281, 9.673527717590332, 9.9935941696167, 10.31365966796875, 10.633726119995117, 10.953791618347168, 11.273858070373535, 11.593923568725586, 11.913990020751953]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 8.0, 5.0, 10.0, 16.0, 26.0, 22.0, 28.0, 37.0, 22.0, 19.0, 38.0, 33.0, 28.0, 36.0, 40.0, 41.0, 38.0, 44.0, 35.0, 33.0, 32.0, 27.0, 44.0, 44.0, 45.0, 36.0, 23.0, 33.0, 21.0, 27.0, 16.0, 27.0, 7.0, 6.0, 10.0, 7.0, 2.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.495716094970703, -12.075135231018066, -11.65455436706543, -11.233973503112793, -10.813392639160156, -10.392810821533203, -9.972229957580566, -9.55164909362793, -9.131068229675293, -8.710487365722656, -8.28990650177002, -7.869325160980225, -7.448744297027588, -7.028163433074951, -6.607582092285156, -6.1870012283325195, -5.766420364379883, -5.345839500427246, -4.925258636474609, -4.5046772956848145, -4.084096431732178, -3.663515567779541, -3.242934465408325, -2.8223533630371094, -2.4017724990844727, -1.9811915159225464, -1.5606105327606201, -1.1400295495986938, -0.7194485664367676, -0.29886770248413086, 0.12171339988708496, 0.5422945022583008, 0.9628744125366211, 1.3834553956985474, 1.8040363788604736, 2.2246174812316895, 2.645198345184326, 3.065779209136963, 3.4863603115081787, 3.9069414138793945, 4.327522277832031, 4.748103141784668, 5.168684005737305, 5.5892653465271, 6.009846210479736, 6.430427074432373, 6.851008415222168, 7.271589279174805, 7.692170143127441, 8.112751007080078, 8.533331871032715, 8.953912734985352, 9.374494552612305, 9.795074462890625, 10.215656280517578, 10.636237144470215, 11.056818008422852, 11.477398872375488, 11.897979736328125, 12.318560600280762, 12.739141464233398, 13.159723281860352, 13.580304145812988, 14.000885009765625, 14.421465873718262]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 9.0, 15.0, 24.0, 36.0, 39.0, 86.0, 120.0, 182.0, 299.0, 418.0, 649.0, 958.0, 1508.0, 2272.0, 3461.0, 5227.0, 8100.0, 12467.0, 19144.0, 29351.0, 45689.0, 70089.0, 107376.0, 161433.0, 237401.0, 332772.0, 434013.0, 508486.0, 523372.0, 471382.0, 378138.0, 278568.0, 192241.0, 128529.0, 85031.0, 54692.0, 35404.0, 23205.0, 15006.0, 9532.0, 6127.0, 3945.0, 2562.0, 1623.0, 1126.0, 742.0, 493.0, 327.0, 201.0, 145.0, 104.0, 47.0, 48.0, 27.0, 19.0, 18.0, 9.0, 2.0, 3.0, 1.0], "bins": [-8.2890625, -8.03173828125, -7.7744140625, -7.51708984375, -7.259765625, -7.00244140625, -6.7451171875, -6.48779296875, -6.23046875, -5.97314453125, -5.7158203125, -5.45849609375, -5.201171875, -4.94384765625, -4.6865234375, -4.42919921875, -4.171875, -3.91455078125, -3.6572265625, -3.39990234375, -3.142578125, -2.88525390625, -2.6279296875, -2.37060546875, -2.11328125, -1.85595703125, -1.5986328125, -1.34130859375, -1.083984375, -0.82666015625, -0.5693359375, -0.31201171875, -0.0546875, 0.20263671875, 0.4599609375, 0.71728515625, 0.974609375, 1.23193359375, 1.4892578125, 1.74658203125, 2.00390625, 2.26123046875, 2.5185546875, 2.77587890625, 3.033203125, 3.29052734375, 3.5478515625, 3.80517578125, 4.0625, 4.31982421875, 4.5771484375, 4.83447265625, 5.091796875, 5.34912109375, 5.6064453125, 5.86376953125, 6.12109375, 6.37841796875, 6.6357421875, 6.89306640625, 7.150390625, 7.40771484375, 7.6650390625, 7.92236328125, 8.1796875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 2.0, 9.0, 4.0, 10.0, 15.0, 19.0, 14.0, 14.0, 19.0, 33.0, 31.0, 23.0, 26.0, 29.0, 30.0, 30.0, 36.0, 38.0, 34.0, 40.0, 43.0, 32.0, 36.0, 34.0, 32.0, 22.0, 31.0, 40.0, 39.0, 43.0, 23.0, 25.0, 21.0, 25.0, 13.0, 15.0, 14.0, 11.0, 5.0, 4.0, 6.0, 6.0, 5.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.390625, -9.0950927734375, -8.799560546875, -8.5040283203125, -8.20849609375, -7.9129638671875, -7.617431640625, -7.3218994140625, -7.0263671875, -6.7308349609375, -6.435302734375, -6.1397705078125, -5.84423828125, -5.5487060546875, -5.253173828125, -4.9576416015625, -4.662109375, -4.3665771484375, -4.071044921875, -3.7755126953125, -3.47998046875, -3.1844482421875, -2.888916015625, -2.5933837890625, -2.2978515625, -2.0023193359375, -1.706787109375, -1.4112548828125, -1.11572265625, -0.8201904296875, -0.524658203125, -0.2291259765625, 0.06640625, 0.3619384765625, 0.657470703125, 0.9530029296875, 1.24853515625, 1.5440673828125, 1.839599609375, 2.1351318359375, 2.4306640625, 2.7261962890625, 3.021728515625, 3.3172607421875, 3.61279296875, 3.9083251953125, 4.203857421875, 4.4993896484375, 4.794921875, 5.0904541015625, 5.385986328125, 5.6815185546875, 5.97705078125, 6.2725830078125, 6.568115234375, 6.8636474609375, 7.1591796875, 7.4547119140625, 7.750244140625, 8.0457763671875, 8.34130859375, 8.6368408203125, 8.932373046875, 9.2279052734375, 9.5234375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 10.0, 22.0, 15.0, 48.0, 76.0, 106.0, 174.0, 295.0, 467.0, 728.0, 1239.0, 2031.0, 3190.0, 5252.0, 8770.0, 14104.0, 23177.0, 37010.0, 58577.0, 90397.0, 135803.0, 194506.0, 267869.0, 342512.0, 412211.0, 454753.0, 459379.0, 423204.0, 356973.0, 280738.0, 207383.0, 145765.0, 97611.0, 63415.0, 40669.0, 25438.0, 15819.0, 9638.0, 5793.0, 3604.0, 2069.0, 1292.0, 843.0, 506.0, 312.0, 204.0, 90.0, 81.0, 45.0, 28.0, 15.0, 10.0, 7.0, 4.0, 5.0, 4.0, 4.0], "bins": [-7.80078125, -7.5650634765625, -7.329345703125, -7.0936279296875, -6.85791015625, -6.6221923828125, -6.386474609375, -6.1507568359375, -5.9150390625, -5.6793212890625, -5.443603515625, -5.2078857421875, -4.97216796875, -4.7364501953125, -4.500732421875, -4.2650146484375, -4.029296875, -3.7935791015625, -3.557861328125, -3.3221435546875, -3.08642578125, -2.8507080078125, -2.614990234375, -2.3792724609375, -2.1435546875, -1.9078369140625, -1.672119140625, -1.4364013671875, -1.20068359375, -0.9649658203125, -0.729248046875, -0.4935302734375, -0.2578125, -0.0220947265625, 0.213623046875, 0.4493408203125, 0.68505859375, 0.9207763671875, 1.156494140625, 1.3922119140625, 1.6279296875, 1.8636474609375, 2.099365234375, 2.3350830078125, 2.57080078125, 2.8065185546875, 3.042236328125, 3.2779541015625, 3.513671875, 3.7493896484375, 3.985107421875, 4.2208251953125, 4.45654296875, 4.6922607421875, 4.927978515625, 5.1636962890625, 5.3994140625, 5.6351318359375, 5.870849609375, 6.1065673828125, 6.34228515625, 6.5780029296875, 6.813720703125, 7.0494384765625, 7.28515625]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 10.0, 9.0, 12.0, 11.0, 16.0, 30.0, 29.0, 34.0, 57.0, 64.0, 77.0, 88.0, 106.0, 143.0, 176.0, 173.0, 194.0, 221.0, 221.0, 227.0, 223.0, 243.0, 257.0, 216.0, 189.0, 191.0, 161.0, 110.0, 113.0, 93.0, 80.0, 71.0, 51.0, 39.0, 22.0, 28.0, 20.0, 8.0, 12.0, 12.0, 10.0, 9.0, 5.0, 7.0, 5.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-5.4765625, -5.31927490234375, -5.1619873046875, -5.00469970703125, -4.847412109375, -4.69012451171875, -4.5328369140625, -4.37554931640625, -4.21826171875, -4.06097412109375, -3.9036865234375, -3.74639892578125, -3.589111328125, -3.43182373046875, -3.2745361328125, -3.11724853515625, -2.9599609375, -2.80267333984375, -2.6453857421875, -2.48809814453125, -2.330810546875, -2.17352294921875, -2.0162353515625, -1.85894775390625, -1.70166015625, -1.54437255859375, -1.3870849609375, -1.22979736328125, -1.072509765625, -0.91522216796875, -0.7579345703125, -0.60064697265625, -0.443359375, -0.28607177734375, -0.1287841796875, 0.02850341796875, 0.185791015625, 0.34307861328125, 0.5003662109375, 0.65765380859375, 0.81494140625, 0.97222900390625, 1.1295166015625, 1.28680419921875, 1.444091796875, 1.60137939453125, 1.7586669921875, 1.91595458984375, 2.0732421875, 2.23052978515625, 2.3878173828125, 2.54510498046875, 2.702392578125, 2.85968017578125, 3.0169677734375, 3.17425537109375, 3.33154296875, 3.48883056640625, 3.6461181640625, 3.80340576171875, 3.960693359375, 4.11798095703125, 4.2752685546875, 4.43255615234375, 4.58984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 13.0, 13.0, 8.0, 20.0, 15.0, 18.0, 21.0, 45.0, 43.0, 43.0, 45.0, 42.0, 47.0, 43.0, 40.0, 44.0, 36.0, 60.0, 29.0, 49.0, 39.0, 19.0, 44.0, 28.0, 36.0, 28.0, 19.0, 24.0, 17.0, 13.0, 12.0, 5.0, 11.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.597051620483398, -9.288947105407715, -8.980842590332031, -8.672738075256348, -8.364633560180664, -8.056528091430664, -7.7484235763549805, -7.440319061279297, -7.132214546203613, -6.82411003112793, -6.516005516052246, -6.207900524139404, -5.899796009063721, -5.591691493988037, -5.283586502075195, -4.975481986999512, -4.667377471923828, -4.3592729568481445, -4.051168441772461, -3.743063449859619, -3.4349589347839355, -3.126854419708252, -2.8187496662139893, -2.5106449127197266, -2.202540397644043, -1.8944357633590698, -1.5863311290740967, -1.2782264947891235, -0.9701218605041504, -0.6620172262191772, -0.3539125919342041, -0.045807838439941406, 0.2622976303100586, 0.5704022645950317, 0.8785068988800049, 1.186611533164978, 1.4947161674499512, 1.8028208017349243, 2.1109254360198975, 2.41903018951416, 2.7271347045898438, 3.0352392196655273, 3.34334397315979, 3.6514487266540527, 3.9595532417297363, 4.26765775680542, 4.575762748718262, 4.883867263793945, 5.191971778869629, 5.5000762939453125, 5.808180809020996, 6.116285800933838, 6.4243903160095215, 6.732494831085205, 7.040599822998047, 7.3487043380737305, 7.656808853149414, 7.964913368225098, 8.273017883300781, 8.581122398376465, 8.889226913452148, 9.197332382202148, 9.505436897277832, 9.813541412353516, 10.1216459274292]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 2.0, 8.0, 8.0, 7.0, 19.0, 14.0, 16.0, 14.0, 30.0, 24.0, 23.0, 36.0, 35.0, 37.0, 38.0, 39.0, 38.0, 26.0, 44.0, 43.0, 38.0, 42.0, 34.0, 56.0, 42.0, 38.0, 41.0, 31.0, 30.0, 27.0, 22.0, 20.0, 16.0, 14.0, 10.0, 12.0, 8.0, 3.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.517653465270996, -11.1144437789917, -10.711235046386719, -10.308025360107422, -9.904815673828125, -9.501605987548828, -9.098396301269531, -8.69518756866455, -8.291977882385254, -7.888768196105957, -7.485558986663818, -7.08234977722168, -6.679140090942383, -6.275930404663086, -5.872721195220947, -5.469511985778809, -5.066302299499512, -4.663092613220215, -4.259883403778076, -3.8566739559173584, -3.4534645080566406, -3.050255060195923, -2.647045612335205, -2.2438361644744873, -1.8406267166137695, -1.4374172687530518, -1.034207820892334, -0.6309983730316162, -0.22778892517089844, 0.17542052268981934, 0.5786299705505371, 0.9818394184112549, 1.385049819946289, 1.7882592678070068, 2.1914687156677246, 2.5946781635284424, 2.99788761138916, 3.401097059249878, 3.8043065071105957, 4.207515716552734, 4.610725402832031, 5.013935089111328, 5.417144298553467, 5.8203535079956055, 6.223563194274902, 6.626772880554199, 7.029982089996338, 7.433191299438477, 7.836400985717773, 8.23961067199707, 8.642820358276367, 9.046029090881348, 9.449238777160645, 9.852448463439941, 10.255657196044922, 10.658866882324219, 11.062076568603516, 11.465286254882812, 11.86849594116211, 12.27170467376709, 12.674914360046387, 13.078124046325684, 13.481332778930664, 13.884542465209961, 14.287752151489258]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 13.0, 15.0, 14.0, 25.0, 48.0, 50.0, 77.0, 118.0, 188.0, 269.0, 368.0, 566.0, 833.0, 1270.0, 1913.0, 2833.0, 4380.0, 6779.0, 10560.0, 17336.0, 27498.0, 45083.0, 73921.0, 120296.0, 178775.0, 191962.0, 137707.0, 86448.0, 52518.0, 32124.0, 19632.0, 12288.0, 7779.0, 5042.0, 3200.0, 2111.0, 1487.0, 995.0, 612.0, 446.0, 303.0, 206.0, 138.0, 109.0, 69.0, 56.0, 30.0, 19.0, 19.0, 11.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.248046875, -2.178131103515625, -2.10821533203125, -2.038299560546875, -1.9683837890625, -1.898468017578125, -1.82855224609375, -1.758636474609375, -1.688720703125, -1.618804931640625, -1.54888916015625, -1.478973388671875, -1.4090576171875, -1.339141845703125, -1.26922607421875, -1.199310302734375, -1.12939453125, -1.059478759765625, -0.98956298828125, -0.919647216796875, -0.8497314453125, -0.779815673828125, -0.70989990234375, -0.639984130859375, -0.570068359375, -0.500152587890625, -0.43023681640625, -0.360321044921875, -0.2904052734375, -0.220489501953125, -0.15057373046875, -0.080657958984375, -0.0107421875, 0.059173583984375, 0.12908935546875, 0.199005126953125, 0.2689208984375, 0.338836669921875, 0.40875244140625, 0.478668212890625, 0.548583984375, 0.618499755859375, 0.68841552734375, 0.758331298828125, 0.8282470703125, 0.898162841796875, 0.96807861328125, 1.037994384765625, 1.10791015625, 1.177825927734375, 1.24774169921875, 1.317657470703125, 1.3875732421875, 1.457489013671875, 1.52740478515625, 1.597320556640625, 1.667236328125, 1.737152099609375, 1.80706787109375, 1.876983642578125, 1.9468994140625, 2.016815185546875, 2.08673095703125, 2.156646728515625, 2.2265625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 11.0, 5.0, 12.0, 9.0, 19.0, 18.0, 17.0, 21.0, 19.0, 22.0, 37.0, 35.0, 30.0, 35.0, 34.0, 42.0, 38.0, 30.0, 41.0, 49.0, 41.0, 38.0, 46.0, 46.0, 37.0, 35.0, 31.0, 31.0, 23.0, 25.0, 32.0, 20.0, 13.0, 8.0, 8.0, 17.0, 4.0, 11.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1328125, -10.7265625, -10.3203125, -9.9140625, -9.5078125, -9.1015625, -8.6953125, -8.2890625, -7.8828125, -7.4765625, -7.0703125, -6.6640625, -6.2578125, -5.8515625, -5.4453125, -5.0390625, -4.6328125, -4.2265625, -3.8203125, -3.4140625, -3.0078125, -2.6015625, -2.1953125, -1.7890625, -1.3828125, -0.9765625, -0.5703125, -0.1640625, 0.2421875, 0.6484375, 1.0546875, 1.4609375, 1.8671875, 2.2734375, 2.6796875, 3.0859375, 3.4921875, 3.8984375, 4.3046875, 4.7109375, 5.1171875, 5.5234375, 5.9296875, 6.3359375, 6.7421875, 7.1484375, 7.5546875, 7.9609375, 8.3671875, 8.7734375, 9.1796875, 9.5859375, 9.9921875, 10.3984375, 10.8046875, 11.2109375, 11.6171875, 12.0234375, 12.4296875, 12.8359375, 13.2421875, 13.6484375, 14.0546875, 14.4609375, 14.8671875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 12.0, 8.0, 14.0, 14.0, 24.0, 25.0, 40.0, 59.0, 72.0, 105.0, 129.0, 155.0, 252.0, 393.0, 529.0, 813.0, 1345.0, 2548.0, 5338.0, 13563.0, 41240.0, 906480.0, 47172.0, 15388.0, 5888.0, 2705.0, 1432.0, 864.0, 582.0, 396.0, 278.0, 169.0, 140.0, 101.0, 82.0, 58.0, 34.0, 23.0, 27.0, 15.0, 10.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.4609375, -8.2010498046875, -7.941162109375, -7.6812744140625, -7.42138671875, -7.1614990234375, -6.901611328125, -6.6417236328125, -6.3818359375, -6.1219482421875, -5.862060546875, -5.6021728515625, -5.34228515625, -5.0823974609375, -4.822509765625, -4.5626220703125, -4.302734375, -4.0428466796875, -3.782958984375, -3.5230712890625, -3.26318359375, -3.0032958984375, -2.743408203125, -2.4835205078125, -2.2236328125, -1.9637451171875, -1.703857421875, -1.4439697265625, -1.18408203125, -0.9241943359375, -0.664306640625, -0.4044189453125, -0.14453125, 0.1153564453125, 0.375244140625, 0.6351318359375, 0.89501953125, 1.1549072265625, 1.414794921875, 1.6746826171875, 1.9345703125, 2.1944580078125, 2.454345703125, 2.7142333984375, 2.97412109375, 3.2340087890625, 3.493896484375, 3.7537841796875, 4.013671875, 4.2735595703125, 4.533447265625, 4.7933349609375, 5.05322265625, 5.3131103515625, 5.572998046875, 5.8328857421875, 6.0927734375, 6.3526611328125, 6.612548828125, 6.8724365234375, 7.13232421875, 7.3922119140625, 7.652099609375, 7.9119873046875, 8.171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 13.0, 12.0, 12.0, 10.0, 21.0, 17.0, 23.0, 31.0, 24.0, 25.0, 29.0, 39.0, 28.0, 34.0, 37.0, 44.0, 42.0, 39.0, 40.0, 34.0, 37.0, 35.0, 36.0, 23.0, 31.0, 32.0, 39.0, 26.0, 20.0, 24.0, 18.0, 20.0, 18.0, 12.0, 14.0, 11.0, 4.0, 9.0, 5.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-8.4375, -8.18450927734375, -7.9315185546875, -7.67852783203125, -7.425537109375, -7.17254638671875, -6.9195556640625, -6.66656494140625, -6.41357421875, -6.16058349609375, -5.9075927734375, -5.65460205078125, -5.401611328125, -5.14862060546875, -4.8956298828125, -4.64263916015625, -4.3896484375, -4.13665771484375, -3.8836669921875, -3.63067626953125, -3.377685546875, -3.12469482421875, -2.8717041015625, -2.61871337890625, -2.36572265625, -2.11273193359375, -1.8597412109375, -1.60675048828125, -1.353759765625, -1.10076904296875, -0.8477783203125, -0.59478759765625, -0.341796875, -0.08880615234375, 0.1641845703125, 0.41717529296875, 0.670166015625, 0.92315673828125, 1.1761474609375, 1.42913818359375, 1.68212890625, 1.93511962890625, 2.1881103515625, 2.44110107421875, 2.694091796875, 2.94708251953125, 3.2000732421875, 3.45306396484375, 3.7060546875, 3.95904541015625, 4.2120361328125, 4.46502685546875, 4.718017578125, 4.97100830078125, 5.2239990234375, 5.47698974609375, 5.72998046875, 5.98297119140625, 6.2359619140625, 6.48895263671875, 6.741943359375, 6.99493408203125, 7.2479248046875, 7.50091552734375, 7.75390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 17.0, 24.0, 22.0, 44.0, 32.0, 50.0, 93.0, 106.0, 207.0, 279.0, 387.0, 612.0, 959.0, 1767.0, 3725.0, 9191.0, 34882.0, 947337.0, 31984.0, 8793.0, 3508.0, 1759.0, 956.0, 594.0, 345.0, 253.0, 172.0, 120.0, 90.0, 67.0, 52.0, 35.0, 25.0, 18.0, 9.0, 10.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2160797119140625, -1.173370361328125, -1.1306610107421875, -1.08795166015625, -1.0452423095703125, -1.002532958984375, -0.9598236083984375, -0.9171142578125, -0.8744049072265625, -0.831695556640625, -0.7889862060546875, -0.74627685546875, -0.7035675048828125, -0.660858154296875, -0.6181488037109375, -0.575439453125, -0.5327301025390625, -0.490020751953125, -0.4473114013671875, -0.40460205078125, -0.3618927001953125, -0.319183349609375, -0.2764739990234375, -0.2337646484375, -0.1910552978515625, -0.148345947265625, -0.1056365966796875, -0.06292724609375, -0.0202178955078125, 0.022491455078125, 0.0652008056640625, 0.10791015625, 0.1506195068359375, 0.193328857421875, 0.2360382080078125, 0.27874755859375, 0.3214569091796875, 0.364166259765625, 0.4068756103515625, 0.4495849609375, 0.4922943115234375, 0.535003662109375, 0.5777130126953125, 0.62042236328125, 0.6631317138671875, 0.705841064453125, 0.7485504150390625, 0.791259765625, 0.8339691162109375, 0.876678466796875, 0.9193878173828125, 0.96209716796875, 1.0048065185546875, 1.047515869140625, 1.0902252197265625, 1.1329345703125, 1.1756439208984375, 1.218353271484375, 1.2610626220703125, 1.30377197265625, 1.3464813232421875, 1.389190673828125, 1.4319000244140625, 1.474609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 4.0, 5.0, 11.0, 14.0, 18.0, 16.0, 20.0, 20.0, 30.0, 25.0, 39.0, 40.0, 57.0, 49.0, 35.0, 62.0, 62.0, 52.0, 64.0, 44.0, 45.0, 48.0, 43.0, 39.0, 29.0, 17.0, 17.0, 11.0, 21.0, 10.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.510185241699219e-06, -7.209368050098419e-06, -6.90855085849762e-06, -6.60773366689682e-06, -6.3069164752960205e-06, -6.006099283695221e-06, -5.705282092094421e-06, -5.404464900493622e-06, -5.103647708892822e-06, -4.802830517292023e-06, -4.502013325691223e-06, -4.201196134090424e-06, -3.900378942489624e-06, -3.5995617508888245e-06, -3.298744559288025e-06, -2.9979273676872253e-06, -2.6971101760864258e-06, -2.3962929844856262e-06, -2.0954757928848267e-06, -1.794658601284027e-06, -1.4938414096832275e-06, -1.193024218082428e-06, -8.922070264816284e-07, -5.913898348808289e-07, -2.905726432800293e-07, 1.0244548320770264e-08, 3.110617399215698e-07, 6.118789315223694e-07, 9.126961231231689e-07, 1.2135133147239685e-06, 1.514330506324768e-06, 1.8151476979255676e-06, 2.115964889526367e-06, 2.4167820811271667e-06, 2.7175992727279663e-06, 3.018416464328766e-06, 3.3192336559295654e-06, 3.620050847530365e-06, 3.9208680391311646e-06, 4.221685230731964e-06, 4.522502422332764e-06, 4.823319613933563e-06, 5.124136805534363e-06, 5.424953997135162e-06, 5.725771188735962e-06, 6.0265883803367615e-06, 6.327405571937561e-06, 6.628222763538361e-06, 6.92903995513916e-06, 7.22985714673996e-06, 7.530674338340759e-06, 7.831491529941559e-06, 8.132308721542358e-06, 8.433125913143158e-06, 8.733943104743958e-06, 9.034760296344757e-06, 9.335577487945557e-06, 9.636394679546356e-06, 9.937211871147156e-06, 1.0238029062747955e-05, 1.0538846254348755e-05, 1.0839663445949554e-05, 1.1140480637550354e-05, 1.1441297829151154e-05, 1.1742115020751953e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 7.0, 11.0, 17.0, 13.0, 34.0, 36.0, 51.0, 101.0, 153.0, 227.0, 387.0, 641.0, 1019.0, 1775.0, 3119.0, 5260.0, 8898.0, 15601.0, 27860.0, 50506.0, 103881.0, 291075.0, 309466.0, 108679.0, 52616.0, 28321.0, 16303.0, 9351.0, 5368.0, 3161.0, 1801.0, 1096.0, 680.0, 369.0, 229.0, 140.0, 97.0, 74.0, 35.0, 37.0, 14.0, 16.0, 11.0, 9.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.481689453125, -0.4638671875, -0.446044921875, -0.42822265625, -0.410400390625, -0.392578125, -0.374755859375, -0.35693359375, -0.339111328125, -0.3212890625, -0.303466796875, -0.28564453125, -0.267822265625, -0.25, -0.232177734375, -0.21435546875, -0.196533203125, -0.1787109375, -0.160888671875, -0.14306640625, -0.125244140625, -0.107421875, -0.089599609375, -0.07177734375, -0.053955078125, -0.0361328125, -0.018310546875, -0.00048828125, 0.017333984375, 0.03515625, 0.052978515625, 0.07080078125, 0.088623046875, 0.1064453125, 0.124267578125, 0.14208984375, 0.159912109375, 0.177734375, 0.195556640625, 0.21337890625, 0.231201171875, 0.2490234375, 0.266845703125, 0.28466796875, 0.302490234375, 0.3203125, 0.338134765625, 0.35595703125, 0.373779296875, 0.3916015625, 0.409423828125, 0.42724609375, 0.445068359375, 0.462890625, 0.480712890625, 0.49853515625, 0.516357421875, 0.5341796875, 0.552001953125, 0.56982421875, 0.587646484375, 0.60546875, 0.623291015625, 0.64111328125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 10.0, 10.0, 10.0, 18.0, 13.0, 26.0, 26.0, 34.0, 27.0, 34.0, 44.0, 49.0, 53.0, 57.0, 69.0, 51.0, 54.0, 50.0, 62.0, 36.0, 34.0, 33.0, 41.0, 33.0, 26.0, 16.0, 25.0, 14.0, 12.0, 10.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.372802734375, -0.3611793518066406, -0.34955596923828125, -0.3379325866699219, -0.3263092041015625, -0.3146858215332031, -0.30306243896484375, -0.2914390563964844, -0.279815673828125, -0.2681922912597656, -0.25656890869140625, -0.24494552612304688, -0.2333221435546875, -0.22169876098632812, -0.21007537841796875, -0.19845199584960938, -0.18682861328125, -0.17520523071289062, -0.16358184814453125, -0.15195846557617188, -0.1403350830078125, -0.12871170043945312, -0.11708831787109375, -0.10546493530273438, -0.093841552734375, -0.08221817016601562, -0.07059478759765625, -0.058971405029296875, -0.0473480224609375, -0.035724639892578125, -0.02410125732421875, -0.012477874755859375, -0.0008544921875, 0.010768890380859375, 0.02239227294921875, 0.034015655517578125, 0.0456390380859375, 0.057262420654296875, 0.06888580322265625, 0.08050918579101562, 0.092132568359375, 0.10375595092773438, 0.11537933349609375, 0.12700271606445312, 0.1386260986328125, 0.15024948120117188, 0.16187286376953125, 0.17349624633789062, 0.18511962890625, 0.19674301147460938, 0.20836639404296875, 0.21998977661132812, 0.2316131591796875, 0.24323654174804688, 0.25485992431640625, 0.2664833068847656, 0.278106689453125, 0.2897300720214844, 0.30135345458984375, 0.3129768371582031, 0.3246002197265625, 0.3362236022949219, 0.34784698486328125, 0.3594703674316406, 0.37109375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 11.0, 13.0, 14.0, 18.0, 16.0, 23.0, 23.0, 36.0, 47.0, 41.0, 42.0, 43.0, 52.0, 42.0, 38.0, 51.0, 40.0, 57.0, 26.0, 50.0, 38.0, 22.0, 44.0, 25.0, 39.0, 16.0, 23.0, 23.0, 24.0, 10.0, 13.0, 4.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.493256568908691, -9.185884475708008, -8.87851333618164, -8.571141242980957, -8.263769149780273, -7.95639705657959, -7.6490254402160645, -7.341653823852539, -7.0342817306518555, -6.726909637451172, -6.4195380210876465, -6.112166404724121, -5.8047943115234375, -5.497422218322754, -5.1900506019592285, -4.882678985595703, -4.5753068923950195, -4.267934799194336, -3.9605631828308105, -3.653191328048706, -3.3458194732666016, -3.038447618484497, -2.7310757637023926, -2.423703908920288, -2.1163320541381836, -1.808960199356079, -1.5015883445739746, -1.1942164897918701, -0.8868446350097656, -0.5794727802276611, -0.27210092544555664, 0.03527092933654785, 0.34264278411865234, 0.6500146389007568, 0.9573864936828613, 1.2647583484649658, 1.5721302032470703, 1.8795020580291748, 2.1868739128112793, 2.494245767593384, 2.8016176223754883, 3.1089894771575928, 3.4163613319396973, 3.7237331867218018, 4.031105041503906, 4.33847713470459, 4.645848751068115, 4.953220367431641, 5.260592460632324, 5.567964553833008, 5.875336170196533, 6.182707786560059, 6.490079879760742, 6.797451972961426, 7.104823589324951, 7.412195205688477, 7.71956729888916, 8.026939392089844, 8.334310531616211, 8.641682624816895, 8.949054718017578, 9.256426811218262, 9.563798904418945, 9.871170043945312, 10.178542137145996]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 9.0, 9.0, 17.0, 16.0, 13.0, 16.0, 32.0, 22.0, 21.0, 35.0, 35.0, 38.0, 35.0, 46.0, 36.0, 28.0, 40.0, 44.0, 30.0, 48.0, 37.0, 49.0, 43.0, 40.0, 41.0, 28.0, 31.0, 30.0, 22.0, 20.0, 13.0, 17.0, 12.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.424667358398438, -11.027074813842773, -10.62948226928711, -10.231889724731445, -9.834298133850098, -9.436705589294434, -9.03911304473877, -8.641520500183105, -8.243928909301758, -7.846336364746094, -7.448744297027588, -7.051151752471924, -6.653559684753418, -6.255967140197754, -5.85837459564209, -5.460782051086426, -5.063189506530762, -4.665596961975098, -4.268004894256592, -3.8704123497009277, -3.4728200435638428, -3.075227737426758, -2.6776351928710938, -2.280042886734009, -1.8824505805969238, -1.4848582744598389, -1.0872658491134644, -0.6896734237670898, -0.2920811176300049, 0.10551118850708008, 0.5031037330627441, 0.9006960391998291, 1.298288345336914, 1.695880651473999, 2.093472957611084, 2.491065502166748, 2.888657808303833, 3.286250114440918, 3.683842658996582, 4.081435203552246, 4.479027271270752, 4.876619815826416, 5.274211883544922, 5.671804428100586, 6.06939697265625, 6.466989040374756, 6.86458158493042, 7.262173652648926, 7.65976619720459, 8.057358741760254, 8.454951286315918, 8.852542877197266, 9.25013542175293, 9.647727966308594, 10.045320510864258, 10.442913055419922, 10.840505599975586, 11.23809814453125, 11.635690689086914, 12.033283233642578, 12.430874824523926, 12.82846736907959, 13.226059913635254, 13.623652458190918, 14.021244049072266]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 15.0, 19.0, 26.0, 33.0, 56.0, 105.0, 145.0, 229.0, 323.0, 568.0, 856.0, 1326.0, 2058.0, 3354.0, 5261.0, 7934.0, 12640.0, 19527.0, 29428.0, 42847.0, 60557.0, 80536.0, 99569.0, 112918.0, 117263.0, 110485.0, 94899.0, 74987.0, 55576.0, 39353.0, 26777.0, 17434.0, 11375.0, 7185.0, 4843.0, 2986.0, 1826.0, 1161.0, 766.0, 472.0, 288.0, 194.0, 130.0, 78.0, 54.0, 33.0, 24.0, 11.0, 6.0, 12.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.5546875, -7.32135009765625, -7.0880126953125, -6.85467529296875, -6.621337890625, -6.38800048828125, -6.1546630859375, -5.92132568359375, -5.68798828125, -5.45465087890625, -5.2213134765625, -4.98797607421875, -4.754638671875, -4.52130126953125, -4.2879638671875, -4.05462646484375, -3.8212890625, -3.58795166015625, -3.3546142578125, -3.12127685546875, -2.887939453125, -2.65460205078125, -2.4212646484375, -2.18792724609375, -1.95458984375, -1.72125244140625, -1.4879150390625, -1.25457763671875, -1.021240234375, -0.78790283203125, -0.5545654296875, -0.32122802734375, -0.087890625, 0.14544677734375, 0.3787841796875, 0.61212158203125, 0.845458984375, 1.07879638671875, 1.3121337890625, 1.54547119140625, 1.77880859375, 2.01214599609375, 2.2454833984375, 2.47882080078125, 2.712158203125, 2.94549560546875, 3.1788330078125, 3.41217041015625, 3.6455078125, 3.87884521484375, 4.1121826171875, 4.34552001953125, 4.578857421875, 4.81219482421875, 5.0455322265625, 5.27886962890625, 5.51220703125, 5.74554443359375, 5.9788818359375, 6.21221923828125, 6.445556640625, 6.67889404296875, 6.9122314453125, 7.14556884765625, 7.37890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 10.0, 1.0, 11.0, 9.0, 22.0, 16.0, 16.0, 15.0, 26.0, 23.0, 30.0, 30.0, 33.0, 38.0, 41.0, 29.0, 31.0, 45.0, 36.0, 43.0, 33.0, 37.0, 50.0, 45.0, 27.0, 41.0, 36.0, 34.0, 28.0, 21.0, 19.0, 19.0, 22.0, 13.0, 14.0, 11.0, 12.0, 6.0, 7.0, 4.0, 5.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.34375, -10.9761962890625, -10.608642578125, -10.2410888671875, -9.87353515625, -9.5059814453125, -9.138427734375, -8.7708740234375, -8.4033203125, -8.0357666015625, -7.668212890625, -7.3006591796875, -6.93310546875, -6.5655517578125, -6.197998046875, -5.8304443359375, -5.462890625, -5.0953369140625, -4.727783203125, -4.3602294921875, -3.99267578125, -3.6251220703125, -3.257568359375, -2.8900146484375, -2.5224609375, -2.1549072265625, -1.787353515625, -1.4197998046875, -1.05224609375, -0.6846923828125, -0.317138671875, 0.0504150390625, 0.41796875, 0.7855224609375, 1.153076171875, 1.5206298828125, 1.88818359375, 2.2557373046875, 2.623291015625, 2.9908447265625, 3.3583984375, 3.7259521484375, 4.093505859375, 4.4610595703125, 4.82861328125, 5.1961669921875, 5.563720703125, 5.9312744140625, 6.298828125, 6.6663818359375, 7.033935546875, 7.4014892578125, 7.76904296875, 8.1365966796875, 8.504150390625, 8.8717041015625, 9.2392578125, 9.6068115234375, 9.974365234375, 10.3419189453125, 10.70947265625, 11.0770263671875, 11.444580078125, 11.8121337890625, 12.1796875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 21.0, 31.0, 22.0, 62.0, 84.0, 122.0, 192.0, 282.0, 422.0, 647.0, 934.0, 1524.0, 2326.0, 3622.0, 5351.0, 8403.0, 12829.0, 19770.0, 29312.0, 42200.0, 59041.0, 78905.0, 97253.0, 111394.0, 116020.0, 109428.0, 94941.0, 76068.0, 56575.0, 40478.0, 27235.0, 18311.0, 12032.0, 7891.0, 5133.0, 3262.0, 2186.0, 1401.0, 952.0, 640.0, 430.0, 269.0, 165.0, 128.0, 91.0, 56.0, 36.0, 21.0, 21.0, 6.0, 6.0, 8.0, 6.0, 0.0, 1.0, 1.0], "bins": [-7.57421875, -7.34063720703125, -7.1070556640625, -6.87347412109375, -6.639892578125, -6.40631103515625, -6.1727294921875, -5.93914794921875, -5.70556640625, -5.47198486328125, -5.2384033203125, -5.00482177734375, -4.771240234375, -4.53765869140625, -4.3040771484375, -4.07049560546875, -3.8369140625, -3.60333251953125, -3.3697509765625, -3.13616943359375, -2.902587890625, -2.66900634765625, -2.4354248046875, -2.20184326171875, -1.96826171875, -1.73468017578125, -1.5010986328125, -1.26751708984375, -1.033935546875, -0.80035400390625, -0.5667724609375, -0.33319091796875, -0.099609375, 0.13397216796875, 0.3675537109375, 0.60113525390625, 0.834716796875, 1.06829833984375, 1.3018798828125, 1.53546142578125, 1.76904296875, 2.00262451171875, 2.2362060546875, 2.46978759765625, 2.703369140625, 2.93695068359375, 3.1705322265625, 3.40411376953125, 3.6376953125, 3.87127685546875, 4.1048583984375, 4.33843994140625, 4.572021484375, 4.80560302734375, 5.0391845703125, 5.27276611328125, 5.50634765625, 5.73992919921875, 5.9735107421875, 6.20709228515625, 6.440673828125, 6.67425537109375, 6.9078369140625, 7.14141845703125, 7.375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 9.0, 3.0, 17.0, 3.0, 8.0, 9.0, 15.0, 20.0, 24.0, 25.0, 29.0, 24.0, 16.0, 33.0, 33.0, 34.0, 35.0, 43.0, 40.0, 44.0, 33.0, 43.0, 43.0, 37.0, 47.0, 31.0, 43.0, 34.0, 21.0, 23.0, 23.0, 20.0, 24.0, 13.0, 17.0, 11.0, 7.0, 9.0, 12.0, 5.0, 8.0, 8.0, 3.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.81640625, -6.5948486328125, -6.373291015625, -6.1517333984375, -5.93017578125, -5.7086181640625, -5.487060546875, -5.2655029296875, -5.0439453125, -4.8223876953125, -4.600830078125, -4.3792724609375, -4.15771484375, -3.9361572265625, -3.714599609375, -3.4930419921875, -3.271484375, -3.0499267578125, -2.828369140625, -2.6068115234375, -2.38525390625, -2.1636962890625, -1.942138671875, -1.7205810546875, -1.4990234375, -1.2774658203125, -1.055908203125, -0.8343505859375, -0.61279296875, -0.3912353515625, -0.169677734375, 0.0518798828125, 0.2734375, 0.4949951171875, 0.716552734375, 0.9381103515625, 1.15966796875, 1.3812255859375, 1.602783203125, 1.8243408203125, 2.0458984375, 2.2674560546875, 2.489013671875, 2.7105712890625, 2.93212890625, 3.1536865234375, 3.375244140625, 3.5968017578125, 3.818359375, 4.0399169921875, 4.261474609375, 4.4830322265625, 4.70458984375, 4.9261474609375, 5.147705078125, 5.3692626953125, 5.5908203125, 5.8123779296875, 6.033935546875, 6.2554931640625, 6.47705078125, 6.6986083984375, 6.920166015625, 7.1417236328125, 7.36328125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 8.0, 15.0, 19.0, 15.0, 46.0, 53.0, 89.0, 151.0, 249.0, 315.0, 518.0, 859.0, 1312.0, 2201.0, 3462.0, 5627.0, 9281.0, 15097.0, 23753.0, 37395.0, 55981.0, 78720.0, 103437.0, 121950.0, 129652.0, 121939.0, 102809.0, 78434.0, 55358.0, 37091.0, 23952.0, 14763.0, 9204.0, 5623.0, 3418.0, 2012.0, 1326.0, 853.0, 547.0, 353.0, 232.0, 156.0, 91.0, 65.0, 43.0, 30.0, 20.0, 8.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.326171875, -2.25457763671875, -2.1829833984375, -2.11138916015625, -2.039794921875, -1.96820068359375, -1.8966064453125, -1.82501220703125, -1.75341796875, -1.68182373046875, -1.6102294921875, -1.53863525390625, -1.467041015625, -1.39544677734375, -1.3238525390625, -1.25225830078125, -1.1806640625, -1.10906982421875, -1.0374755859375, -0.96588134765625, -0.894287109375, -0.82269287109375, -0.7510986328125, -0.67950439453125, -0.60791015625, -0.53631591796875, -0.4647216796875, -0.39312744140625, -0.321533203125, -0.24993896484375, -0.1783447265625, -0.10675048828125, -0.03515625, 0.03643798828125, 0.1080322265625, 0.17962646484375, 0.251220703125, 0.32281494140625, 0.3944091796875, 0.46600341796875, 0.53759765625, 0.60919189453125, 0.6807861328125, 0.75238037109375, 0.823974609375, 0.89556884765625, 0.9671630859375, 1.03875732421875, 1.1103515625, 1.18194580078125, 1.2535400390625, 1.32513427734375, 1.396728515625, 1.46832275390625, 1.5399169921875, 1.61151123046875, 1.68310546875, 1.75469970703125, 1.8262939453125, 1.89788818359375, 1.969482421875, 2.04107666015625, 2.1126708984375, 2.18426513671875, 2.255859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 8.0, 9.0, 16.0, 10.0, 27.0, 24.0, 18.0, 32.0, 28.0, 36.0, 45.0, 57.0, 53.0, 59.0, 52.0, 66.0, 51.0, 59.0, 57.0, 51.0, 43.0, 31.0, 32.0, 33.0, 19.0, 23.0, 15.0, 16.0, 8.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003333091735839844, -0.00032380223274230957, -0.00031429529190063477, -0.00030478835105895996, -0.00029528141021728516, -0.00028577446937561035, -0.00027626752853393555, -0.00026676058769226074, -0.00025725364685058594, -0.00024774670600891113, -0.00023823976516723633, -0.00022873282432556152, -0.00021922588348388672, -0.00020971894264221191, -0.0002002120018005371, -0.0001907050609588623, -0.0001811981201171875, -0.0001716911792755127, -0.0001621842384338379, -0.00015267729759216309, -0.00014317035675048828, -0.00013366341590881348, -0.00012415647506713867, -0.00011464953422546387, -0.00010514259338378906, -9.563565254211426e-05, -8.612871170043945e-05, -7.662177085876465e-05, -6.711483001708984e-05, -5.760788917541504e-05, -4.8100948333740234e-05, -3.859400749206543e-05, -2.9087066650390625e-05, -1.958012580871582e-05, -1.0073184967041016e-05, -5.662441253662109e-07, 8.940696716308594e-06, 1.84476375579834e-05, 2.7954578399658203e-05, 3.746151924133301e-05, 4.696846008300781e-05, 5.647540092468262e-05, 6.598234176635742e-05, 7.548928260803223e-05, 8.499622344970703e-05, 9.450316429138184e-05, 0.00010401010513305664, 0.00011351704597473145, 0.00012302398681640625, 0.00013253092765808105, 0.00014203786849975586, 0.00015154480934143066, 0.00016105175018310547, 0.00017055869102478027, 0.00018006563186645508, 0.00018957257270812988, 0.0001990795135498047, 0.0002085864543914795, 0.0002180933952331543, 0.0002276003360748291, 0.0002371072769165039, 0.0002466142177581787, 0.0002561211585998535, 0.0002656280994415283, 0.0002751350402832031]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 10.0, 11.0, 19.0, 21.0, 38.0, 50.0, 73.0, 120.0, 144.0, 224.0, 358.0, 523.0, 819.0, 1227.0, 1988.0, 3030.0, 4727.0, 7602.0, 12225.0, 18962.0, 29624.0, 45155.0, 65197.0, 89686.0, 113510.0, 127588.0, 127701.0, 113236.0, 90586.0, 66050.0, 45212.0, 29987.0, 19161.0, 12340.0, 7643.0, 4842.0, 3122.0, 1940.0, 1256.0, 867.0, 507.0, 388.0, 259.0, 165.0, 122.0, 77.0, 55.0, 35.0, 28.0, 18.0, 11.0, 15.0, 6.0, 0.0, 0.0, 3.0], "bins": [-2.623046875, -2.545928955078125, -2.46881103515625, -2.391693115234375, -2.3145751953125, -2.237457275390625, -2.16033935546875, -2.083221435546875, -2.006103515625, -1.928985595703125, -1.85186767578125, -1.774749755859375, -1.6976318359375, -1.620513916015625, -1.54339599609375, -1.466278076171875, -1.38916015625, -1.312042236328125, -1.23492431640625, -1.157806396484375, -1.0806884765625, -1.003570556640625, -0.92645263671875, -0.849334716796875, -0.772216796875, -0.695098876953125, -0.61798095703125, -0.540863037109375, -0.4637451171875, -0.386627197265625, -0.30950927734375, -0.232391357421875, -0.1552734375, -0.078155517578125, -0.00103759765625, 0.076080322265625, 0.1531982421875, 0.230316162109375, 0.30743408203125, 0.384552001953125, 0.461669921875, 0.538787841796875, 0.61590576171875, 0.693023681640625, 0.7701416015625, 0.847259521484375, 0.92437744140625, 1.001495361328125, 1.07861328125, 1.155731201171875, 1.23284912109375, 1.309967041015625, 1.3870849609375, 1.464202880859375, 1.54132080078125, 1.618438720703125, 1.695556640625, 1.772674560546875, 1.84979248046875, 1.926910400390625, 2.0040283203125, 2.081146240234375, 2.15826416015625, 2.235382080078125, 2.3125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 5.0, 13.0, 21.0, 16.0, 20.0, 23.0, 26.0, 27.0, 36.0, 47.0, 44.0, 60.0, 59.0, 63.0, 58.0, 56.0, 61.0, 49.0, 64.0, 39.0, 34.0, 28.0, 32.0, 21.0, 21.0, 15.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.388671875, -1.348297119140625, -1.30792236328125, -1.267547607421875, -1.2271728515625, -1.186798095703125, -1.14642333984375, -1.106048583984375, -1.065673828125, -1.025299072265625, -0.98492431640625, -0.944549560546875, -0.9041748046875, -0.863800048828125, -0.82342529296875, -0.783050537109375, -0.74267578125, -0.702301025390625, -0.66192626953125, -0.621551513671875, -0.5811767578125, -0.540802001953125, -0.50042724609375, -0.460052490234375, -0.419677734375, -0.379302978515625, -0.33892822265625, -0.298553466796875, -0.2581787109375, -0.217803955078125, -0.17742919921875, -0.137054443359375, -0.0966796875, -0.056304931640625, -0.01593017578125, 0.024444580078125, 0.0648193359375, 0.105194091796875, 0.14556884765625, 0.185943603515625, 0.226318359375, 0.266693115234375, 0.30706787109375, 0.347442626953125, 0.3878173828125, 0.428192138671875, 0.46856689453125, 0.508941650390625, 0.54931640625, 0.589691162109375, 0.63006591796875, 0.670440673828125, 0.7108154296875, 0.751190185546875, 0.79156494140625, 0.831939697265625, 0.872314453125, 0.912689208984375, 0.95306396484375, 0.993438720703125, 1.0338134765625, 1.074188232421875, 1.11456298828125, 1.154937744140625, 1.1953125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 16.0, 12.0, 30.0, 28.0, 32.0, 41.0, 29.0, 49.0, 46.0, 59.0, 50.0, 57.0, 55.0, 38.0, 39.0, 33.0, 43.0, 52.0, 40.0, 43.0, 29.0, 27.0, 21.0, 18.0, 20.0, 14.0, 14.0, 11.0, 4.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.999189376831055, -10.673126220703125, -10.347064018249512, -10.021001815795898, -9.694938659667969, -9.368875503540039, -9.042813301086426, -8.716751098632812, -8.390687942504883, -8.064624786376953, -7.73856258392334, -7.412499904632568, -7.086437225341797, -6.760374546051025, -6.434311866760254, -6.108249187469482, -5.782186508178711, -5.4561238288879395, -5.130061149597168, -4.8039984703063965, -4.477935791015625, -4.1518731117248535, -3.825810432434082, -3.4997477531433105, -3.173685073852539, -2.8476223945617676, -2.521559715270996, -2.1954970359802246, -1.8694343566894531, -1.5433716773986816, -1.2173089981079102, -0.8912463188171387, -0.5651826858520508, -0.2391200065612793, 0.08694267272949219, 0.41300535202026367, 0.7390680313110352, 1.0651307106018066, 1.3911933898925781, 1.7172560691833496, 2.043318748474121, 2.3693814277648926, 2.695444107055664, 3.0215067863464355, 3.347569465637207, 3.6736321449279785, 3.99969482421875, 4.3257575035095215, 4.651820182800293, 4.9778828620910645, 5.303945541381836, 5.630008220672607, 5.956070899963379, 6.28213357925415, 6.608196258544922, 6.934258937835693, 7.260321617126465, 7.586384296417236, 7.912446975708008, 8.238510131835938, 8.56457233428955, 8.890634536743164, 9.216697692871094, 9.542760848999023, 9.868823051452637]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 7.0, 10.0, 12.0, 15.0, 12.0, 15.0, 16.0, 21.0, 34.0, 35.0, 39.0, 42.0, 40.0, 34.0, 23.0, 38.0, 50.0, 49.0, 44.0, 40.0, 47.0, 41.0, 42.0, 47.0, 38.0, 38.0, 35.0, 21.0, 25.0, 16.0, 17.0, 11.0, 18.0, 7.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.361191749572754, -11.918563842773438, -11.475935935974121, -11.033308029174805, -10.590680122375488, -10.148052215576172, -9.705425262451172, -9.262797355651855, -8.820169448852539, -8.377541542053223, -7.934913635253906, -7.49228572845459, -7.049658298492432, -6.607030391693115, -6.164402484893799, -5.721775054931641, -5.279146671295166, -4.83651876449585, -4.393890857696533, -3.951263189315796, -3.5086355209350586, -3.066007614135742, -2.623379707336426, -2.1807520389556885, -1.738124132156372, -1.2954963445663452, -0.8528684973716736, -0.41024065017700195, 0.0323871374130249, 0.47501492500305176, 0.9176428318023682, 1.3602705001831055, 1.8028984069824219, 2.2455263137817383, 2.6881539821624756, 3.130781888961792, 3.5734095573425293, 4.016037464141846, 4.458665370941162, 4.90129280090332, 5.343920707702637, 5.786548614501953, 6.2291765213012695, 6.671804428100586, 7.114431858062744, 7.5570597648620605, 7.999687671661377, 8.442315101623535, 8.884943008422852, 9.327570915222168, 9.770198822021484, 10.2128267288208, 10.655454635620117, 11.098081588745117, 11.54071044921875, 11.98333740234375, 12.425966262817383, 12.8685941696167, 13.311222076416016, 13.753849983215332, 14.196477890014648, 14.639104843139648, 15.081733703613281, 15.524360656738281, 15.966988563537598]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 10.0, 7.0, 8.0, 9.0, 37.0, 42.0, 47.0, 90.0, 152.0, 256.0, 399.0, 684.0, 1097.0, 1992.0, 3400.0, 5985.0, 10221.0, 17415.0, 29608.0, 49701.0, 83189.0, 138300.0, 222687.0, 339912.0, 476231.0, 585516.0, 606958.0, 528562.0, 396703.0, 268572.0, 169595.0, 104023.0, 62297.0, 36993.0, 21856.0, 12829.0, 7645.0, 4555.0, 2698.0, 1555.0, 940.0, 558.0, 360.0, 203.0, 150.0, 93.0, 46.0, 42.0, 24.0, 18.0, 6.0, 7.0, 6.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1484375, -7.869384765625, -7.59033203125, -7.311279296875, -7.0322265625, -6.753173828125, -6.47412109375, -6.195068359375, -5.916015625, -5.636962890625, -5.35791015625, -5.078857421875, -4.7998046875, -4.520751953125, -4.24169921875, -3.962646484375, -3.68359375, -3.404541015625, -3.12548828125, -2.846435546875, -2.5673828125, -2.288330078125, -2.00927734375, -1.730224609375, -1.451171875, -1.172119140625, -0.89306640625, -0.614013671875, -0.3349609375, -0.055908203125, 0.22314453125, 0.502197265625, 0.78125, 1.060302734375, 1.33935546875, 1.618408203125, 1.8974609375, 2.176513671875, 2.45556640625, 2.734619140625, 3.013671875, 3.292724609375, 3.57177734375, 3.850830078125, 4.1298828125, 4.408935546875, 4.68798828125, 4.967041015625, 5.24609375, 5.525146484375, 5.80419921875, 6.083251953125, 6.3623046875, 6.641357421875, 6.92041015625, 7.199462890625, 7.478515625, 7.757568359375, 8.03662109375, 8.315673828125, 8.5947265625, 8.873779296875, 9.15283203125, 9.431884765625, 9.7109375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 11.0, 17.0, 13.0, 14.0, 16.0, 23.0, 25.0, 35.0, 44.0, 31.0, 45.0, 39.0, 30.0, 37.0, 47.0, 42.0, 40.0, 35.0, 55.0, 49.0, 34.0, 54.0, 42.0, 35.0, 26.0, 27.0, 27.0, 19.0, 9.0, 13.0, 13.0, 17.0, 13.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.8194580078125, -8.482666015625, -8.1458740234375, -7.80908203125, -7.4722900390625, -7.135498046875, -6.7987060546875, -6.4619140625, -6.1251220703125, -5.788330078125, -5.4515380859375, -5.11474609375, -4.7779541015625, -4.441162109375, -4.1043701171875, -3.767578125, -3.4307861328125, -3.093994140625, -2.7572021484375, -2.42041015625, -2.0836181640625, -1.746826171875, -1.4100341796875, -1.0732421875, -0.7364501953125, -0.399658203125, -0.0628662109375, 0.27392578125, 0.6107177734375, 0.947509765625, 1.2843017578125, 1.62109375, 1.9578857421875, 2.294677734375, 2.6314697265625, 2.96826171875, 3.3050537109375, 3.641845703125, 3.9786376953125, 4.3154296875, 4.6522216796875, 4.989013671875, 5.3258056640625, 5.66259765625, 5.9993896484375, 6.336181640625, 6.6729736328125, 7.009765625, 7.3465576171875, 7.683349609375, 8.0201416015625, 8.35693359375, 8.6937255859375, 9.030517578125, 9.3673095703125, 9.7041015625, 10.0408935546875, 10.377685546875, 10.7144775390625, 11.05126953125, 11.3880615234375, 11.724853515625, 12.0616455078125, 12.3984375]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 6.0, 17.0, 30.0, 30.0, 57.0, 131.0, 235.0, 411.0, 682.0, 1182.0, 2072.0, 3742.0, 6530.0, 11527.0, 19653.0, 34167.0, 56629.0, 93169.0, 145707.0, 217540.0, 303479.0, 395294.0, 468933.0, 504347.0, 487088.0, 422618.0, 334382.0, 243768.0, 167861.0, 107980.0, 67871.0, 41045.0, 23919.0, 13858.0, 7890.0, 4424.0, 2553.0, 1514.0, 821.0, 449.0, 277.0, 159.0, 104.0, 54.0, 26.0, 19.0, 21.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.9296875, -7.68695068359375, -7.4442138671875, -7.20147705078125, -6.958740234375, -6.71600341796875, -6.4732666015625, -6.23052978515625, -5.98779296875, -5.74505615234375, -5.5023193359375, -5.25958251953125, -5.016845703125, -4.77410888671875, -4.5313720703125, -4.28863525390625, -4.0458984375, -3.80316162109375, -3.5604248046875, -3.31768798828125, -3.074951171875, -2.83221435546875, -2.5894775390625, -2.34674072265625, -2.10400390625, -1.86126708984375, -1.6185302734375, -1.37579345703125, -1.133056640625, -0.89031982421875, -0.6475830078125, -0.40484619140625, -0.162109375, 0.08062744140625, 0.3233642578125, 0.56610107421875, 0.808837890625, 1.05157470703125, 1.2943115234375, 1.53704833984375, 1.77978515625, 2.02252197265625, 2.2652587890625, 2.50799560546875, 2.750732421875, 2.99346923828125, 3.2362060546875, 3.47894287109375, 3.7216796875, 3.96441650390625, 4.2071533203125, 4.44989013671875, 4.692626953125, 4.93536376953125, 5.1781005859375, 5.42083740234375, 5.66357421875, 5.90631103515625, 6.1490478515625, 6.39178466796875, 6.634521484375, 6.87725830078125, 7.1199951171875, 7.36273193359375, 7.60546875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 7.0, 13.0, 16.0, 20.0, 31.0, 47.0, 42.0, 70.0, 68.0, 91.0, 102.0, 136.0, 132.0, 191.0, 205.0, 209.0, 207.0, 210.0, 252.0, 229.0, 232.0, 208.0, 220.0, 177.0, 168.0, 135.0, 108.0, 109.0, 90.0, 62.0, 70.0, 47.0, 31.0, 26.0, 25.0, 17.0, 24.0, 12.0, 11.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.76165771484375, -4.6131591796875, -4.46466064453125, -4.316162109375, -4.16766357421875, -4.0191650390625, -3.87066650390625, -3.72216796875, -3.57366943359375, -3.4251708984375, -3.27667236328125, -3.128173828125, -2.97967529296875, -2.8311767578125, -2.68267822265625, -2.5341796875, -2.38568115234375, -2.2371826171875, -2.08868408203125, -1.940185546875, -1.79168701171875, -1.6431884765625, -1.49468994140625, -1.34619140625, -1.19769287109375, -1.0491943359375, -0.90069580078125, -0.752197265625, -0.60369873046875, -0.4552001953125, -0.30670166015625, -0.158203125, -0.00970458984375, 0.1387939453125, 0.28729248046875, 0.435791015625, 0.58428955078125, 0.7327880859375, 0.88128662109375, 1.02978515625, 1.17828369140625, 1.3267822265625, 1.47528076171875, 1.623779296875, 1.77227783203125, 1.9207763671875, 2.06927490234375, 2.2177734375, 2.36627197265625, 2.5147705078125, 2.66326904296875, 2.811767578125, 2.96026611328125, 3.1087646484375, 3.25726318359375, 3.40576171875, 3.55426025390625, 3.7027587890625, 3.85125732421875, 3.999755859375, 4.14825439453125, 4.2967529296875, 4.44525146484375, 4.59375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 8.0, 13.0, 11.0, 10.0, 22.0, 17.0, 29.0, 32.0, 24.0, 35.0, 39.0, 39.0, 39.0, 57.0, 55.0, 41.0, 56.0, 48.0, 33.0, 46.0, 37.0, 40.0, 33.0, 34.0, 32.0, 22.0, 26.0, 24.0, 19.0, 13.0, 10.0, 7.0, 5.0, 3.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.624696731567383, -9.327523231506348, -9.030348777770996, -8.733175277709961, -8.43600082397461, -8.138827323913574, -7.841653347015381, -7.5444793701171875, -7.247305393218994, -6.950131416320801, -6.652957439422607, -6.355783462524414, -6.058609962463379, -5.761435508728027, -5.464262008666992, -5.167088031768799, -4.8699140548706055, -4.572740077972412, -4.275566101074219, -3.9783923625946045, -3.681218385696411, -3.3840444087982178, -3.0868706703186035, -2.78969669342041, -2.492522716522217, -2.1953487396240234, -1.8981748819351196, -1.6010010242462158, -1.3038270473480225, -1.006653070449829, -0.7094792127609253, -0.4123053550720215, -0.11513042449951172, 0.18204349279403687, 0.47921741008758545, 0.776391327381134, 1.0735652446746826, 1.370739221572876, 1.6679130792617798, 1.9650869369506836, 2.262260913848877, 2.5594348907470703, 2.8566088676452637, 3.153782606124878, 3.4509565830230713, 3.7481305599212646, 4.045304298400879, 4.342478275299072, 4.639652252197266, 4.936826229095459, 5.234000205993652, 5.531174182891846, 5.828348159790039, 6.125521659851074, 6.422695636749268, 6.719869613647461, 7.017043590545654, 7.314217567443848, 7.611391544342041, 7.908565521240234, 8.20573902130127, 8.502913475036621, 8.800086975097656, 9.097261428833008, 9.394434928894043]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 5.0, 8.0, 9.0, 4.0, 7.0, 10.0, 14.0, 20.0, 19.0, 24.0, 20.0, 23.0, 30.0, 37.0, 29.0, 36.0, 41.0, 38.0, 46.0, 44.0, 38.0, 45.0, 49.0, 42.0, 36.0, 34.0, 37.0, 38.0, 29.0, 25.0, 25.0, 19.0, 16.0, 19.0, 17.0, 13.0, 9.0, 17.0, 8.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.112897872924805, -10.742691040039062, -10.372485160827637, -10.002279281616211, -9.632072448730469, -9.261865615844727, -8.8916597366333, -8.521453857421875, -8.151247024536133, -7.781040668487549, -7.410834312438965, -7.040627956390381, -6.670421600341797, -6.300215244293213, -5.930008888244629, -5.559802532196045, -5.189596176147461, -4.819389820098877, -4.449183464050293, -4.078977108001709, -3.708770751953125, -3.338564395904541, -2.968358039855957, -2.598151683807373, -2.227945327758789, -1.857738971710205, -1.487532615661621, -1.117326259613037, -0.7471199035644531, -0.37691354751586914, -0.006707191467285156, 0.36349916458129883, 0.7337045669555664, 1.1039109230041504, 1.4741172790527344, 1.8443236351013184, 2.2145299911499023, 2.5847363471984863, 2.9549427032470703, 3.3251490592956543, 3.6953554153442383, 4.065561771392822, 4.435768127441406, 4.80597448348999, 5.176180839538574, 5.546387195587158, 5.916593551635742, 6.286799907684326, 6.65700626373291, 7.027212619781494, 7.397418975830078, 7.767625331878662, 8.137831687927246, 8.508037567138672, 8.878244400024414, 9.248451232910156, 9.618657112121582, 9.988862991333008, 10.35906982421875, 10.729276657104492, 11.099482536315918, 11.469688415527344, 11.839895248413086, 12.210102081298828, 12.580307960510254]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [6.0, 6.0, 2.0, 1.0, 13.0, 11.0, 17.0, 20.0, 31.0, 44.0, 75.0, 106.0, 147.0, 202.0, 249.0, 415.0, 496.0, 747.0, 1057.0, 1477.0, 2087.0, 2893.0, 4260.0, 6262.0, 9336.0, 14160.0, 22138.0, 34083.0, 54104.0, 85196.0, 127929.0, 170812.0, 166134.0, 120402.0, 79270.0, 50374.0, 31850.0, 20825.0, 13187.0, 8933.0, 5945.0, 3955.0, 2757.0, 1936.0, 1292.0, 888.0, 685.0, 461.0, 344.0, 244.0, 208.0, 150.0, 104.0, 73.0, 47.0, 34.0, 34.0, 23.0, 14.0, 8.0, 6.0, 7.0, 1.0, 3.0], "bins": [-1.7578125, -1.7027435302734375, -1.647674560546875, -1.5926055908203125, -1.53753662109375, -1.4824676513671875, -1.427398681640625, -1.3723297119140625, -1.3172607421875, -1.2621917724609375, -1.207122802734375, -1.1520538330078125, -1.09698486328125, -1.0419158935546875, -0.986846923828125, -0.9317779541015625, -0.876708984375, -0.8216400146484375, -0.766571044921875, -0.7115020751953125, -0.65643310546875, -0.6013641357421875, -0.546295166015625, -0.4912261962890625, -0.4361572265625, -0.3810882568359375, -0.326019287109375, -0.2709503173828125, -0.21588134765625, -0.1608123779296875, -0.105743408203125, -0.0506744384765625, 0.00439453125, 0.0594635009765625, 0.114532470703125, 0.1696014404296875, 0.22467041015625, 0.2797393798828125, 0.334808349609375, 0.3898773193359375, 0.4449462890625, 0.5000152587890625, 0.555084228515625, 0.6101531982421875, 0.66522216796875, 0.7202911376953125, 0.775360107421875, 0.8304290771484375, 0.885498046875, 0.9405670166015625, 0.995635986328125, 1.0507049560546875, 1.10577392578125, 1.1608428955078125, 1.215911865234375, 1.2709808349609375, 1.3260498046875, 1.3811187744140625, 1.436187744140625, 1.4912567138671875, 1.54632568359375, 1.6013946533203125, 1.656463623046875, 1.7115325927734375, 1.7666015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 4.0, 10.0, 5.0, 8.0, 5.0, 7.0, 15.0, 10.0, 20.0, 18.0, 23.0, 17.0, 29.0, 29.0, 32.0, 31.0, 41.0, 45.0, 44.0, 40.0, 40.0, 39.0, 42.0, 43.0, 49.0, 51.0, 32.0, 39.0, 33.0, 18.0, 23.0, 17.0, 23.0, 15.0, 17.0, 18.0, 15.0, 12.0, 10.0, 6.0, 11.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.953125, -11.578125, -11.203125, -10.828125, -10.453125, -10.078125, -9.703125, -9.328125, -8.953125, -8.578125, -8.203125, -7.828125, -7.453125, -7.078125, -6.703125, -6.328125, -5.953125, -5.578125, -5.203125, -4.828125, -4.453125, -4.078125, -3.703125, -3.328125, -2.953125, -2.578125, -2.203125, -1.828125, -1.453125, -1.078125, -0.703125, -0.328125, 0.046875, 0.421875, 0.796875, 1.171875, 1.546875, 1.921875, 2.296875, 2.671875, 3.046875, 3.421875, 3.796875, 4.171875, 4.546875, 4.921875, 5.296875, 5.671875, 6.046875, 6.421875, 6.796875, 7.171875, 7.546875, 7.921875, 8.296875, 8.671875, 9.046875, 9.421875, 9.796875, 10.171875, 10.546875, 10.921875, 11.296875, 11.671875, 12.046875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 14.0, 17.0, 31.0, 30.0, 39.0, 57.0, 73.0, 96.0, 124.0, 178.0, 223.0, 316.0, 453.0, 585.0, 981.0, 1573.0, 2759.0, 5542.0, 12161.0, 30476.0, 874993.0, 72609.0, 23992.0, 9801.0, 4696.0, 2365.0, 1355.0, 872.0, 571.0, 349.0, 309.0, 218.0, 151.0, 125.0, 80.0, 63.0, 63.0, 42.0, 30.0, 29.0, 16.0, 20.0, 8.0, 8.0, 11.0, 8.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.359375, -6.15985107421875, -5.9603271484375, -5.76080322265625, -5.561279296875, -5.36175537109375, -5.1622314453125, -4.96270751953125, -4.76318359375, -4.56365966796875, -4.3641357421875, -4.16461181640625, -3.965087890625, -3.76556396484375, -3.5660400390625, -3.36651611328125, -3.1669921875, -2.96746826171875, -2.7679443359375, -2.56842041015625, -2.368896484375, -2.16937255859375, -1.9698486328125, -1.77032470703125, -1.57080078125, -1.37127685546875, -1.1717529296875, -0.97222900390625, -0.772705078125, -0.57318115234375, -0.3736572265625, -0.17413330078125, 0.025390625, 0.22491455078125, 0.4244384765625, 0.62396240234375, 0.823486328125, 1.02301025390625, 1.2225341796875, 1.42205810546875, 1.62158203125, 1.82110595703125, 2.0206298828125, 2.22015380859375, 2.419677734375, 2.61920166015625, 2.8187255859375, 3.01824951171875, 3.2177734375, 3.41729736328125, 3.6168212890625, 3.81634521484375, 4.015869140625, 4.21539306640625, 4.4149169921875, 4.61444091796875, 4.81396484375, 5.01348876953125, 5.2130126953125, 5.41253662109375, 5.612060546875, 5.81158447265625, 6.0111083984375, 6.21063232421875, 6.41015625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 9.0, 7.0, 11.0, 12.0, 14.0, 20.0, 15.0, 25.0, 23.0, 22.0, 28.0, 32.0, 31.0, 29.0, 39.0, 35.0, 26.0, 49.0, 38.0, 34.0, 37.0, 36.0, 48.0, 35.0, 27.0, 34.0, 30.0, 26.0, 23.0, 27.0, 25.0, 17.0, 22.0, 18.0, 10.0, 9.0, 10.0, 11.0, 11.0, 1.0, 5.0, 4.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.90625, -7.66790771484375, -7.4295654296875, -7.19122314453125, -6.952880859375, -6.71453857421875, -6.4761962890625, -6.23785400390625, -5.99951171875, -5.76116943359375, -5.5228271484375, -5.28448486328125, -5.046142578125, -4.80780029296875, -4.5694580078125, -4.33111572265625, -4.0927734375, -3.85443115234375, -3.6160888671875, -3.37774658203125, -3.139404296875, -2.90106201171875, -2.6627197265625, -2.42437744140625, -2.18603515625, -1.94769287109375, -1.7093505859375, -1.47100830078125, -1.232666015625, -0.99432373046875, -0.7559814453125, -0.51763916015625, -0.279296875, -0.04095458984375, 0.1973876953125, 0.43572998046875, 0.674072265625, 0.91241455078125, 1.1507568359375, 1.38909912109375, 1.62744140625, 1.86578369140625, 2.1041259765625, 2.34246826171875, 2.580810546875, 2.81915283203125, 3.0574951171875, 3.29583740234375, 3.5341796875, 3.77252197265625, 4.0108642578125, 4.24920654296875, 4.487548828125, 4.72589111328125, 4.9642333984375, 5.20257568359375, 5.44091796875, 5.67926025390625, 5.9176025390625, 6.15594482421875, 6.394287109375, 6.63262939453125, 6.8709716796875, 7.10931396484375, 7.34765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 17.0, 11.0, 24.0, 24.0, 44.0, 49.0, 63.0, 109.0, 120.0, 196.0, 271.0, 386.0, 617.0, 949.0, 1629.0, 3305.0, 7689.0, 25356.0, 938261.0, 47841.0, 11516.0, 4453.0, 2093.0, 1193.0, 721.0, 478.0, 319.0, 196.0, 172.0, 104.0, 71.0, 71.0, 32.0, 34.0, 26.0, 25.0, 13.0, 10.0, 8.0, 2.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.865234375, -0.836090087890625, -0.80694580078125, -0.777801513671875, -0.7486572265625, -0.719512939453125, -0.69036865234375, -0.661224365234375, -0.632080078125, -0.602935791015625, -0.57379150390625, -0.544647216796875, -0.5155029296875, -0.486358642578125, -0.45721435546875, -0.428070068359375, -0.39892578125, -0.369781494140625, -0.34063720703125, -0.311492919921875, -0.2823486328125, -0.253204345703125, -0.22406005859375, -0.194915771484375, -0.165771484375, -0.136627197265625, -0.10748291015625, -0.078338623046875, -0.0491943359375, -0.020050048828125, 0.00909423828125, 0.038238525390625, 0.0673828125, 0.096527099609375, 0.12567138671875, 0.154815673828125, 0.1839599609375, 0.213104248046875, 0.24224853515625, 0.271392822265625, 0.300537109375, 0.329681396484375, 0.35882568359375, 0.387969970703125, 0.4171142578125, 0.446258544921875, 0.47540283203125, 0.504547119140625, 0.53369140625, 0.562835693359375, 0.59197998046875, 0.621124267578125, 0.6502685546875, 0.679412841796875, 0.70855712890625, 0.737701416015625, 0.766845703125, 0.795989990234375, 0.82513427734375, 0.854278564453125, 0.8834228515625, 0.912567138671875, 0.94171142578125, 0.970855712890625, 1.0]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 7.0, 9.0, 6.0, 17.0, 7.0, 16.0, 13.0, 13.0, 22.0, 18.0, 26.0, 25.0, 33.0, 41.0, 26.0, 27.0, 29.0, 36.0, 38.0, 35.0, 40.0, 38.0, 28.0, 59.0, 44.0, 31.0, 28.0, 46.0, 30.0, 20.0, 26.0, 26.0, 14.0, 16.0, 15.0, 16.0, 9.0, 13.0, 7.0, 11.0, 9.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.900859832763672e-06, -5.704350769519806e-06, -5.50784170627594e-06, -5.311332643032074e-06, -5.114823579788208e-06, -4.918314516544342e-06, -4.721805453300476e-06, -4.52529639005661e-06, -4.328787326812744e-06, -4.132278263568878e-06, -3.935769200325012e-06, -3.7392601370811462e-06, -3.5427510738372803e-06, -3.3462420105934143e-06, -3.1497329473495483e-06, -2.9532238841056824e-06, -2.7567148208618164e-06, -2.5602057576179504e-06, -2.3636966943740845e-06, -2.1671876311302185e-06, -1.9706785678863525e-06, -1.7741695046424866e-06, -1.5776604413986206e-06, -1.3811513781547546e-06, -1.1846423149108887e-06, -9.881332516670227e-07, -7.916241884231567e-07, -5.951151251792908e-07, -3.986060619354248e-07, -2.0209699869155884e-07, -5.587935447692871e-09, 1.909211277961731e-07, 3.8743019104003906e-07, 5.83939254283905e-07, 7.80448317527771e-07, 9.76957380771637e-07, 1.173466444015503e-06, 1.369975507259369e-06, 1.5664845705032349e-06, 1.7629936337471008e-06, 1.959502696990967e-06, 2.1560117602348328e-06, 2.3525208234786987e-06, 2.5490298867225647e-06, 2.7455389499664307e-06, 2.9420480132102966e-06, 3.1385570764541626e-06, 3.3350661396980286e-06, 3.5315752029418945e-06, 3.7280842661857605e-06, 3.9245933294296265e-06, 4.1211023926734924e-06, 4.317611455917358e-06, 4.514120519161224e-06, 4.71062958240509e-06, 4.907138645648956e-06, 5.103647708892822e-06, 5.300156772136688e-06, 5.496665835380554e-06, 5.69317489862442e-06, 5.889683961868286e-06, 6.086193025112152e-06, 6.282702088356018e-06, 6.479211151599884e-06, 6.67572021484375e-06]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 9.0, 15.0, 10.0, 20.0, 25.0, 48.0, 53.0, 77.0, 144.0, 197.0, 263.0, 375.0, 557.0, 853.0, 1234.0, 1782.0, 2705.0, 4100.0, 6285.0, 10034.0, 15622.0, 26104.0, 44920.0, 81174.0, 167084.0, 314750.0, 170220.0, 82913.0, 45722.0, 26391.0, 16038.0, 9855.0, 6386.0, 4167.0, 2676.0, 1871.0, 1204.0, 782.0, 561.0, 435.0, 302.0, 183.0, 139.0, 77.0, 57.0, 34.0, 40.0, 23.0, 8.0, 14.0, 15.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3134574890136719, -0.30318450927734375, -0.2929115295410156, -0.2826385498046875, -0.2723655700683594, -0.26209259033203125, -0.2518196105957031, -0.241546630859375, -0.23127365112304688, -0.22100067138671875, -0.21072769165039062, -0.2004547119140625, -0.19018173217773438, -0.17990875244140625, -0.16963577270507812, -0.15936279296875, -0.14908981323242188, -0.13881683349609375, -0.12854385375976562, -0.1182708740234375, -0.10799789428710938, -0.09772491455078125, -0.08745193481445312, -0.077178955078125, -0.06690597534179688, -0.05663299560546875, -0.046360015869140625, -0.0360870361328125, -0.025814056396484375, -0.01554107666015625, -0.005268096923828125, 0.0050048828125, 0.015277862548828125, 0.02555084228515625, 0.035823822021484375, 0.0460968017578125, 0.056369781494140625, 0.06664276123046875, 0.07691574096679688, 0.087188720703125, 0.09746170043945312, 0.10773468017578125, 0.11800765991210938, 0.1282806396484375, 0.13855361938476562, 0.14882659912109375, 0.15909957885742188, 0.16937255859375, 0.17964553833007812, 0.18991851806640625, 0.20019149780273438, 0.2104644775390625, 0.22073745727539062, 0.23101043701171875, 0.24128341674804688, 0.251556396484375, 0.2618293762207031, 0.27210235595703125, 0.2823753356933594, 0.2926483154296875, 0.3029212951660156, 0.31319427490234375, 0.3234672546386719, 0.333740234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 1.0, 4.0, 8.0, 13.0, 14.0, 17.0, 31.0, 30.0, 33.0, 30.0, 30.0, 58.0, 53.0, 52.0, 55.0, 62.0, 68.0, 57.0, 57.0, 47.0, 47.0, 42.0, 29.0, 30.0, 22.0, 19.0, 14.0, 12.0, 11.0, 9.0, 4.0, 4.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.251953125, -0.24425888061523438, -0.23656463623046875, -0.22887039184570312, -0.2211761474609375, -0.21348190307617188, -0.20578765869140625, -0.19809341430664062, -0.190399169921875, -0.18270492553710938, -0.17501068115234375, -0.16731643676757812, -0.1596221923828125, -0.15192794799804688, -0.14423370361328125, -0.13653945922851562, -0.12884521484375, -0.12115097045898438, -0.11345672607421875, -0.10576248168945312, -0.0980682373046875, -0.09037399291992188, -0.08267974853515625, -0.07498550415039062, -0.067291259765625, -0.059597015380859375, -0.05190277099609375, -0.044208526611328125, -0.0365142822265625, -0.028820037841796875, -0.02112579345703125, -0.013431549072265625, -0.0057373046875, 0.001956939697265625, 0.00965118408203125, 0.017345428466796875, 0.0250396728515625, 0.032733917236328125, 0.04042816162109375, 0.048122406005859375, 0.055816650390625, 0.06351089477539062, 0.07120513916015625, 0.07889938354492188, 0.0865936279296875, 0.09428787231445312, 0.10198211669921875, 0.10967636108398438, 0.11737060546875, 0.12506484985351562, 0.13275909423828125, 0.14045333862304688, 0.1481475830078125, 0.15584182739257812, 0.16353607177734375, 0.17123031616210938, 0.178924560546875, 0.18661880493164062, 0.19431304931640625, 0.20200729370117188, 0.2097015380859375, 0.21739578247070312, 0.22509002685546875, 0.23278427124023438, 0.240478515625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 3.0, 11.0, 13.0, 12.0, 9.0, 23.0, 18.0, 24.0, 35.0, 27.0, 27.0, 41.0, 34.0, 45.0, 51.0, 63.0, 47.0, 54.0, 43.0, 32.0, 51.0, 37.0, 41.0, 39.0, 29.0, 26.0, 29.0, 25.0, 26.0, 16.0, 15.0, 8.0, 7.0, 3.0, 5.0, 10.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.701034545898438, -9.40096378326416, -9.100892066955566, -8.800821304321289, -8.500749588012695, -8.200678825378418, -7.900607585906982, -7.600536346435547, -7.300465106964111, -7.000393867492676, -6.70032262802124, -6.400251388549805, -6.100180625915527, -5.800108909606934, -5.500038146972656, -5.199966907501221, -4.899895668029785, -4.59982442855835, -4.299753189086914, -3.9996821880340576, -3.699610948562622, -3.3995397090911865, -3.09946870803833, -2.7993974685668945, -2.499326229095459, -2.1992549896240234, -1.8991838693618774, -1.5991127490997314, -1.299041509628296, -0.9989702701568604, -0.6988991498947144, -0.39882802963256836, -0.0987558364868164, 0.20131534337997437, 0.5013865232467651, 0.8014577031135559, 1.1015288829803467, 1.4016001224517822, 1.7016712427139282, 2.001742362976074, 2.3018136024475098, 2.6018848419189453, 2.901956081390381, 3.2020270824432373, 3.502098321914673, 3.8021695613861084, 4.102240562438965, 4.4023118019104, 4.702383041381836, 5.0024542808532715, 5.302525520324707, 5.602596759796143, 5.902667999267578, 6.2027387619018555, 6.502810001373291, 6.802881240844727, 7.102952480316162, 7.403023719787598, 7.703094959259033, 8.003166198730469, 8.303236961364746, 8.60330867767334, 8.903379440307617, 9.203451156616211, 9.503521919250488]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 10.0, 7.0, 6.0, 5.0, 9.0, 20.0, 16.0, 18.0, 27.0, 19.0, 22.0, 29.0, 35.0, 34.0, 37.0, 39.0, 35.0, 47.0, 44.0, 41.0, 42.0, 48.0, 43.0, 32.0, 33.0, 40.0, 41.0, 27.0, 25.0, 25.0, 18.0, 16.0, 19.0, 17.0, 13.0, 10.0, 16.0, 10.0, 7.0, 6.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.948939323425293, -10.583560943603516, -10.218182563781738, -9.852804183959961, -9.487425804138184, -9.122047424316406, -8.756669044494629, -8.391290664672852, -8.025912284851074, -7.660533905029297, -7.2951555252075195, -6.929777145385742, -6.564398765563965, -6.1990203857421875, -5.83364200592041, -5.468263626098633, -5.102885723114014, -4.737507343292236, -4.372128963470459, -4.006750583648682, -3.6413722038269043, -3.275993824005127, -2.9106156826019287, -2.5452373027801514, -2.179858922958374, -1.8144805431365967, -1.4491021633148193, -1.0837239027023315, -0.7183455228805542, -0.35296714305877686, 0.012411117553710938, 0.3777894973754883, 0.7431678771972656, 1.108546257019043, 1.4739246368408203, 1.839302897453308, 2.204681396484375, 2.5700597763061523, 2.9354379177093506, 3.300816297531128, 3.6661946773529053, 4.0315728187561035, 4.396951198577881, 4.762329578399658, 5.1277079582214355, 5.493086338043213, 5.85846471786499, 6.223843097686768, 6.589221477508545, 6.954599857330322, 7.3199782371521, 7.685356616973877, 8.050734519958496, 8.416112899780273, 8.78149127960205, 9.146869659423828, 9.512248039245605, 9.877626419067383, 10.24300479888916, 10.608383178710938, 10.973761558532715, 11.339139938354492, 11.70451831817627, 12.069896697998047, 12.435275077819824]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 6.0, 10.0, 14.0, 24.0, 37.0, 43.0, 60.0, 127.0, 158.0, 274.0, 401.0, 671.0, 994.0, 1565.0, 2419.0, 3720.0, 5880.0, 9041.0, 14151.0, 21488.0, 32779.0, 47330.0, 66309.0, 86648.0, 104618.0, 117310.0, 117658.0, 107177.0, 89398.0, 68972.0, 49862.0, 34384.0, 22829.0, 14897.0, 9774.0, 6242.0, 3978.0, 2639.0, 1677.0, 1066.0, 689.0, 442.0, 272.0, 187.0, 153.0, 70.0, 35.0, 34.0, 7.0, 12.0, 14.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.6328125, -6.4122314453125, -6.191650390625, -5.9710693359375, -5.75048828125, -5.5299072265625, -5.309326171875, -5.0887451171875, -4.8681640625, -4.6475830078125, -4.427001953125, -4.2064208984375, -3.98583984375, -3.7652587890625, -3.544677734375, -3.3240966796875, -3.103515625, -2.8829345703125, -2.662353515625, -2.4417724609375, -2.22119140625, -2.0006103515625, -1.780029296875, -1.5594482421875, -1.3388671875, -1.1182861328125, -0.897705078125, -0.6771240234375, -0.45654296875, -0.2359619140625, -0.015380859375, 0.2052001953125, 0.42578125, 0.6463623046875, 0.866943359375, 1.0875244140625, 1.30810546875, 1.5286865234375, 1.749267578125, 1.9698486328125, 2.1904296875, 2.4110107421875, 2.631591796875, 2.8521728515625, 3.07275390625, 3.2933349609375, 3.513916015625, 3.7344970703125, 3.955078125, 4.1756591796875, 4.396240234375, 4.6168212890625, 4.83740234375, 5.0579833984375, 5.278564453125, 5.4991455078125, 5.7197265625, 5.9403076171875, 6.160888671875, 6.3814697265625, 6.60205078125, 6.8226318359375, 7.043212890625, 7.2637939453125, 7.484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 8.0, 7.0, 0.0, 7.0, 7.0, 9.0, 12.0, 24.0, 18.0, 26.0, 20.0, 20.0, 29.0, 31.0, 32.0, 34.0, 46.0, 53.0, 37.0, 43.0, 39.0, 50.0, 31.0, 42.0, 42.0, 38.0, 40.0, 28.0, 35.0, 26.0, 22.0, 23.0, 22.0, 17.0, 17.0, 11.0, 16.0, 14.0, 4.0, 7.0, 5.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.75, -10.3800048828125, -10.010009765625, -9.6400146484375, -9.27001953125, -8.9000244140625, -8.530029296875, -8.1600341796875, -7.7900390625, -7.4200439453125, -7.050048828125, -6.6800537109375, -6.31005859375, -5.9400634765625, -5.570068359375, -5.2000732421875, -4.830078125, -4.4600830078125, -4.090087890625, -3.7200927734375, -3.35009765625, -2.9801025390625, -2.610107421875, -2.2401123046875, -1.8701171875, -1.5001220703125, -1.130126953125, -0.7601318359375, -0.39013671875, -0.0201416015625, 0.349853515625, 0.7198486328125, 1.08984375, 1.4598388671875, 1.829833984375, 2.1998291015625, 2.56982421875, 2.9398193359375, 3.309814453125, 3.6798095703125, 4.0498046875, 4.4197998046875, 4.789794921875, 5.1597900390625, 5.52978515625, 5.8997802734375, 6.269775390625, 6.6397705078125, 7.009765625, 7.3797607421875, 7.749755859375, 8.1197509765625, 8.48974609375, 8.8597412109375, 9.229736328125, 9.5997314453125, 9.9697265625, 10.3397216796875, 10.709716796875, 11.0797119140625, 11.44970703125, 11.8197021484375, 12.189697265625, 12.5596923828125, 12.9296875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 5.0, 16.0, 23.0, 36.0, 52.0, 68.0, 120.0, 165.0, 287.0, 421.0, 647.0, 962.0, 1507.0, 2468.0, 3699.0, 5785.0, 9058.0, 13732.0, 21149.0, 31149.0, 44910.0, 62133.0, 80937.0, 97827.0, 110528.0, 113448.0, 106874.0, 92346.0, 74191.0, 55310.0, 39724.0, 27345.0, 18413.0, 11774.0, 7713.0, 4956.0, 3156.0, 1921.0, 1289.0, 774.0, 576.0, 358.0, 224.0, 167.0, 106.0, 78.0, 39.0, 36.0, 15.0, 18.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0], "bins": [-7.1953125, -6.9793701171875, -6.763427734375, -6.5474853515625, -6.33154296875, -6.1156005859375, -5.899658203125, -5.6837158203125, -5.4677734375, -5.2518310546875, -5.035888671875, -4.8199462890625, -4.60400390625, -4.3880615234375, -4.172119140625, -3.9561767578125, -3.740234375, -3.5242919921875, -3.308349609375, -3.0924072265625, -2.87646484375, -2.6605224609375, -2.444580078125, -2.2286376953125, -2.0126953125, -1.7967529296875, -1.580810546875, -1.3648681640625, -1.14892578125, -0.9329833984375, -0.717041015625, -0.5010986328125, -0.28515625, -0.0692138671875, 0.146728515625, 0.3626708984375, 0.57861328125, 0.7945556640625, 1.010498046875, 1.2264404296875, 1.4423828125, 1.6583251953125, 1.874267578125, 2.0902099609375, 2.30615234375, 2.5220947265625, 2.738037109375, 2.9539794921875, 3.169921875, 3.3858642578125, 3.601806640625, 3.8177490234375, 4.03369140625, 4.2496337890625, 4.465576171875, 4.6815185546875, 4.8974609375, 5.1134033203125, 5.329345703125, 5.5452880859375, 5.76123046875, 5.9771728515625, 6.193115234375, 6.4090576171875, 6.625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 10.0, 7.0, 9.0, 8.0, 12.0, 10.0, 12.0, 14.0, 18.0, 22.0, 25.0, 38.0, 23.0, 26.0, 40.0, 38.0, 46.0, 45.0, 39.0, 37.0, 37.0, 37.0, 43.0, 36.0, 36.0, 26.0, 32.0, 40.0, 36.0, 27.0, 24.0, 21.0, 25.0, 18.0, 11.0, 14.0, 6.0, 14.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.8359375, -7.6085205078125, -7.381103515625, -7.1536865234375, -6.92626953125, -6.6988525390625, -6.471435546875, -6.2440185546875, -6.0166015625, -5.7891845703125, -5.561767578125, -5.3343505859375, -5.10693359375, -4.8795166015625, -4.652099609375, -4.4246826171875, -4.197265625, -3.9698486328125, -3.742431640625, -3.5150146484375, -3.28759765625, -3.0601806640625, -2.832763671875, -2.6053466796875, -2.3779296875, -2.1505126953125, -1.923095703125, -1.6956787109375, -1.46826171875, -1.2408447265625, -1.013427734375, -0.7860107421875, -0.55859375, -0.3311767578125, -0.103759765625, 0.1236572265625, 0.35107421875, 0.5784912109375, 0.805908203125, 1.0333251953125, 1.2607421875, 1.4881591796875, 1.715576171875, 1.9429931640625, 2.17041015625, 2.3978271484375, 2.625244140625, 2.8526611328125, 3.080078125, 3.3074951171875, 3.534912109375, 3.7623291015625, 3.98974609375, 4.2171630859375, 4.444580078125, 4.6719970703125, 4.8994140625, 5.1268310546875, 5.354248046875, 5.5816650390625, 5.80908203125, 6.0364990234375, 6.263916015625, 6.4913330078125, 6.71875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 6.0, 10.0, 20.0, 25.0, 33.0, 54.0, 74.0, 98.0, 169.0, 251.0, 385.0, 712.0, 1041.0, 1771.0, 3012.0, 4872.0, 7972.0, 12804.0, 20460.0, 31658.0, 47534.0, 66963.0, 88502.0, 107628.0, 120318.0, 120613.0, 110182.0, 90710.0, 69402.0, 49884.0, 33927.0, 21624.0, 13844.0, 8496.0, 5275.0, 3198.0, 1923.0, 1175.0, 731.0, 435.0, 275.0, 174.0, 103.0, 79.0, 41.0, 33.0, 22.0, 12.0, 13.0, 7.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.025390625, -1.964141845703125, -1.90289306640625, -1.841644287109375, -1.7803955078125, -1.719146728515625, -1.65789794921875, -1.596649169921875, -1.535400390625, -1.474151611328125, -1.41290283203125, -1.351654052734375, -1.2904052734375, -1.229156494140625, -1.16790771484375, -1.106658935546875, -1.04541015625, -0.984161376953125, -0.92291259765625, -0.861663818359375, -0.8004150390625, -0.739166259765625, -0.67791748046875, -0.616668701171875, -0.555419921875, -0.494171142578125, -0.43292236328125, -0.371673583984375, -0.3104248046875, -0.249176025390625, -0.18792724609375, -0.126678466796875, -0.0654296875, -0.004180908203125, 0.05706787109375, 0.118316650390625, 0.1795654296875, 0.240814208984375, 0.30206298828125, 0.363311767578125, 0.424560546875, 0.485809326171875, 0.54705810546875, 0.608306884765625, 0.6695556640625, 0.730804443359375, 0.79205322265625, 0.853302001953125, 0.91455078125, 0.975799560546875, 1.03704833984375, 1.098297119140625, 1.1595458984375, 1.220794677734375, 1.28204345703125, 1.343292236328125, 1.404541015625, 1.465789794921875, 1.52703857421875, 1.588287353515625, 1.6495361328125, 1.710784912109375, 1.77203369140625, 1.833282470703125, 1.89453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 10.0, 4.0, 10.0, 9.0, 10.0, 8.0, 14.0, 15.0, 11.0, 27.0, 29.0, 17.0, 37.0, 22.0, 36.0, 34.0, 35.0, 56.0, 40.0, 42.0, 32.0, 37.0, 43.0, 37.0, 40.0, 50.0, 43.0, 39.0, 32.0, 16.0, 21.0, 23.0, 20.0, 11.0, 9.0, 15.0, 4.0, 9.0, 4.0, 10.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00017714500427246094, -0.00017140433192253113, -0.00016566365957260132, -0.0001599229872226715, -0.0001541823148727417, -0.0001484416425228119, -0.00014270097017288208, -0.00013696029782295227, -0.00013121962547302246, -0.00012547895312309265, -0.00011973828077316284, -0.00011399760842323303, -0.00010825693607330322, -0.00010251626372337341, -9.67755913734436e-05, -9.10349190235138e-05, -8.529424667358398e-05, -7.955357432365417e-05, -7.381290197372437e-05, -6.807222962379456e-05, -6.233155727386475e-05, -5.6590884923934937e-05, -5.085021257400513e-05, -4.510954022407532e-05, -3.936886787414551e-05, -3.36281955242157e-05, -2.788752317428589e-05, -2.214685082435608e-05, -1.640617847442627e-05, -1.066550612449646e-05, -4.92483377456665e-06, 8.158385753631592e-07, 6.556510925292969e-06, 1.2297183275222778e-05, 1.8037855625152588e-05, 2.3778527975082397e-05, 2.9519200325012207e-05, 3.5259872674942017e-05, 4.1000545024871826e-05, 4.6741217374801636e-05, 5.2481889724731445e-05, 5.8222562074661255e-05, 6.396323442459106e-05, 6.970390677452087e-05, 7.544457912445068e-05, 8.118525147438049e-05, 8.69259238243103e-05, 9.266659617424011e-05, 9.840726852416992e-05, 0.00010414794087409973, 0.00010988861322402954, 0.00011562928557395935, 0.00012136995792388916, 0.00012711063027381897, 0.00013285130262374878, 0.0001385919749736786, 0.0001443326473236084, 0.0001500733196735382, 0.00015581399202346802, 0.00016155466437339783, 0.00016729533672332764, 0.00017303600907325745, 0.00017877668142318726, 0.00018451735377311707, 0.00019025802612304688]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 9.0, 11.0, 18.0, 22.0, 40.0, 55.0, 75.0, 127.0, 179.0, 321.0, 435.0, 742.0, 1098.0, 1868.0, 3081.0, 4907.0, 8268.0, 13414.0, 20935.0, 33204.0, 49219.0, 69764.0, 92569.0, 113307.0, 124438.0, 123163.0, 109052.0, 88184.0, 64762.0, 45481.0, 29694.0, 18961.0, 11977.0, 7443.0, 4509.0, 2745.0, 1657.0, 1016.0, 647.0, 408.0, 264.0, 150.0, 104.0, 75.0, 56.0, 28.0, 29.0, 15.0, 10.0, 6.0, 4.0, 4.0, 1.0, 5.0, 3.0], "bins": [-2.216796875, -2.1513824462890625, -2.085968017578125, -2.0205535888671875, -1.95513916015625, -1.8897247314453125, -1.824310302734375, -1.7588958740234375, -1.6934814453125, -1.6280670166015625, -1.562652587890625, -1.4972381591796875, -1.43182373046875, -1.3664093017578125, -1.300994873046875, -1.2355804443359375, -1.170166015625, -1.1047515869140625, -1.039337158203125, -0.9739227294921875, -0.90850830078125, -0.8430938720703125, -0.777679443359375, -0.7122650146484375, -0.6468505859375, -0.5814361572265625, -0.516021728515625, -0.4506072998046875, -0.38519287109375, -0.3197784423828125, -0.254364013671875, -0.1889495849609375, -0.12353515625, -0.0581207275390625, 0.007293701171875, 0.0727081298828125, 0.13812255859375, 0.2035369873046875, 0.268951416015625, 0.3343658447265625, 0.3997802734375, 0.4651947021484375, 0.530609130859375, 0.5960235595703125, 0.66143798828125, 0.7268524169921875, 0.792266845703125, 0.8576812744140625, 0.923095703125, 0.9885101318359375, 1.053924560546875, 1.1193389892578125, 1.18475341796875, 1.2501678466796875, 1.315582275390625, 1.3809967041015625, 1.4464111328125, 1.5118255615234375, 1.577239990234375, 1.6426544189453125, 1.70806884765625, 1.7734832763671875, 1.838897705078125, 1.9043121337890625, 1.9697265625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 11.0, 12.0, 14.0, 13.0, 30.0, 24.0, 41.0, 44.0, 57.0, 40.0, 63.0, 58.0, 64.0, 71.0, 71.0, 56.0, 51.0, 58.0, 39.0, 39.0, 36.0, 21.0, 16.0, 12.0, 12.0, 8.0, 7.0, 9.0, 3.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.9660491943359375, -0.927215576171875, -0.8883819580078125, -0.84954833984375, -0.8107147216796875, -0.771881103515625, -0.7330474853515625, -0.6942138671875, -0.6553802490234375, -0.616546630859375, -0.5777130126953125, -0.53887939453125, -0.5000457763671875, -0.461212158203125, -0.4223785400390625, -0.383544921875, -0.3447113037109375, -0.305877685546875, -0.2670440673828125, -0.22821044921875, -0.1893768310546875, -0.150543212890625, -0.1117095947265625, -0.0728759765625, -0.0340423583984375, 0.004791259765625, 0.0436248779296875, 0.08245849609375, 0.1212921142578125, 0.160125732421875, 0.1989593505859375, 0.23779296875, 0.2766265869140625, 0.315460205078125, 0.3542938232421875, 0.39312744140625, 0.4319610595703125, 0.470794677734375, 0.5096282958984375, 0.5484619140625, 0.5872955322265625, 0.626129150390625, 0.6649627685546875, 0.70379638671875, 0.7426300048828125, 0.781463623046875, 0.8202972412109375, 0.859130859375, 0.8979644775390625, 0.936798095703125, 0.9756317138671875, 1.01446533203125, 1.0532989501953125, 1.092132568359375, 1.1309661865234375, 1.1697998046875, 1.2086334228515625, 1.247467041015625, 1.2863006591796875, 1.32513427734375, 1.3639678955078125, 1.402801513671875, 1.4416351318359375, 1.48046875]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 4.0, 2.0, 4.0, 7.0, 3.0, 12.0, 11.0, 11.0, 21.0, 21.0, 29.0, 27.0, 27.0, 40.0, 40.0, 37.0, 44.0, 35.0, 43.0, 48.0, 41.0, 58.0, 47.0, 48.0, 34.0, 30.0, 34.0, 41.0, 34.0, 20.0, 21.0, 19.0, 27.0, 18.0, 11.0, 8.0, 9.0, 7.0, 10.0, 4.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.987759590148926, -8.703994750976562, -8.420230865478516, -8.136466026306152, -7.852701187133789, -7.568936347961426, -7.285171985626221, -7.001407623291016, -6.717642784118652, -6.433877944946289, -6.150113582611084, -5.866349220275879, -5.582584381103516, -5.298819541931152, -5.015055179595947, -4.731290817260742, -4.447525978088379, -4.163761138916016, -3.8799967765808105, -3.5962321758270264, -3.312467575073242, -3.028702974319458, -2.744938373565674, -2.4611737728118896, -2.1774091720581055, -1.8936445713043213, -1.609879970550537, -1.326115369796753, -1.0423507690429688, -0.7585861682891846, -0.4748215675354004, -0.1910569667816162, 0.09270668029785156, 0.37647128105163574, 0.6602358818054199, 0.9440004825592041, 1.2277650833129883, 1.5115296840667725, 1.7952942848205566, 2.079058885574341, 2.362823486328125, 2.646588087081909, 2.9303526878356934, 3.2141172885894775, 3.4978818893432617, 3.781646490097046, 4.06541109085083, 4.349175453186035, 4.632940292358398, 4.916705131530762, 5.200469493865967, 5.484233856201172, 5.767998695373535, 6.051763534545898, 6.3355278968811035, 6.619292259216309, 6.903057098388672, 7.186821937561035, 7.47058629989624, 7.754350662231445, 8.038115501403809, 8.321880340576172, 8.605644226074219, 8.889409065246582, 9.173173904418945]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 10.0, 10.0, 10.0, 19.0, 14.0, 6.0, 19.0, 16.0, 16.0, 24.0, 24.0, 41.0, 35.0, 40.0, 34.0, 43.0, 42.0, 37.0, 55.0, 33.0, 52.0, 45.0, 46.0, 38.0, 26.0, 30.0, 30.0, 22.0, 20.0, 22.0, 22.0, 27.0, 15.0, 13.0, 15.0, 10.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.09431266784668, -11.716167449951172, -11.338022232055664, -10.959877014160156, -10.581731796264648, -10.20358657836914, -9.825441360473633, -9.447296142578125, -9.069150924682617, -8.69100570678711, -8.312860488891602, -7.934715270996094, -7.556570053100586, -7.178424835205078, -6.80027961730957, -6.4221343994140625, -6.043989181518555, -5.665843963623047, -5.287698745727539, -4.909553527832031, -4.531408309936523, -4.153263092041016, -3.775117874145508, -3.39697265625, -3.018827438354492, -2.6406822204589844, -2.2625370025634766, -1.8843917846679688, -1.506246566772461, -1.1281013488769531, -0.7499561309814453, -0.3718109130859375, 0.0063343048095703125, 0.3844795227050781, 0.7626247406005859, 1.1407699584960938, 1.5189151763916016, 1.8970603942871094, 2.275205612182617, 2.653350830078125, 3.031496047973633, 3.4096412658691406, 3.7877864837646484, 4.165931701660156, 4.544076919555664, 4.922222137451172, 5.30036735534668, 5.6785125732421875, 6.056657791137695, 6.434803009033203, 6.812948226928711, 7.191093444824219, 7.569238662719727, 7.947383880615234, 8.325529098510742, 8.70367431640625, 9.081819534301758, 9.459964752197266, 9.838109970092773, 10.216255187988281, 10.594400405883789, 10.972545623779297, 11.350690841674805, 11.728836059570312, 12.10698127746582]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 6.0, 7.0, 8.0, 7.0, 14.0, 23.0, 35.0, 62.0, 97.0, 128.0, 265.0, 412.0, 599.0, 1007.0, 1628.0, 2543.0, 4104.0, 6474.0, 10123.0, 16059.0, 25301.0, 39797.0, 61186.0, 94462.0, 141400.0, 204768.0, 285425.0, 372856.0, 449163.0, 489484.0, 476800.0, 418918.0, 335623.0, 248479.0, 173874.0, 117577.0, 77589.0, 50355.0, 32354.0, 20494.0, 13068.0, 8084.0, 5141.0, 3075.0, 1976.0, 1332.0, 829.0, 495.0, 308.0, 186.0, 105.0, 71.0, 55.0, 36.0, 15.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.796875, -6.5760498046875, -6.355224609375, -6.1343994140625, -5.91357421875, -5.6927490234375, -5.471923828125, -5.2510986328125, -5.0302734375, -4.8094482421875, -4.588623046875, -4.3677978515625, -4.14697265625, -3.9261474609375, -3.705322265625, -3.4844970703125, -3.263671875, -3.0428466796875, -2.822021484375, -2.6011962890625, -2.38037109375, -2.1595458984375, -1.938720703125, -1.7178955078125, -1.4970703125, -1.2762451171875, -1.055419921875, -0.8345947265625, -0.61376953125, -0.3929443359375, -0.172119140625, 0.0487060546875, 0.26953125, 0.4903564453125, 0.711181640625, 0.9320068359375, 1.15283203125, 1.3736572265625, 1.594482421875, 1.8153076171875, 2.0361328125, 2.2569580078125, 2.477783203125, 2.6986083984375, 2.91943359375, 3.1402587890625, 3.361083984375, 3.5819091796875, 3.802734375, 4.0235595703125, 4.244384765625, 4.4652099609375, 4.68603515625, 4.9068603515625, 5.127685546875, 5.3485107421875, 5.5693359375, 5.7901611328125, 6.010986328125, 6.2318115234375, 6.45263671875, 6.6734619140625, 6.894287109375, 7.1151123046875, 7.3359375]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 7.0, 12.0, 7.0, 6.0, 17.0, 19.0, 17.0, 22.0, 16.0, 22.0, 33.0, 33.0, 36.0, 39.0, 39.0, 43.0, 62.0, 49.0, 45.0, 45.0, 33.0, 41.0, 38.0, 44.0, 42.0, 26.0, 27.0, 26.0, 24.0, 17.0, 19.0, 21.0, 13.0, 12.0, 11.0, 7.0, 10.0, 3.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.203125, -9.899169921875, -9.59521484375, -9.291259765625, -8.9873046875, -8.683349609375, -8.37939453125, -8.075439453125, -7.771484375, -7.467529296875, -7.16357421875, -6.859619140625, -6.5556640625, -6.251708984375, -5.94775390625, -5.643798828125, -5.33984375, -5.035888671875, -4.73193359375, -4.427978515625, -4.1240234375, -3.820068359375, -3.51611328125, -3.212158203125, -2.908203125, -2.604248046875, -2.30029296875, -1.996337890625, -1.6923828125, -1.388427734375, -1.08447265625, -0.780517578125, -0.4765625, -0.172607421875, 0.13134765625, 0.435302734375, 0.7392578125, 1.043212890625, 1.34716796875, 1.651123046875, 1.955078125, 2.259033203125, 2.56298828125, 2.866943359375, 3.1708984375, 3.474853515625, 3.77880859375, 4.082763671875, 4.38671875, 4.690673828125, 4.99462890625, 5.298583984375, 5.6025390625, 5.906494140625, 6.21044921875, 6.514404296875, 6.818359375, 7.122314453125, 7.42626953125, 7.730224609375, 8.0341796875, 8.338134765625, 8.64208984375, 8.946044921875, 9.25]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 5.0, 14.0, 16.0, 30.0, 49.0, 76.0, 114.0, 201.0, 342.0, 566.0, 944.0, 1552.0, 2487.0, 4010.0, 6473.0, 10423.0, 16497.0, 25685.0, 39091.0, 58579.0, 86051.0, 122299.0, 168131.0, 220345.0, 278603.0, 333635.0, 373867.0, 395984.0, 393068.0, 366155.0, 320144.0, 263821.0, 207461.0, 156535.0, 112528.0, 77898.0, 53374.0, 35408.0, 22976.0, 14648.0, 9267.0, 5685.0, 3613.0, 2210.0, 1344.0, 833.0, 508.0, 314.0, 172.0, 107.0, 46.0, 52.0, 24.0, 18.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0], "bins": [-6.03515625, -5.8458251953125, -5.656494140625, -5.4671630859375, -5.27783203125, -5.0885009765625, -4.899169921875, -4.7098388671875, -4.5205078125, -4.3311767578125, -4.141845703125, -3.9525146484375, -3.76318359375, -3.5738525390625, -3.384521484375, -3.1951904296875, -3.005859375, -2.8165283203125, -2.627197265625, -2.4378662109375, -2.24853515625, -2.0592041015625, -1.869873046875, -1.6805419921875, -1.4912109375, -1.3018798828125, -1.112548828125, -0.9232177734375, -0.73388671875, -0.5445556640625, -0.355224609375, -0.1658935546875, 0.0234375, 0.2127685546875, 0.402099609375, 0.5914306640625, 0.78076171875, 0.9700927734375, 1.159423828125, 1.3487548828125, 1.5380859375, 1.7274169921875, 1.916748046875, 2.1060791015625, 2.29541015625, 2.4847412109375, 2.674072265625, 2.8634033203125, 3.052734375, 3.2420654296875, 3.431396484375, 3.6207275390625, 3.81005859375, 3.9993896484375, 4.188720703125, 4.3780517578125, 4.5673828125, 4.7567138671875, 4.946044921875, 5.1353759765625, 5.32470703125, 5.5140380859375, 5.703369140625, 5.8927001953125, 6.08203125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 8.0, 15.0, 12.0, 14.0, 35.0, 35.0, 39.0, 37.0, 64.0, 66.0, 100.0, 105.0, 131.0, 134.0, 151.0, 171.0, 177.0, 232.0, 201.0, 205.0, 203.0, 221.0, 205.0, 185.0, 178.0, 158.0, 163.0, 133.0, 127.0, 104.0, 76.0, 79.0, 53.0, 73.0, 40.0, 40.0, 20.0, 16.0, 11.0, 12.0, 11.0, 8.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.30859375, -4.17547607421875, -4.0423583984375, -3.90924072265625, -3.776123046875, -3.64300537109375, -3.5098876953125, -3.37677001953125, -3.24365234375, -3.11053466796875, -2.9774169921875, -2.84429931640625, -2.711181640625, -2.57806396484375, -2.4449462890625, -2.31182861328125, -2.1787109375, -2.04559326171875, -1.9124755859375, -1.77935791015625, -1.646240234375, -1.51312255859375, -1.3800048828125, -1.24688720703125, -1.11376953125, -0.98065185546875, -0.8475341796875, -0.71441650390625, -0.581298828125, -0.44818115234375, -0.3150634765625, -0.18194580078125, -0.048828125, 0.08428955078125, 0.2174072265625, 0.35052490234375, 0.483642578125, 0.61676025390625, 0.7498779296875, 0.88299560546875, 1.01611328125, 1.14923095703125, 1.2823486328125, 1.41546630859375, 1.548583984375, 1.68170166015625, 1.8148193359375, 1.94793701171875, 2.0810546875, 2.21417236328125, 2.3472900390625, 2.48040771484375, 2.613525390625, 2.74664306640625, 2.8797607421875, 3.01287841796875, 3.14599609375, 3.27911376953125, 3.4122314453125, 3.54534912109375, 3.678466796875, 3.81158447265625, 3.9447021484375, 4.07781982421875, 4.2109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 8.0, 11.0, 17.0, 12.0, 16.0, 30.0, 19.0, 27.0, 29.0, 38.0, 33.0, 44.0, 41.0, 55.0, 58.0, 54.0, 39.0, 43.0, 50.0, 41.0, 47.0, 41.0, 33.0, 37.0, 31.0, 34.0, 16.0, 11.0, 16.0, 14.0, 14.0, 6.0, 5.0, 8.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.910574913024902, -8.616293907165527, -8.322012901306152, -8.027731895446777, -7.7334513664245605, -7.4391703605651855, -7.1448893547058105, -6.850608825683594, -6.556327819824219, -6.262046813964844, -5.967765808105469, -5.673484802246094, -5.379204273223877, -5.084923267364502, -4.790642261505127, -4.49636173248291, -4.202080249786377, -3.907799243927002, -3.613518476486206, -3.319237470626831, -3.024956703186035, -2.73067569732666, -2.436394691467285, -2.1421139240264893, -1.8478329181671143, -1.5535520315170288, -1.2592711448669434, -0.9649901390075684, -0.6707092523574829, -0.37642836570739746, -0.08214735984802246, 0.21213340759277344, 0.5064144134521484, 0.8006953001022339, 1.0949761867523193, 1.3892571926116943, 1.6835380792617798, 1.9778189659118652, 2.2720999717712402, 2.566380739212036, 2.860661745071411, 3.154942750930786, 3.449223518371582, 3.743504524230957, 4.037785530090332, 4.332066535949707, 4.626347541809082, 4.920628070831299, 5.214909076690674, 5.509190082550049, 5.803471088409424, 6.097751617431641, 6.392032623291016, 6.686313629150391, 6.980594635009766, 7.274875640869141, 7.569156646728516, 7.863437652587891, 8.157718658447266, 8.45199966430664, 8.746280670166016, 9.04056167602539, 9.334842681884766, 9.629122734069824, 9.9234037399292]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 11.0, 8.0, 14.0, 15.0, 12.0, 20.0, 20.0, 24.0, 22.0, 24.0, 34.0, 24.0, 46.0, 29.0, 50.0, 33.0, 37.0, 42.0, 36.0, 41.0, 45.0, 44.0, 35.0, 35.0, 34.0, 26.0, 31.0, 34.0, 17.0, 24.0, 11.0, 26.0, 16.0, 14.0, 14.0, 9.0, 9.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.705789566040039, -10.365928649902344, -10.026067733764648, -9.686206817626953, -9.346344947814941, -9.006484031677246, -8.66662311553955, -8.326762199401855, -7.986900806427002, -7.647039890289307, -7.307178497314453, -6.967317581176758, -6.6274566650390625, -6.287595272064209, -5.947734355926514, -5.60787296295166, -5.268012046813965, -4.9281511306762695, -4.588289737701416, -4.248428821563721, -3.9085676670074463, -3.568706512451172, -3.2288455963134766, -2.888984441757202, -2.5491232872009277, -2.2092621326446533, -1.8694010972976685, -1.5295400619506836, -1.1896789073944092, -0.8498177528381348, -0.5099568367004395, -0.17009568214416504, 0.16976642608642578, 0.5096275210380554, 0.8494886159896851, 1.18934965133667, 1.5292108058929443, 1.8690719604492188, 2.208932876586914, 2.5487940311431885, 2.888655185699463, 3.2285163402557373, 3.5683774948120117, 3.908238410949707, 4.248099327087402, 4.587960720062256, 4.927821636199951, 5.267683029174805, 5.6075439453125, 5.947404861450195, 6.287266254425049, 6.627127170562744, 6.966988563537598, 7.306849479675293, 7.646710395812988, 7.986571311950684, 8.326433181762695, 8.66629409790039, 9.006155014038086, 9.346015930175781, 9.685877799987793, 10.025738716125488, 10.365599632263184, 10.705460548400879, 11.045321464538574]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 9.0, 18.0, 34.0, 42.0, 64.0, 85.0, 126.0, 157.0, 263.0, 345.0, 492.0, 747.0, 988.0, 1449.0, 2143.0, 3138.0, 4756.0, 6904.0, 10581.0, 16334.0, 25372.0, 39739.0, 64520.0, 106029.0, 163233.0, 194513.0, 150391.0, 94608.0, 57731.0, 36344.0, 22970.0, 14986.0, 9427.0, 6314.0, 4313.0, 2947.0, 1971.0, 1346.0, 977.0, 621.0, 463.0, 359.0, 228.0, 142.0, 110.0, 68.0, 47.0, 40.0, 19.0, 23.0, 13.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.8564453125, -1.79730224609375, -1.7381591796875, -1.67901611328125, -1.619873046875, -1.56072998046875, -1.5015869140625, -1.44244384765625, -1.38330078125, -1.32415771484375, -1.2650146484375, -1.20587158203125, -1.146728515625, -1.08758544921875, -1.0284423828125, -0.96929931640625, -0.91015625, -0.85101318359375, -0.7918701171875, -0.73272705078125, -0.673583984375, -0.61444091796875, -0.5552978515625, -0.49615478515625, -0.43701171875, -0.37786865234375, -0.3187255859375, -0.25958251953125, -0.200439453125, -0.14129638671875, -0.0821533203125, -0.02301025390625, 0.0361328125, 0.09527587890625, 0.1544189453125, 0.21356201171875, 0.272705078125, 0.33184814453125, 0.3909912109375, 0.45013427734375, 0.50927734375, 0.56842041015625, 0.6275634765625, 0.68670654296875, 0.745849609375, 0.80499267578125, 0.8641357421875, 0.92327880859375, 0.982421875, 1.04156494140625, 1.1007080078125, 1.15985107421875, 1.218994140625, 1.27813720703125, 1.3372802734375, 1.39642333984375, 1.45556640625, 1.51470947265625, 1.5738525390625, 1.63299560546875, 1.692138671875, 1.75128173828125, 1.8104248046875, 1.86956787109375, 1.9287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 6.0, 6.0, 9.0, 16.0, 10.0, 12.0, 10.0, 17.0, 32.0, 22.0, 35.0, 22.0, 34.0, 35.0, 33.0, 32.0, 40.0, 32.0, 43.0, 48.0, 47.0, 37.0, 35.0, 34.0, 49.0, 35.0, 33.0, 26.0, 22.0, 31.0, 22.0, 21.0, 13.0, 16.0, 15.0, 15.0, 7.0, 14.0, 9.0, 4.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.40625, -11.058837890625, -10.71142578125, -10.364013671875, -10.0166015625, -9.669189453125, -9.32177734375, -8.974365234375, -8.626953125, -8.279541015625, -7.93212890625, -7.584716796875, -7.2373046875, -6.889892578125, -6.54248046875, -6.195068359375, -5.84765625, -5.500244140625, -5.15283203125, -4.805419921875, -4.4580078125, -4.110595703125, -3.76318359375, -3.415771484375, -3.068359375, -2.720947265625, -2.37353515625, -2.026123046875, -1.6787109375, -1.331298828125, -0.98388671875, -0.636474609375, -0.2890625, 0.058349609375, 0.40576171875, 0.753173828125, 1.1005859375, 1.447998046875, 1.79541015625, 2.142822265625, 2.490234375, 2.837646484375, 3.18505859375, 3.532470703125, 3.8798828125, 4.227294921875, 4.57470703125, 4.922119140625, 5.26953125, 5.616943359375, 5.96435546875, 6.311767578125, 6.6591796875, 7.006591796875, 7.35400390625, 7.701416015625, 8.048828125, 8.396240234375, 8.74365234375, 9.091064453125, 9.4384765625, 9.785888671875, 10.13330078125, 10.480712890625, 10.828125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 10.0, 20.0, 26.0, 25.0, 23.0, 36.0, 55.0, 69.0, 108.0, 153.0, 179.0, 291.0, 350.0, 601.0, 838.0, 1411.0, 2571.0, 5448.0, 13063.0, 36349.0, 896039.0, 56886.0, 18549.0, 7242.0, 3178.0, 1730.0, 1032.0, 660.0, 481.0, 298.0, 221.0, 168.0, 119.0, 88.0, 46.0, 35.0, 30.0, 27.0, 18.0, 21.0, 13.0, 10.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.7578125, -6.54449462890625, -6.3311767578125, -6.11785888671875, -5.904541015625, -5.69122314453125, -5.4779052734375, -5.26458740234375, -5.05126953125, -4.83795166015625, -4.6246337890625, -4.41131591796875, -4.197998046875, -3.98468017578125, -3.7713623046875, -3.55804443359375, -3.3447265625, -3.13140869140625, -2.9180908203125, -2.70477294921875, -2.491455078125, -2.27813720703125, -2.0648193359375, -1.85150146484375, -1.63818359375, -1.42486572265625, -1.2115478515625, -0.99822998046875, -0.784912109375, -0.57159423828125, -0.3582763671875, -0.14495849609375, 0.068359375, 0.28167724609375, 0.4949951171875, 0.70831298828125, 0.921630859375, 1.13494873046875, 1.3482666015625, 1.56158447265625, 1.77490234375, 1.98822021484375, 2.2015380859375, 2.41485595703125, 2.628173828125, 2.84149169921875, 3.0548095703125, 3.26812744140625, 3.4814453125, 3.69476318359375, 3.9080810546875, 4.12139892578125, 4.334716796875, 4.54803466796875, 4.7613525390625, 4.97467041015625, 5.18798828125, 5.40130615234375, 5.6146240234375, 5.82794189453125, 6.041259765625, 6.25457763671875, 6.4678955078125, 6.68121337890625, 6.89453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 7.0, 8.0, 7.0, 10.0, 11.0, 13.0, 21.0, 10.0, 13.0, 16.0, 24.0, 28.0, 24.0, 23.0, 36.0, 32.0, 36.0, 38.0, 39.0, 42.0, 33.0, 44.0, 34.0, 41.0, 48.0, 32.0, 36.0, 38.0, 29.0, 30.0, 22.0, 27.0, 15.0, 19.0, 17.0, 16.0, 15.0, 11.0, 11.0, 6.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.22265625, -6.9957275390625, -6.768798828125, -6.5418701171875, -6.31494140625, -6.0880126953125, -5.861083984375, -5.6341552734375, -5.4072265625, -5.1802978515625, -4.953369140625, -4.7264404296875, -4.49951171875, -4.2725830078125, -4.045654296875, -3.8187255859375, -3.591796875, -3.3648681640625, -3.137939453125, -2.9110107421875, -2.68408203125, -2.4571533203125, -2.230224609375, -2.0032958984375, -1.7763671875, -1.5494384765625, -1.322509765625, -1.0955810546875, -0.86865234375, -0.6417236328125, -0.414794921875, -0.1878662109375, 0.0390625, 0.2659912109375, 0.492919921875, 0.7198486328125, 0.94677734375, 1.1737060546875, 1.400634765625, 1.6275634765625, 1.8544921875, 2.0814208984375, 2.308349609375, 2.5352783203125, 2.76220703125, 2.9891357421875, 3.216064453125, 3.4429931640625, 3.669921875, 3.8968505859375, 4.123779296875, 4.3507080078125, 4.57763671875, 4.8045654296875, 5.031494140625, 5.2584228515625, 5.4853515625, 5.7122802734375, 5.939208984375, 6.1661376953125, 6.39306640625, 6.6199951171875, 6.846923828125, 7.0738525390625, 7.30078125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 10.0, 2.0, 14.0, 10.0, 16.0, 16.0, 14.0, 44.0, 62.0, 76.0, 78.0, 127.0, 163.0, 253.0, 364.0, 535.0, 898.0, 1505.0, 2902.0, 6579.0, 19762.0, 914215.0, 74804.0, 14606.0, 5349.0, 2385.0, 1330.0, 766.0, 496.0, 373.0, 211.0, 167.0, 111.0, 90.0, 58.0, 29.0, 34.0, 29.0, 20.0, 10.0, 11.0, 12.0, 5.0, 7.0, 2.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.92041015625, -0.8932418823242188, -0.8660736083984375, -0.8389053344726562, -0.811737060546875, -0.7845687866210938, -0.7574005126953125, -0.7302322387695312, -0.70306396484375, -0.6758956909179688, -0.6487274169921875, -0.6215591430664062, -0.594390869140625, -0.5672225952148438, -0.5400543212890625, -0.5128860473632812, -0.4857177734375, -0.45854949951171875, -0.4313812255859375, -0.40421295166015625, -0.377044677734375, -0.34987640380859375, -0.3227081298828125, -0.29553985595703125, -0.26837158203125, -0.24120330810546875, -0.2140350341796875, -0.18686676025390625, -0.159698486328125, -0.13253021240234375, -0.1053619384765625, -0.07819366455078125, -0.051025390625, -0.02385711669921875, 0.0033111572265625, 0.03047943115234375, 0.057647705078125, 0.08481597900390625, 0.1119842529296875, 0.13915252685546875, 0.16632080078125, 0.19348907470703125, 0.2206573486328125, 0.24782562255859375, 0.274993896484375, 0.30216217041015625, 0.3293304443359375, 0.35649871826171875, 0.3836669921875, 0.41083526611328125, 0.4380035400390625, 0.46517181396484375, 0.492340087890625, 0.5195083618164062, 0.5466766357421875, 0.5738449096679688, 0.60101318359375, 0.6281814575195312, 0.6553497314453125, 0.6825180053710938, 0.709686279296875, 0.7368545532226562, 0.7640228271484375, 0.7911911010742188, 0.818359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 12.0, 7.0, 8.0, 4.0, 12.0, 9.0, 13.0, 12.0, 18.0, 14.0, 25.0, 32.0, 21.0, 37.0, 28.0, 41.0, 34.0, 40.0, 35.0, 41.0, 44.0, 37.0, 41.0, 34.0, 43.0, 41.0, 46.0, 22.0, 38.0, 25.0, 28.0, 18.0, 17.0, 28.0, 19.0, 18.0, 12.0, 11.0, 7.0, 7.0, 6.0, 9.0, 6.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.735324859619141e-06, -6.52950257062912e-06, -6.323680281639099e-06, -6.117857992649078e-06, -5.912035703659058e-06, -5.706213414669037e-06, -5.500391125679016e-06, -5.294568836688995e-06, -5.088746547698975e-06, -4.882924258708954e-06, -4.677101969718933e-06, -4.471279680728912e-06, -4.265457391738892e-06, -4.059635102748871e-06, -3.85381281375885e-06, -3.6479905247688293e-06, -3.4421682357788086e-06, -3.236345946788788e-06, -3.030523657798767e-06, -2.8247013688087463e-06, -2.6188790798187256e-06, -2.413056790828705e-06, -2.207234501838684e-06, -2.0014122128486633e-06, -1.7955899238586426e-06, -1.5897676348686218e-06, -1.383945345878601e-06, -1.1781230568885803e-06, -9.723007678985596e-07, -7.664784789085388e-07, -5.606561899185181e-07, -3.548339009284973e-07, -1.4901161193847656e-07, 5.681067705154419e-08, 2.6263296604156494e-07, 4.684552550315857e-07, 6.742775440216064e-07, 8.800998330116272e-07, 1.085922122001648e-06, 1.2917444109916687e-06, 1.4975666999816895e-06, 1.7033889889717102e-06, 1.909211277961731e-06, 2.1150335669517517e-06, 2.3208558559417725e-06, 2.5266781449317932e-06, 2.732500433921814e-06, 2.9383227229118347e-06, 3.1441450119018555e-06, 3.3499673008918762e-06, 3.555789589881897e-06, 3.7616118788719177e-06, 3.9674341678619385e-06, 4.173256456851959e-06, 4.37907874584198e-06, 4.584901034832001e-06, 4.7907233238220215e-06, 4.996545612812042e-06, 5.202367901802063e-06, 5.408190190792084e-06, 5.6140124797821045e-06, 5.819834768772125e-06, 6.025657057762146e-06, 6.231479346752167e-06, 6.4373016357421875e-06]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 7.0, 10.0, 21.0, 19.0, 22.0, 48.0, 52.0, 111.0, 124.0, 228.0, 328.0, 461.0, 662.0, 993.0, 1480.0, 2211.0, 3416.0, 5487.0, 8389.0, 13393.0, 21148.0, 34111.0, 56943.0, 100458.0, 219247.0, 280992.0, 123510.0, 67088.0, 39977.0, 24600.0, 15320.0, 9630.0, 6294.0, 3967.0, 2615.0, 1754.0, 1102.0, 736.0, 509.0, 360.0, 243.0, 160.0, 106.0, 81.0, 46.0, 24.0, 25.0, 26.0, 9.0, 6.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.302001953125, -0.2923088073730469, -0.28261566162109375, -0.2729225158691406, -0.2632293701171875, -0.2535362243652344, -0.24384307861328125, -0.23414993286132812, -0.224456787109375, -0.21476364135742188, -0.20507049560546875, -0.19537734985351562, -0.1856842041015625, -0.17599105834960938, -0.16629791259765625, -0.15660476684570312, -0.14691162109375, -0.13721847534179688, -0.12752532958984375, -0.11783218383789062, -0.1081390380859375, -0.09844589233398438, -0.08875274658203125, -0.07905960083007812, -0.069366455078125, -0.059673309326171875, -0.04998016357421875, -0.040287017822265625, -0.0305938720703125, -0.020900726318359375, -0.01120758056640625, -0.001514434814453125, 0.0081787109375, 0.017871856689453125, 0.02756500244140625, 0.037258148193359375, 0.0469512939453125, 0.056644439697265625, 0.06633758544921875, 0.07603073120117188, 0.085723876953125, 0.09541702270507812, 0.10511016845703125, 0.11480331420898438, 0.1244964599609375, 0.13418960571289062, 0.14388275146484375, 0.15357589721679688, 0.16326904296875, 0.17296218872070312, 0.18265533447265625, 0.19234848022460938, 0.2020416259765625, 0.21173477172851562, 0.22142791748046875, 0.23112106323242188, 0.240814208984375, 0.2505073547363281, 0.26020050048828125, 0.2698936462402344, 0.2795867919921875, 0.2892799377441406, 0.29897308349609375, 0.3086662292480469, 0.318359375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 6.0, 6.0, 4.0, 4.0, 5.0, 14.0, 17.0, 25.0, 17.0, 16.0, 28.0, 26.0, 40.0, 41.0, 58.0, 58.0, 77.0, 82.0, 67.0, 64.0, 44.0, 37.0, 40.0, 35.0, 23.0, 29.0, 24.0, 21.0, 12.0, 20.0, 7.0, 10.0, 12.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.284423828125, -0.2766284942626953, -0.2688331604003906, -0.26103782653808594, -0.25324249267578125, -0.24544715881347656, -0.23765182495117188, -0.2298564910888672, -0.2220611572265625, -0.2142658233642578, -0.20647048950195312, -0.19867515563964844, -0.19087982177734375, -0.18308448791503906, -0.17528915405273438, -0.1674938201904297, -0.159698486328125, -0.1519031524658203, -0.14410781860351562, -0.13631248474121094, -0.12851715087890625, -0.12072181701660156, -0.11292648315429688, -0.10513114929199219, -0.0973358154296875, -0.08954048156738281, -0.08174514770507812, -0.07394981384277344, -0.06615447998046875, -0.05835914611816406, -0.050563812255859375, -0.04276847839355469, -0.03497314453125, -0.027177810668945312, -0.019382476806640625, -0.011587142944335938, -0.00379180908203125, 0.0040035247802734375, 0.011798858642578125, 0.019594192504882812, 0.0273895263671875, 0.03518486022949219, 0.042980194091796875, 0.05077552795410156, 0.05857086181640625, 0.06636619567871094, 0.07416152954101562, 0.08195686340332031, 0.089752197265625, 0.09754753112792969, 0.10534286499023438, 0.11313819885253906, 0.12093353271484375, 0.12872886657714844, 0.13652420043945312, 0.1443195343017578, 0.1521148681640625, 0.1599102020263672, 0.16770553588867188, 0.17550086975097656, 0.18329620361328125, 0.19109153747558594, 0.19888687133789062, 0.2066822052001953, 0.2144775390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 4.0, 7.0, 11.0, 16.0, 13.0, 17.0, 27.0, 23.0, 24.0, 40.0, 31.0, 46.0, 34.0, 46.0, 53.0, 54.0, 52.0, 49.0, 42.0, 48.0, 50.0, 46.0, 32.0, 38.0, 40.0, 29.0, 25.0, 21.0, 12.0, 12.0, 16.0, 9.0, 5.0, 8.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.013989448547363, -8.714558601379395, -8.415127754211426, -8.115696907043457, -7.81626558303833, -7.516834735870361, -7.217403411865234, -6.917972564697266, -6.618541717529297, -6.319110870361328, -6.019680023193359, -5.720248699188232, -5.420817852020264, -5.121387004852295, -4.821955680847168, -4.522524833679199, -4.2230939865112305, -3.9236631393432617, -3.624232053756714, -3.324800968170166, -3.0253701210021973, -2.7259392738342285, -2.4265081882476807, -2.127077102661133, -1.827646255493164, -1.5282152891159058, -1.2287843227386475, -0.9293533563613892, -0.6299223899841309, -0.33049142360687256, -0.031060457229614258, 0.2683706283569336, 0.5678005218505859, 0.8672314882278442, 1.1666624546051025, 1.4660934209823608, 1.7655243873596191, 2.064955234527588, 2.3643863201141357, 2.6638174057006836, 2.9632482528686523, 3.262679100036621, 3.562110185623169, 3.861541271209717, 4.1609721183776855, 4.460402965545654, 4.759834289550781, 5.05926513671875, 5.358695983886719, 5.6581268310546875, 5.957557678222656, 6.256989002227783, 6.556419849395752, 6.855850696563721, 7.155282020568848, 7.454712867736816, 7.754143714904785, 8.053574562072754, 8.353005409240723, 8.652436256408691, 8.951868057250977, 9.251298904418945, 9.550729751586914, 9.850160598754883, 10.149591445922852]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 8.0, 6.0, 10.0, 8.0, 14.0, 14.0, 14.0, 19.0, 23.0, 22.0, 23.0, 24.0, 35.0, 28.0, 44.0, 29.0, 44.0, 37.0, 39.0, 42.0, 36.0, 42.0, 44.0, 42.0, 35.0, 36.0, 30.0, 29.0, 32.0, 31.0, 15.0, 26.0, 16.0, 24.0, 13.0, 12.0, 13.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.571138381958008, -10.232892036437988, -9.894646644592285, -9.556400299072266, -9.218153953552246, -8.879907608032227, -8.541662216186523, -8.203415870666504, -7.865170001983643, -7.526924133300781, -7.188677787780762, -6.8504319190979, -6.512186050415039, -6.1739397048950195, -5.835693836212158, -5.497447967529297, -5.159201622009277, -4.820955753326416, -4.4827094078063965, -4.144463539123535, -3.8062174320220947, -3.4679713249206543, -3.129725456237793, -2.7914793491363525, -2.453233242034912, -2.1149871349334717, -1.7767411470413208, -1.43849515914917, -1.1002490520477295, -0.7620029449462891, -0.42375707626342773, -0.0855109691619873, 0.2527351379394531, 0.5909811854362488, 0.9292272329330444, 1.2674732208251953, 1.6057193279266357, 1.9439654350280762, 2.2822113037109375, 2.620457410812378, 2.9587035179138184, 3.296949625015259, 3.635195732116699, 3.9734416007995605, 4.311687469482422, 4.649933815002441, 4.988179683685303, 5.326425552368164, 5.664671897888184, 6.002917766571045, 6.3411641120910645, 6.679409980773926, 7.017656326293945, 7.355902194976807, 7.694148063659668, 8.032394409179688, 8.37063980102539, 8.70888614654541, 9.047131538391113, 9.385377883911133, 9.723624229431152, 10.061870574951172, 10.400115966796875, 10.738362312316895, 11.076608657836914]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 4.0, 3.0, 10.0, 8.0, 11.0, 19.0, 27.0, 51.0, 63.0, 85.0, 136.0, 212.0, 352.0, 528.0, 814.0, 1289.0, 1938.0, 2883.0, 4585.0, 7109.0, 10629.0, 16435.0, 24539.0, 35829.0, 49581.0, 67095.0, 84164.0, 99009.0, 108024.0, 108985.0, 100937.0, 86860.0, 69577.0, 52246.0, 37799.0, 26165.0, 17637.0, 11434.0, 7588.0, 4884.0, 3102.0, 2121.0, 1295.0, 878.0, 567.0, 352.0, 234.0, 172.0, 97.0, 70.0, 50.0, 30.0, 21.0, 9.0, 8.0, 7.0, 3.0, 7.0, 1.0, 0.0, 1.0], "bins": [-6.18359375, -5.9908447265625, -5.798095703125, -5.6053466796875, -5.41259765625, -5.2198486328125, -5.027099609375, -4.8343505859375, -4.6416015625, -4.4488525390625, -4.256103515625, -4.0633544921875, -3.87060546875, -3.6778564453125, -3.485107421875, -3.2923583984375, -3.099609375, -2.9068603515625, -2.714111328125, -2.5213623046875, -2.32861328125, -2.1358642578125, -1.943115234375, -1.7503662109375, -1.5576171875, -1.3648681640625, -1.172119140625, -0.9793701171875, -0.78662109375, -0.5938720703125, -0.401123046875, -0.2083740234375, -0.015625, 0.1771240234375, 0.369873046875, 0.5626220703125, 0.75537109375, 0.9481201171875, 1.140869140625, 1.3336181640625, 1.5263671875, 1.7191162109375, 1.911865234375, 2.1046142578125, 2.29736328125, 2.4901123046875, 2.682861328125, 2.8756103515625, 3.068359375, 3.2611083984375, 3.453857421875, 3.6466064453125, 3.83935546875, 4.0321044921875, 4.224853515625, 4.4176025390625, 4.6103515625, 4.8031005859375, 4.995849609375, 5.1885986328125, 5.38134765625, 5.5740966796875, 5.766845703125, 5.9595947265625, 6.15234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 12.0, 8.0, 7.0, 12.0, 12.0, 18.0, 21.0, 24.0, 26.0, 23.0, 32.0, 32.0, 29.0, 44.0, 28.0, 39.0, 46.0, 37.0, 47.0, 39.0, 35.0, 32.0, 40.0, 43.0, 26.0, 37.0, 28.0, 32.0, 19.0, 29.0, 19.0, 25.0, 15.0, 11.0, 13.0, 11.0, 11.0, 4.0, 5.0, 1.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.5859375, -10.2535400390625, -9.921142578125, -9.5887451171875, -9.25634765625, -8.9239501953125, -8.591552734375, -8.2591552734375, -7.9267578125, -7.5943603515625, -7.261962890625, -6.9295654296875, -6.59716796875, -6.2647705078125, -5.932373046875, -5.5999755859375, -5.267578125, -4.9351806640625, -4.602783203125, -4.2703857421875, -3.93798828125, -3.6055908203125, -3.273193359375, -2.9407958984375, -2.6083984375, -2.2760009765625, -1.943603515625, -1.6112060546875, -1.27880859375, -0.9464111328125, -0.614013671875, -0.2816162109375, 0.05078125, 0.3831787109375, 0.715576171875, 1.0479736328125, 1.38037109375, 1.7127685546875, 2.045166015625, 2.3775634765625, 2.7099609375, 3.0423583984375, 3.374755859375, 3.7071533203125, 4.03955078125, 4.3719482421875, 4.704345703125, 5.0367431640625, 5.369140625, 5.7015380859375, 6.033935546875, 6.3663330078125, 6.69873046875, 7.0311279296875, 7.363525390625, 7.6959228515625, 8.0283203125, 8.3607177734375, 8.693115234375, 9.0255126953125, 9.35791015625, 9.6903076171875, 10.022705078125, 10.3551025390625, 10.6875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 11.0, 17.0, 30.0, 39.0, 75.0, 109.0, 188.0, 303.0, 535.0, 796.0, 1383.0, 2240.0, 3856.0, 6289.0, 10275.0, 16512.0, 25495.0, 38505.0, 55157.0, 74390.0, 94478.0, 110990.0, 118289.0, 114675.0, 102013.0, 82996.0, 62486.0, 44673.0, 30098.0, 19810.0, 12464.0, 7602.0, 4659.0, 2841.0, 1697.0, 1048.0, 598.0, 344.0, 206.0, 137.0, 68.0, 62.0, 52.0, 23.0, 13.0, 10.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.6026611328125, -5.392822265625, -5.1829833984375, -4.97314453125, -4.7633056640625, -4.553466796875, -4.3436279296875, -4.1337890625, -3.9239501953125, -3.714111328125, -3.5042724609375, -3.29443359375, -3.0845947265625, -2.874755859375, -2.6649169921875, -2.455078125, -2.2452392578125, -2.035400390625, -1.8255615234375, -1.61572265625, -1.4058837890625, -1.196044921875, -0.9862060546875, -0.7763671875, -0.5665283203125, -0.356689453125, -0.1468505859375, 0.06298828125, 0.2728271484375, 0.482666015625, 0.6925048828125, 0.90234375, 1.1121826171875, 1.322021484375, 1.5318603515625, 1.74169921875, 1.9515380859375, 2.161376953125, 2.3712158203125, 2.5810546875, 2.7908935546875, 3.000732421875, 3.2105712890625, 3.42041015625, 3.6302490234375, 3.840087890625, 4.0499267578125, 4.259765625, 4.4696044921875, 4.679443359375, 4.8892822265625, 5.09912109375, 5.3089599609375, 5.518798828125, 5.7286376953125, 5.9384765625, 6.1483154296875, 6.358154296875, 6.5679931640625, 6.77783203125, 6.9876708984375, 7.197509765625, 7.4073486328125, 7.6171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 9.0, 9.0, 12.0, 7.0, 14.0, 23.0, 19.0, 29.0, 37.0, 33.0, 32.0, 36.0, 35.0, 35.0, 28.0, 38.0, 46.0, 46.0, 48.0, 46.0, 30.0, 47.0, 35.0, 40.0, 33.0, 37.0, 27.0, 32.0, 24.0, 13.0, 11.0, 13.0, 16.0, 10.0, 11.0, 6.0, 4.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.40264892578125, -7.1881103515625, -6.97357177734375, -6.759033203125, -6.54449462890625, -6.3299560546875, -6.11541748046875, -5.90087890625, -5.68634033203125, -5.4718017578125, -5.25726318359375, -5.042724609375, -4.82818603515625, -4.6136474609375, -4.39910888671875, -4.1845703125, -3.97003173828125, -3.7554931640625, -3.54095458984375, -3.326416015625, -3.11187744140625, -2.8973388671875, -2.68280029296875, -2.46826171875, -2.25372314453125, -2.0391845703125, -1.82464599609375, -1.610107421875, -1.39556884765625, -1.1810302734375, -0.96649169921875, -0.751953125, -0.53741455078125, -0.3228759765625, -0.10833740234375, 0.106201171875, 0.32073974609375, 0.5352783203125, 0.74981689453125, 0.96435546875, 1.17889404296875, 1.3934326171875, 1.60797119140625, 1.822509765625, 2.03704833984375, 2.2515869140625, 2.46612548828125, 2.6806640625, 2.89520263671875, 3.1097412109375, 3.32427978515625, 3.538818359375, 3.75335693359375, 3.9678955078125, 4.18243408203125, 4.39697265625, 4.61151123046875, 4.8260498046875, 5.04058837890625, 5.255126953125, 5.46966552734375, 5.6842041015625, 5.89874267578125, 6.11328125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 3.0, 17.0, 24.0, 36.0, 67.0, 102.0, 139.0, 214.0, 325.0, 498.0, 868.0, 1301.0, 1948.0, 3373.0, 4983.0, 8133.0, 12419.0, 18624.0, 27608.0, 39967.0, 55261.0, 72255.0, 90085.0, 103889.0, 109792.0, 107768.0, 97398.0, 81238.0, 63943.0, 47113.0, 33433.0, 22795.0, 15234.0, 9994.0, 6393.0, 4078.0, 2647.0, 1656.0, 1082.0, 662.0, 409.0, 271.0, 177.0, 119.0, 68.0, 51.0, 34.0, 24.0, 17.0, 6.0, 0.0, 6.0, 0.0, 2.0], "bins": [-1.9423828125, -1.8864898681640625, -1.830596923828125, -1.7747039794921875, -1.71881103515625, -1.6629180908203125, -1.607025146484375, -1.5511322021484375, -1.4952392578125, -1.4393463134765625, -1.383453369140625, -1.3275604248046875, -1.27166748046875, -1.2157745361328125, -1.159881591796875, -1.1039886474609375, -1.048095703125, -0.9922027587890625, -0.936309814453125, -0.8804168701171875, -0.82452392578125, -0.7686309814453125, -0.712738037109375, -0.6568450927734375, -0.6009521484375, -0.5450592041015625, -0.489166259765625, -0.4332733154296875, -0.37738037109375, -0.3214874267578125, -0.265594482421875, -0.2097015380859375, -0.15380859375, -0.0979156494140625, -0.042022705078125, 0.0138702392578125, 0.06976318359375, 0.1256561279296875, 0.181549072265625, 0.2374420166015625, 0.2933349609375, 0.3492279052734375, 0.405120849609375, 0.4610137939453125, 0.51690673828125, 0.5727996826171875, 0.628692626953125, 0.6845855712890625, 0.740478515625, 0.7963714599609375, 0.852264404296875, 0.9081573486328125, 0.96405029296875, 1.0199432373046875, 1.075836181640625, 1.1317291259765625, 1.1876220703125, 1.2435150146484375, 1.299407958984375, 1.3553009033203125, 1.41119384765625, 1.4670867919921875, 1.522979736328125, 1.5788726806640625, 1.634765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 4.0, 6.0, 4.0, 10.0, 10.0, 21.0, 23.0, 22.0, 29.0, 35.0, 24.0, 33.0, 32.0, 34.0, 54.0, 55.0, 65.0, 46.0, 42.0, 43.0, 41.0, 39.0, 41.0, 36.0, 23.0, 25.0, 28.0, 30.0, 24.0, 24.0, 14.0, 20.0, 11.0, 7.0, 8.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00021910667419433594, -0.00021253898739814758, -0.00020597130060195923, -0.00019940361380577087, -0.00019283592700958252, -0.00018626824021339417, -0.0001797005534172058, -0.00017313286662101746, -0.0001665651798248291, -0.00015999749302864075, -0.0001534298062324524, -0.00014686211943626404, -0.00014029443264007568, -0.00013372674584388733, -0.00012715905904769897, -0.00012059137225151062, -0.00011402368545532227, -0.00010745599865913391, -0.00010088831186294556, -9.43206250667572e-05, -8.775293827056885e-05, -8.118525147438049e-05, -7.461756467819214e-05, -6.804987788200378e-05, -6.148219108581543e-05, -5.4914504289627075e-05, -4.834681749343872e-05, -4.1779130697250366e-05, -3.521144390106201e-05, -2.8643757104873657e-05, -2.2076070308685303e-05, -1.5508383512496948e-05, -8.940696716308594e-06, -2.3730099201202393e-06, 4.194676876068115e-06, 1.076236367225647e-05, 1.7330050468444824e-05, 2.389773726463318e-05, 3.0465424060821533e-05, 3.703311085700989e-05, 4.360079765319824e-05, 5.01684844493866e-05, 5.673617124557495e-05, 6.33038580417633e-05, 6.987154483795166e-05, 7.643923163414001e-05, 8.300691843032837e-05, 8.957460522651672e-05, 9.614229202270508e-05, 0.00010270997881889343, 0.00010927766561508179, 0.00011584535241127014, 0.0001224130392074585, 0.00012898072600364685, 0.0001355484127998352, 0.00014211609959602356, 0.00014868378639221191, 0.00015525147318840027, 0.00016181915998458862, 0.00016838684678077698, 0.00017495453357696533, 0.0001815222203731537, 0.00018808990716934204, 0.0001946575939655304, 0.00020122528076171875]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 11.0, 20.0, 14.0, 40.0, 39.0, 64.0, 106.0, 129.0, 202.0, 261.0, 398.0, 620.0, 1001.0, 1544.0, 2361.0, 3913.0, 6424.0, 10401.0, 16517.0, 25655.0, 39858.0, 59290.0, 82236.0, 104602.0, 121661.0, 127297.0, 118468.0, 99162.0, 75620.0, 53632.0, 35834.0, 22714.0, 14623.0, 8850.0, 5396.0, 3473.0, 2116.0, 1385.0, 885.0, 577.0, 369.0, 215.0, 176.0, 118.0, 80.0, 68.0, 46.0, 34.0, 14.0, 11.0, 8.0, 6.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.1640625, -2.095062255859375, -2.02606201171875, -1.957061767578125, -1.8880615234375, -1.819061279296875, -1.75006103515625, -1.681060791015625, -1.612060546875, -1.543060302734375, -1.47406005859375, -1.405059814453125, -1.3360595703125, -1.267059326171875, -1.19805908203125, -1.129058837890625, -1.06005859375, -0.991058349609375, -0.92205810546875, -0.853057861328125, -0.7840576171875, -0.715057373046875, -0.64605712890625, -0.577056884765625, -0.508056640625, -0.439056396484375, -0.37005615234375, -0.301055908203125, -0.2320556640625, -0.163055419921875, -0.09405517578125, -0.025054931640625, 0.0439453125, 0.112945556640625, 0.18194580078125, 0.250946044921875, 0.3199462890625, 0.388946533203125, 0.45794677734375, 0.526947021484375, 0.595947265625, 0.664947509765625, 0.73394775390625, 0.802947998046875, 0.8719482421875, 0.940948486328125, 1.00994873046875, 1.078948974609375, 1.14794921875, 1.216949462890625, 1.28594970703125, 1.354949951171875, 1.4239501953125, 1.492950439453125, 1.56195068359375, 1.630950927734375, 1.699951171875, 1.768951416015625, 1.83795166015625, 1.906951904296875, 1.9759521484375, 2.044952392578125, 2.11395263671875, 2.182952880859375, 2.251953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 11.0, 8.0, 13.0, 15.0, 16.0, 15.0, 17.0, 32.0, 31.0, 26.0, 32.0, 42.0, 40.0, 54.0, 53.0, 54.0, 49.0, 47.0, 55.0, 42.0, 37.0, 44.0, 45.0, 30.0, 37.0, 28.0, 20.0, 20.0, 15.0, 15.0, 6.0, 5.0, 5.0, 6.0, 7.0, 6.0, 4.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9697265625, -0.9353790283203125, -0.901031494140625, -0.8666839599609375, -0.83233642578125, -0.7979888916015625, -0.763641357421875, -0.7292938232421875, -0.6949462890625, -0.6605987548828125, -0.626251220703125, -0.5919036865234375, -0.55755615234375, -0.5232086181640625, -0.488861083984375, -0.4545135498046875, -0.420166015625, -0.3858184814453125, -0.351470947265625, -0.3171234130859375, -0.28277587890625, -0.2484283447265625, -0.214080810546875, -0.1797332763671875, -0.1453857421875, -0.1110382080078125, -0.076690673828125, -0.0423431396484375, -0.00799560546875, 0.0263519287109375, 0.060699462890625, 0.0950469970703125, 0.12939453125, 0.1637420654296875, 0.198089599609375, 0.2324371337890625, 0.26678466796875, 0.3011322021484375, 0.335479736328125, 0.3698272705078125, 0.4041748046875, 0.4385223388671875, 0.472869873046875, 0.5072174072265625, 0.54156494140625, 0.5759124755859375, 0.610260009765625, 0.6446075439453125, 0.678955078125, 0.7133026123046875, 0.747650146484375, 0.7819976806640625, 0.81634521484375, 0.8506927490234375, 0.885040283203125, 0.9193878173828125, 0.9537353515625, 0.9880828857421875, 1.022430419921875, 1.0567779541015625, 1.09112548828125, 1.1254730224609375, 1.159820556640625, 1.1941680908203125, 1.228515625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 13.0, 15.0, 16.0, 21.0, 15.0, 33.0, 35.0, 35.0, 34.0, 53.0, 53.0, 40.0, 49.0, 66.0, 55.0, 57.0, 47.0, 54.0, 40.0, 46.0, 24.0, 30.0, 27.0, 28.0, 21.0, 15.0, 17.0, 9.0, 10.0, 1.0, 7.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.47191047668457, -8.161338806152344, -7.850767135620117, -7.540195465087891, -7.229623794555664, -6.9190521240234375, -6.608480930328369, -6.297909259796143, -5.987337589263916, -5.6767659187316895, -5.366194248199463, -5.055622577667236, -4.745051383972168, -4.434479713439941, -4.123908042907715, -3.8133363723754883, -3.5027647018432617, -3.192193031311035, -2.8816213607788086, -2.571049928665161, -2.2604782581329346, -1.949906587600708, -1.639335036277771, -1.328763484954834, -1.0181918144226074, -0.7076202034950256, -0.39704859256744385, -0.08647698163986206, 0.22409462928771973, 0.5346662998199463, 0.8452378511428833, 1.1558094024658203, 1.4663801193237305, 1.776951789855957, 2.0875234603881836, 2.398094892501831, 2.7086665630340576, 3.019238233566284, 3.3298096656799316, 3.640381336212158, 3.9509530067443848, 4.261524677276611, 4.572096347808838, 4.8826680183410645, 5.193239212036133, 5.503810882568359, 5.814382553100586, 6.1249542236328125, 6.435525894165039, 6.746097564697266, 7.056669235229492, 7.367240905761719, 7.677812576293945, 7.988384246826172, 8.298955917358398, 8.609527587890625, 8.920099258422852, 9.230670928955078, 9.541242599487305, 9.851814270019531, 10.162385940551758, 10.472957611083984, 10.783529281616211, 11.094100952148438, 11.404671669006348]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 6.0, 2.0, 11.0, 11.0, 18.0, 8.0, 6.0, 14.0, 15.0, 23.0, 18.0, 29.0, 22.0, 32.0, 35.0, 28.0, 40.0, 39.0, 46.0, 32.0, 44.0, 41.0, 31.0, 43.0, 44.0, 32.0, 35.0, 27.0, 37.0, 31.0, 29.0, 26.0, 23.0, 23.0, 13.0, 13.0, 15.0, 12.0, 7.0, 5.0, 8.0, 8.0, 4.0, 9.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.73109245300293, -11.3902587890625, -11.04942512512207, -10.70859146118164, -10.367757797241211, -10.026924133300781, -9.686090469360352, -9.345256805419922, -9.004423141479492, -8.663589477539062, -8.322755813598633, -7.981922149658203, -7.641088485717773, -7.300254821777344, -6.959421634674072, -6.618587970733643, -6.277754783630371, -5.936921119689941, -5.596087455749512, -5.255253791809082, -4.914420127868652, -4.573586463928223, -4.232753276824951, -3.8919196128845215, -3.551085948944092, -3.210252285003662, -2.8694186210632324, -2.528585195541382, -2.187751531600952, -1.8469178676605225, -1.5060844421386719, -1.1652507781982422, -0.8244161605834961, -0.4835825562477112, -0.14274895191192627, 0.19808459281921387, 0.5389182567596436, 0.8797519207000732, 1.2205853462219238, 1.5614190101623535, 1.9022526741027832, 2.243086338043213, 2.5839200019836426, 2.924753427505493, 3.265587091445923, 3.6064207553863525, 3.947254180908203, 4.288087844848633, 4.6289215087890625, 4.969755172729492, 5.310588836669922, 5.651422500610352, 5.992256164550781, 6.333089828491211, 6.673923015594482, 7.014756679534912, 7.355590343475342, 7.6964240074157715, 8.037257194519043, 8.378090858459473, 8.718924522399902, 9.059758186340332, 9.400591850280762, 9.741425514221191, 10.082259178161621]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 12.0, 9.0, 32.0, 49.0, 71.0, 111.0, 192.0, 269.0, 487.0, 801.0, 1333.0, 2221.0, 3564.0, 5595.0, 8893.0, 14141.0, 22349.0, 34586.0, 53152.0, 80582.0, 119277.0, 170475.0, 235644.0, 307338.0, 379695.0, 432747.0, 453619.0, 432735.0, 379720.0, 309481.0, 234914.0, 169653.0, 118473.0, 79410.0, 52082.0, 33939.0, 21570.0, 13419.0, 8381.0, 5283.0, 3160.0, 1968.0, 1162.0, 697.0, 413.0, 245.0, 136.0, 93.0, 44.0, 35.0, 13.0, 6.0, 10.0, 5.0, 0.0, 2.0], "bins": [-7.203125, -6.9942626953125, -6.785400390625, -6.5765380859375, -6.36767578125, -6.1588134765625, -5.949951171875, -5.7410888671875, -5.5322265625, -5.3233642578125, -5.114501953125, -4.9056396484375, -4.69677734375, -4.4879150390625, -4.279052734375, -4.0701904296875, -3.861328125, -3.6524658203125, -3.443603515625, -3.2347412109375, -3.02587890625, -2.8170166015625, -2.608154296875, -2.3992919921875, -2.1904296875, -1.9815673828125, -1.772705078125, -1.5638427734375, -1.35498046875, -1.1461181640625, -0.937255859375, -0.7283935546875, -0.51953125, -0.3106689453125, -0.101806640625, 0.1070556640625, 0.31591796875, 0.5247802734375, 0.733642578125, 0.9425048828125, 1.1513671875, 1.3602294921875, 1.569091796875, 1.7779541015625, 1.98681640625, 2.1956787109375, 2.404541015625, 2.6134033203125, 2.822265625, 3.0311279296875, 3.239990234375, 3.4488525390625, 3.65771484375, 3.8665771484375, 4.075439453125, 4.2843017578125, 4.4931640625, 4.7020263671875, 4.910888671875, 5.1197509765625, 5.32861328125, 5.5374755859375, 5.746337890625, 5.9552001953125, 6.1640625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 5.0, 8.0, 9.0, 7.0, 9.0, 9.0, 19.0, 13.0, 14.0, 22.0, 21.0, 30.0, 21.0, 27.0, 28.0, 28.0, 42.0, 39.0, 39.0, 38.0, 40.0, 35.0, 34.0, 39.0, 38.0, 49.0, 40.0, 27.0, 28.0, 29.0, 33.0, 32.0, 22.0, 23.0, 16.0, 14.0, 11.0, 12.0, 12.0, 6.0, 7.0, 5.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.6015625, -9.331787109375, -9.06201171875, -8.792236328125, -8.5224609375, -8.252685546875, -7.98291015625, -7.713134765625, -7.443359375, -7.173583984375, -6.90380859375, -6.634033203125, -6.3642578125, -6.094482421875, -5.82470703125, -5.554931640625, -5.28515625, -5.015380859375, -4.74560546875, -4.475830078125, -4.2060546875, -3.936279296875, -3.66650390625, -3.396728515625, -3.126953125, -2.857177734375, -2.58740234375, -2.317626953125, -2.0478515625, -1.778076171875, -1.50830078125, -1.238525390625, -0.96875, -0.698974609375, -0.42919921875, -0.159423828125, 0.1103515625, 0.380126953125, 0.64990234375, 0.919677734375, 1.189453125, 1.459228515625, 1.72900390625, 1.998779296875, 2.2685546875, 2.538330078125, 2.80810546875, 3.077880859375, 3.34765625, 3.617431640625, 3.88720703125, 4.156982421875, 4.4267578125, 4.696533203125, 4.96630859375, 5.236083984375, 5.505859375, 5.775634765625, 6.04541015625, 6.315185546875, 6.5849609375, 6.854736328125, 7.12451171875, 7.394287109375, 7.6640625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 18.0, 33.0, 41.0, 98.0, 151.0, 243.0, 419.0, 697.0, 1158.0, 1882.0, 3172.0, 5087.0, 8243.0, 13542.0, 20906.0, 32352.0, 48748.0, 71619.0, 101999.0, 141702.0, 186911.0, 238700.0, 292142.0, 337486.0, 370351.0, 381721.0, 372896.0, 344465.0, 298734.0, 247039.0, 195798.0, 147464.0, 107043.0, 75208.0, 51501.0, 34716.0, 22558.0, 14193.0, 9003.0, 5562.0, 3486.0, 2047.0, 1265.0, 714.0, 469.0, 264.0, 205.0, 89.0, 64.0, 35.0, 19.0, 15.0, 7.0, 3.0, 1.0, 2.0, 1.0], "bins": [-6.08203125, -5.89532470703125, -5.7086181640625, -5.52191162109375, -5.335205078125, -5.14849853515625, -4.9617919921875, -4.77508544921875, -4.58837890625, -4.40167236328125, -4.2149658203125, -4.02825927734375, -3.841552734375, -3.65484619140625, -3.4681396484375, -3.28143310546875, -3.0947265625, -2.90802001953125, -2.7213134765625, -2.53460693359375, -2.347900390625, -2.16119384765625, -1.9744873046875, -1.78778076171875, -1.60107421875, -1.41436767578125, -1.2276611328125, -1.04095458984375, -0.854248046875, -0.66754150390625, -0.4808349609375, -0.29412841796875, -0.107421875, 0.07928466796875, 0.2659912109375, 0.45269775390625, 0.639404296875, 0.82611083984375, 1.0128173828125, 1.19952392578125, 1.38623046875, 1.57293701171875, 1.7596435546875, 1.94635009765625, 2.133056640625, 2.31976318359375, 2.5064697265625, 2.69317626953125, 2.8798828125, 3.06658935546875, 3.2532958984375, 3.44000244140625, 3.626708984375, 3.81341552734375, 4.0001220703125, 4.18682861328125, 4.37353515625, 4.56024169921875, 4.7469482421875, 4.93365478515625, 5.120361328125, 5.30706787109375, 5.4937744140625, 5.68048095703125, 5.8671875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 14.0, 23.0, 18.0, 21.0, 42.0, 45.0, 54.0, 71.0, 84.0, 85.0, 112.0, 140.0, 139.0, 169.0, 185.0, 165.0, 191.0, 220.0, 208.0, 209.0, 211.0, 230.0, 199.0, 177.0, 147.0, 150.0, 124.0, 111.0, 100.0, 86.0, 72.0, 50.0, 50.0, 42.0, 30.0, 20.0, 15.0, 13.0, 11.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9921875, -3.85943603515625, -3.7266845703125, -3.59393310546875, -3.461181640625, -3.32843017578125, -3.1956787109375, -3.06292724609375, -2.93017578125, -2.79742431640625, -2.6646728515625, -2.53192138671875, -2.399169921875, -2.26641845703125, -2.1336669921875, -2.00091552734375, -1.8681640625, -1.73541259765625, -1.6026611328125, -1.46990966796875, -1.337158203125, -1.20440673828125, -1.0716552734375, -0.93890380859375, -0.80615234375, -0.67340087890625, -0.5406494140625, -0.40789794921875, -0.275146484375, -0.14239501953125, -0.0096435546875, 0.12310791015625, 0.255859375, 0.38861083984375, 0.5213623046875, 0.65411376953125, 0.786865234375, 0.91961669921875, 1.0523681640625, 1.18511962890625, 1.31787109375, 1.45062255859375, 1.5833740234375, 1.71612548828125, 1.848876953125, 1.98162841796875, 2.1143798828125, 2.24713134765625, 2.3798828125, 2.51263427734375, 2.6453857421875, 2.77813720703125, 2.910888671875, 3.04364013671875, 3.1763916015625, 3.30914306640625, 3.44189453125, 3.57464599609375, 3.7073974609375, 3.84014892578125, 3.972900390625, 4.10565185546875, 4.2384033203125, 4.37115478515625, 4.50390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 5.0, 18.0, 20.0, 13.0, 24.0, 29.0, 30.0, 45.0, 53.0, 34.0, 50.0, 56.0, 62.0, 62.0, 54.0, 62.0, 52.0, 52.0, 47.0, 49.0, 46.0, 25.0, 26.0, 19.0, 15.0, 7.0, 13.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.685473442077637, -11.328505516052246, -10.971537590026855, -10.614570617675781, -10.25760269165039, -9.900634765625, -9.54366683959961, -9.186698913574219, -8.829730987548828, -8.472763061523438, -8.115795135498047, -7.7588276863098145, -7.401859760284424, -7.044892311096191, -6.687924385070801, -6.33095645904541, -5.973989009857178, -5.617021083831787, -5.260053634643555, -4.903085708618164, -4.546117782592773, -4.189149856567383, -3.8321824073791504, -3.4752144813537598, -3.1182467937469482, -2.7612791061401367, -2.404311180114746, -2.0473434925079346, -1.6903756856918335, -1.3334078788757324, -0.9764401912689209, -0.6194722652435303, -0.26250457763671875, 0.09446319937705994, 0.4514309763908386, 0.8083987236022949, 1.165366530418396, 1.522334337234497, 1.8793020248413086, 2.236269950866699, 2.5932376384735107, 2.9502053260803223, 3.307173252105713, 3.6641409397125244, 4.021108627319336, 4.378076553344727, 4.735044479370117, 5.092012405395508, 5.44897985458374, 5.805947780609131, 6.162915229797363, 6.519883155822754, 6.8768510818481445, 7.233819007873535, 7.590786457061768, 7.947754383087158, 8.30472183227539, 8.661689758300781, 9.018657684326172, 9.375625610351562, 9.732592582702637, 10.089560508728027, 10.446528434753418, 10.803496360778809, 11.1604642868042]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 8.0, 6.0, 8.0, 11.0, 9.0, 10.0, 9.0, 9.0, 16.0, 23.0, 23.0, 21.0, 31.0, 31.0, 28.0, 36.0, 37.0, 28.0, 40.0, 43.0, 42.0, 31.0, 31.0, 35.0, 37.0, 41.0, 33.0, 27.0, 40.0, 23.0, 33.0, 28.0, 21.0, 17.0, 28.0, 23.0, 11.0, 11.0, 10.0, 7.0, 9.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.560603141784668, -10.237327575683594, -9.914052963256836, -9.590777397155762, -9.267501831054688, -8.94422721862793, -8.620951652526855, -8.297676086425781, -7.974400997161865, -7.651125907897949, -7.327850341796875, -7.004575252532959, -6.681300163269043, -6.358024597167969, -6.034749507904053, -5.711474418640137, -5.3881988525390625, -5.0649237632751465, -4.741648197174072, -4.418373107910156, -4.095097541809082, -3.771822452545166, -3.44854736328125, -3.125272035598755, -2.8019967079162598, -2.4787213802337646, -2.1554460525512695, -1.8321709632873535, -1.5088956356048584, -1.1856203079223633, -0.8623450994491577, -0.5390698909759521, -0.21579456329345703, 0.10748070478439331, 0.43075597286224365, 0.754031240940094, 1.0773065090179443, 1.4005818367004395, 1.723857045173645, 2.0471322536468506, 2.3704075813293457, 2.693682909011841, 3.016958236694336, 3.340233325958252, 3.663508653640747, 3.986783981323242, 4.310059070587158, 4.633334159851074, 4.956609725952148, 5.2798848152160645, 5.603160381317139, 5.926435470581055, 6.249711036682129, 6.572986125946045, 6.896261215209961, 7.219536781311035, 7.542811870574951, 7.866086959838867, 8.189362525939941, 8.512638092041016, 8.835912704467773, 9.159188270568848, 9.482463836669922, 9.80573844909668, 10.129014015197754]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 10.0, 11.0, 26.0, 17.0, 43.0, 64.0, 69.0, 121.0, 186.0, 190.0, 343.0, 396.0, 558.0, 897.0, 1254.0, 1784.0, 2673.0, 3836.0, 5452.0, 8192.0, 12353.0, 18393.0, 28408.0, 44500.0, 70288.0, 112340.0, 170516.0, 189490.0, 136294.0, 85086.0, 53597.0, 34155.0, 22065.0, 14492.0, 9617.0, 6498.0, 4345.0, 3007.0, 2051.0, 1458.0, 1036.0, 715.0, 513.0, 350.0, 274.0, 190.0, 114.0, 97.0, 62.0, 48.0, 25.0, 25.0, 11.0, 11.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.7509765625, -1.6930084228515625, -1.635040283203125, -1.5770721435546875, -1.51910400390625, -1.4611358642578125, -1.403167724609375, -1.3451995849609375, -1.2872314453125, -1.2292633056640625, -1.171295166015625, -1.1133270263671875, -1.05535888671875, -0.9973907470703125, -0.939422607421875, -0.8814544677734375, -0.823486328125, -0.7655181884765625, -0.707550048828125, -0.6495819091796875, -0.59161376953125, -0.5336456298828125, -0.475677490234375, -0.4177093505859375, -0.3597412109375, -0.3017730712890625, -0.243804931640625, -0.1858367919921875, -0.12786865234375, -0.0699005126953125, -0.011932373046875, 0.0460357666015625, 0.10400390625, 0.1619720458984375, 0.219940185546875, 0.2779083251953125, 0.33587646484375, 0.3938446044921875, 0.451812744140625, 0.5097808837890625, 0.5677490234375, 0.6257171630859375, 0.683685302734375, 0.7416534423828125, 0.79962158203125, 0.8575897216796875, 0.915557861328125, 0.9735260009765625, 1.031494140625, 1.0894622802734375, 1.147430419921875, 1.2053985595703125, 1.26336669921875, 1.3213348388671875, 1.379302978515625, 1.4372711181640625, 1.4952392578125, 1.5532073974609375, 1.611175537109375, 1.6691436767578125, 1.72711181640625, 1.7850799560546875, 1.843048095703125, 1.9010162353515625, 1.958984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 9.0, 5.0, 5.0, 10.0, 10.0, 7.0, 17.0, 12.0, 12.0, 18.0, 22.0, 30.0, 20.0, 27.0, 28.0, 25.0, 37.0, 40.0, 33.0, 46.0, 38.0, 44.0, 31.0, 38.0, 36.0, 35.0, 32.0, 33.0, 35.0, 34.0, 25.0, 17.0, 30.0, 23.0, 26.0, 18.0, 17.0, 17.0, 10.0, 7.0, 5.0, 5.0, 5.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.6953125, -11.36181640625, -11.0283203125, -10.69482421875, -10.361328125, -10.02783203125, -9.6943359375, -9.36083984375, -9.02734375, -8.69384765625, -8.3603515625, -8.02685546875, -7.693359375, -7.35986328125, -7.0263671875, -6.69287109375, -6.359375, -6.02587890625, -5.6923828125, -5.35888671875, -5.025390625, -4.69189453125, -4.3583984375, -4.02490234375, -3.69140625, -3.35791015625, -3.0244140625, -2.69091796875, -2.357421875, -2.02392578125, -1.6904296875, -1.35693359375, -1.0234375, -0.68994140625, -0.3564453125, -0.02294921875, 0.310546875, 0.64404296875, 0.9775390625, 1.31103515625, 1.64453125, 1.97802734375, 2.3115234375, 2.64501953125, 2.978515625, 3.31201171875, 3.6455078125, 3.97900390625, 4.3125, 4.64599609375, 4.9794921875, 5.31298828125, 5.646484375, 5.97998046875, 6.3134765625, 6.64697265625, 6.98046875, 7.31396484375, 7.6474609375, 7.98095703125, 8.314453125, 8.64794921875, 8.9814453125, 9.31494140625, 9.6484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 4.0, 3.0, 12.0, 23.0, 16.0, 20.0, 33.0, 34.0, 43.0, 77.0, 77.0, 114.0, 183.0, 178.0, 285.0, 462.0, 655.0, 1038.0, 1844.0, 3529.0, 7450.0, 19468.0, 63248.0, 893792.0, 32821.0, 11659.0, 4986.0, 2370.0, 1392.0, 803.0, 575.0, 356.0, 271.0, 207.0, 140.0, 88.0, 74.0, 60.0, 46.0, 24.0, 21.0, 17.0, 17.0, 13.0, 10.0, 7.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9609375, -6.7381591796875, -6.515380859375, -6.2926025390625, -6.06982421875, -5.8470458984375, -5.624267578125, -5.4014892578125, -5.1787109375, -4.9559326171875, -4.733154296875, -4.5103759765625, -4.28759765625, -4.0648193359375, -3.842041015625, -3.6192626953125, -3.396484375, -3.1737060546875, -2.950927734375, -2.7281494140625, -2.50537109375, -2.2825927734375, -2.059814453125, -1.8370361328125, -1.6142578125, -1.3914794921875, -1.168701171875, -0.9459228515625, -0.72314453125, -0.5003662109375, -0.277587890625, -0.0548095703125, 0.16796875, 0.3907470703125, 0.613525390625, 0.8363037109375, 1.05908203125, 1.2818603515625, 1.504638671875, 1.7274169921875, 1.9501953125, 2.1729736328125, 2.395751953125, 2.6185302734375, 2.84130859375, 3.0640869140625, 3.286865234375, 3.5096435546875, 3.732421875, 3.9552001953125, 4.177978515625, 4.4007568359375, 4.62353515625, 4.8463134765625, 5.069091796875, 5.2918701171875, 5.5146484375, 5.7374267578125, 5.960205078125, 6.1829833984375, 6.40576171875, 6.6285400390625, 6.851318359375, 7.0740966796875, 7.296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 3.0, 6.0, 8.0, 8.0, 10.0, 12.0, 14.0, 12.0, 18.0, 22.0, 28.0, 23.0, 33.0, 36.0, 16.0, 33.0, 37.0, 40.0, 40.0, 59.0, 46.0, 36.0, 45.0, 42.0, 46.0, 35.0, 33.0, 32.0, 23.0, 19.0, 30.0, 32.0, 19.0, 14.0, 20.0, 8.0, 10.0, 11.0, 9.0, 10.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.3359375, -8.08807373046875, -7.8402099609375, -7.59234619140625, -7.344482421875, -7.09661865234375, -6.8487548828125, -6.60089111328125, -6.35302734375, -6.10516357421875, -5.8572998046875, -5.60943603515625, -5.361572265625, -5.11370849609375, -4.8658447265625, -4.61798095703125, -4.3701171875, -4.12225341796875, -3.8743896484375, -3.62652587890625, -3.378662109375, -3.13079833984375, -2.8829345703125, -2.63507080078125, -2.38720703125, -2.13934326171875, -1.8914794921875, -1.64361572265625, -1.395751953125, -1.14788818359375, -0.9000244140625, -0.65216064453125, -0.404296875, -0.15643310546875, 0.0914306640625, 0.33929443359375, 0.587158203125, 0.83502197265625, 1.0828857421875, 1.33074951171875, 1.57861328125, 1.82647705078125, 2.0743408203125, 2.32220458984375, 2.570068359375, 2.81793212890625, 3.0657958984375, 3.31365966796875, 3.5615234375, 3.80938720703125, 4.0572509765625, 4.30511474609375, 4.552978515625, 4.80084228515625, 5.0487060546875, 5.29656982421875, 5.54443359375, 5.79229736328125, 6.0401611328125, 6.28802490234375, 6.535888671875, 6.78375244140625, 7.0316162109375, 7.27947998046875, 7.52734375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 14.0, 14.0, 29.0, 27.0, 38.0, 44.0, 73.0, 93.0, 135.0, 158.0, 225.0, 361.0, 515.0, 801.0, 1436.0, 2643.0, 5721.0, 16061.0, 95832.0, 893592.0, 17606.0, 6179.0, 2750.0, 1501.0, 863.0, 532.0, 372.0, 252.0, 162.0, 133.0, 84.0, 71.0, 59.0, 40.0, 25.0, 26.0, 17.0, 15.0, 8.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.8076171875, -0.783172607421875, -0.75872802734375, -0.734283447265625, -0.7098388671875, -0.685394287109375, -0.66094970703125, -0.636505126953125, -0.612060546875, -0.587615966796875, -0.56317138671875, -0.538726806640625, -0.5142822265625, -0.489837646484375, -0.46539306640625, -0.440948486328125, -0.41650390625, -0.392059326171875, -0.36761474609375, -0.343170166015625, -0.3187255859375, -0.294281005859375, -0.26983642578125, -0.245391845703125, -0.220947265625, -0.196502685546875, -0.17205810546875, -0.147613525390625, -0.1231689453125, -0.098724365234375, -0.07427978515625, -0.049835205078125, -0.025390625, -0.000946044921875, 0.02349853515625, 0.047943115234375, 0.0723876953125, 0.096832275390625, 0.12127685546875, 0.145721435546875, 0.170166015625, 0.194610595703125, 0.21905517578125, 0.243499755859375, 0.2679443359375, 0.292388916015625, 0.31683349609375, 0.341278076171875, 0.36572265625, 0.390167236328125, 0.41461181640625, 0.439056396484375, 0.4635009765625, 0.487945556640625, 0.51239013671875, 0.536834716796875, 0.561279296875, 0.585723876953125, 0.61016845703125, 0.634613037109375, 0.6590576171875, 0.683502197265625, 0.70794677734375, 0.732391357421875, 0.7568359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 8.0, 6.0, 7.0, 5.0, 8.0, 18.0, 20.0, 13.0, 18.0, 24.0, 40.0, 24.0, 42.0, 27.0, 30.0, 48.0, 38.0, 50.0, 34.0, 32.0, 51.0, 36.0, 36.0, 31.0, 48.0, 39.0, 29.0, 29.0, 19.0, 30.0, 22.0, 16.0, 15.0, 17.0, 14.0, 9.0, 23.0, 5.0, 13.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.079673767089844e-06, -5.887821316719055e-06, -5.695968866348267e-06, -5.504116415977478e-06, -5.3122639656066895e-06, -5.120411515235901e-06, -4.928559064865112e-06, -4.736706614494324e-06, -4.544854164123535e-06, -4.353001713752747e-06, -4.161149263381958e-06, -3.9692968130111694e-06, -3.777444362640381e-06, -3.5855919122695923e-06, -3.3937394618988037e-06, -3.201887011528015e-06, -3.0100345611572266e-06, -2.818182110786438e-06, -2.6263296604156494e-06, -2.434477210044861e-06, -2.2426247596740723e-06, -2.0507723093032837e-06, -1.8589198589324951e-06, -1.6670674085617065e-06, -1.475214958190918e-06, -1.2833625078201294e-06, -1.0915100574493408e-06, -8.996576070785522e-07, -7.078051567077637e-07, -5.159527063369751e-07, -3.241002559661865e-07, -1.3224780559539795e-07, 5.960464477539063e-08, 2.514570951461792e-07, 4.4330954551696777e-07, 6.351619958877563e-07, 8.270144462585449e-07, 1.0188668966293335e-06, 1.210719347000122e-06, 1.4025717973709106e-06, 1.5944242477416992e-06, 1.7862766981124878e-06, 1.9781291484832764e-06, 2.169981598854065e-06, 2.3618340492248535e-06, 2.553686499595642e-06, 2.7455389499664307e-06, 2.9373914003372192e-06, 3.129243850708008e-06, 3.3210963010787964e-06, 3.512948751449585e-06, 3.7048012018203735e-06, 3.896653652191162e-06, 4.088506102561951e-06, 4.280358552932739e-06, 4.472211003303528e-06, 4.664063453674316e-06, 4.855915904045105e-06, 5.0477683544158936e-06, 5.239620804786682e-06, 5.431473255157471e-06, 5.623325705528259e-06, 5.815178155899048e-06, 6.0070306062698364e-06, 6.198883056640625e-06]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 6.0, 15.0, 16.0, 17.0, 18.0, 52.0, 72.0, 114.0, 164.0, 250.0, 458.0, 689.0, 1091.0, 1905.0, 3182.0, 5227.0, 9093.0, 16636.0, 30433.0, 60599.0, 134851.0, 371198.0, 228448.0, 88866.0, 42731.0, 22615.0, 12543.0, 7058.0, 3958.0, 2431.0, 1467.0, 895.0, 529.0, 322.0, 202.0, 141.0, 102.0, 63.0, 27.0, 33.0, 14.0, 13.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3123016357421875, -0.300628662109375, -0.2889556884765625, -0.27728271484375, -0.2656097412109375, -0.253936767578125, -0.2422637939453125, -0.2305908203125, -0.2189178466796875, -0.207244873046875, -0.1955718994140625, -0.18389892578125, -0.1722259521484375, -0.160552978515625, -0.1488800048828125, -0.13720703125, -0.1255340576171875, -0.113861083984375, -0.1021881103515625, -0.09051513671875, -0.0788421630859375, -0.067169189453125, -0.0554962158203125, -0.0438232421875, -0.0321502685546875, -0.020477294921875, -0.0088043212890625, 0.00286865234375, 0.0145416259765625, 0.026214599609375, 0.0378875732421875, 0.049560546875, 0.0612335205078125, 0.072906494140625, 0.0845794677734375, 0.09625244140625, 0.1079254150390625, 0.119598388671875, 0.1312713623046875, 0.1429443359375, 0.1546173095703125, 0.166290283203125, 0.1779632568359375, 0.18963623046875, 0.2013092041015625, 0.212982177734375, 0.2246551513671875, 0.236328125, 0.2480010986328125, 0.259674072265625, 0.2713470458984375, 0.28302001953125, 0.2946929931640625, 0.306365966796875, 0.3180389404296875, 0.3297119140625, 0.3413848876953125, 0.353057861328125, 0.3647308349609375, 0.37640380859375, 0.3880767822265625, 0.399749755859375, 0.4114227294921875, 0.423095703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 5.0, 7.0, 11.0, 12.0, 19.0, 14.0, 14.0, 23.0, 24.0, 15.0, 38.0, 47.0, 48.0, 50.0, 82.0, 88.0, 82.0, 61.0, 43.0, 43.0, 32.0, 34.0, 28.0, 29.0, 21.0, 29.0, 15.0, 19.0, 7.0, 10.0, 7.0, 6.0, 2.0, 4.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2196044921875, -0.2116832733154297, -0.20376205444335938, -0.19584083557128906, -0.18791961669921875, -0.17999839782714844, -0.17207717895507812, -0.1641559600830078, -0.1562347412109375, -0.1483135223388672, -0.14039230346679688, -0.13247108459472656, -0.12454986572265625, -0.11662864685058594, -0.10870742797851562, -0.10078620910644531, -0.092864990234375, -0.08494377136230469, -0.07702255249023438, -0.06910133361816406, -0.06118011474609375, -0.05325889587402344, -0.045337677001953125, -0.03741645812988281, -0.0294952392578125, -0.021574020385742188, -0.013652801513671875, -0.0057315826416015625, 0.00218963623046875, 0.010110855102539062, 0.018032073974609375, 0.025953292846679688, 0.03387451171875, 0.04179573059082031, 0.049716949462890625, 0.05763816833496094, 0.06555938720703125, 0.07348060607910156, 0.08140182495117188, 0.08932304382324219, 0.0972442626953125, 0.10516548156738281, 0.11308670043945312, 0.12100791931152344, 0.12892913818359375, 0.13685035705566406, 0.14477157592773438, 0.1526927947998047, 0.160614013671875, 0.1685352325439453, 0.17645645141601562, 0.18437767028808594, 0.19229888916015625, 0.20022010803222656, 0.20814132690429688, 0.2160625457763672, 0.2239837646484375, 0.2319049835205078, 0.23982620239257812, 0.24774742126464844, 0.25566864013671875, 0.26358985900878906, 0.2715110778808594, 0.2794322967529297, 0.287353515625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 5.0, 12.0, 23.0, 17.0, 19.0, 31.0, 27.0, 46.0, 51.0, 34.0, 55.0, 59.0, 57.0, 55.0, 55.0, 61.0, 48.0, 50.0, 48.0, 59.0, 44.0, 19.0, 33.0, 17.0, 12.0, 15.0, 12.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.601850509643555, -11.249249458312988, -10.896649360656738, -10.544048309326172, -10.191448211669922, -9.838847160339355, -9.486246109008789, -9.133646011352539, -8.781044960021973, -8.428443908691406, -8.075843811035156, -7.72324275970459, -7.370642185211182, -7.018041610717773, -6.665440559387207, -6.312839984893799, -5.960239410400391, -5.607638835906982, -5.255038261413574, -4.902437210083008, -4.5498366355896, -4.197236061096191, -3.844635248184204, -3.492034435272217, -3.1394338607788086, -2.7868332862854004, -2.434232473373413, -2.081631660461426, -1.7290310859680176, -1.3764303922653198, -1.023829698562622, -0.6712288856506348, -0.31862926483154297, 0.033971428871154785, 0.38657212257385254, 0.7391728162765503, 1.091773509979248, 1.4443742036819458, 1.7969748973846436, 2.149575710296631, 2.502176284790039, 2.8547768592834473, 3.2073776721954346, 3.559978485107422, 3.91257905960083, 4.265179634094238, 4.617780685424805, 4.970381259918213, 5.322981834411621, 5.675582408905029, 6.0281829833984375, 6.380784034729004, 6.733384609222412, 7.08598518371582, 7.438586235046387, 7.791186809539795, 8.143787384033203, 8.49638843536377, 8.84898853302002, 9.201589584350586, 9.554189682006836, 9.906790733337402, 10.259391784667969, 10.611991882324219, 10.964592933654785]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 1.0, 13.0, 6.0, 6.0, 13.0, 8.0, 11.0, 7.0, 10.0, 15.0, 23.0, 21.0, 24.0, 25.0, 29.0, 37.0, 33.0, 32.0, 34.0, 36.0, 46.0, 40.0, 32.0, 24.0, 45.0, 32.0, 41.0, 36.0, 28.0, 37.0, 25.0, 33.0, 30.0, 17.0, 23.0, 25.0, 21.0, 14.0, 9.0, 10.0, 8.0, 12.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.563755989074707, -10.241415977478027, -9.919075012207031, -9.596735000610352, -9.274394989013672, -8.952054977416992, -8.629714012145996, -8.307374000549316, -7.9850335121154785, -7.662693023681641, -7.340353012084961, -7.018012523651123, -6.695672035217285, -6.3733320236206055, -6.050991535186768, -5.72865104675293, -5.40631103515625, -5.083970546722412, -4.761630535125732, -4.4392900466918945, -4.116950035095215, -3.794609546661377, -3.472269058227539, -3.1499288082122803, -2.8275885581970215, -2.5052483081817627, -2.182908058166504, -1.860567569732666, -1.5382273197174072, -1.2158870697021484, -0.8935467004776001, -0.5712063312530518, -0.24886608123779297, 0.0734742283821106, 0.39581453800201416, 0.7181548476219177, 1.0404951572418213, 1.36283540725708, 1.6851757764816284, 2.0075161457061768, 2.3298563957214355, 2.6521966457366943, 2.974536895751953, 3.296877384185791, 3.61921763420105, 3.9415578842163086, 4.2638983726501465, 4.586238861083984, 4.908578872680664, 5.230919361114502, 5.553259372711182, 5.8755998611450195, 6.197939872741699, 6.520280361175537, 6.842620849609375, 7.164960861206055, 7.487301349639893, 7.8096418380737305, 8.13198184967041, 8.45432186126709, 8.776662826538086, 9.099002838134766, 9.421342849731445, 9.743683815002441, 10.066023826599121]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 8.0, 16.0, 34.0, 54.0, 69.0, 120.0, 220.0, 356.0, 553.0, 884.0, 1435.0, 2162.0, 3455.0, 5298.0, 8340.0, 12847.0, 18909.0, 27231.0, 38395.0, 51887.0, 67751.0, 82053.0, 95781.0, 102018.0, 102412.0, 95947.0, 83898.0, 68810.0, 53066.0, 39546.0, 28423.0, 19453.0, 13235.0, 8500.0, 5598.0, 3574.0, 2293.0, 1458.0, 972.0, 581.0, 375.0, 207.0, 136.0, 80.0, 54.0, 31.0, 13.0, 5.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0], "bins": [-5.98828125, -5.8123779296875, -5.636474609375, -5.4605712890625, -5.28466796875, -5.1087646484375, -4.932861328125, -4.7569580078125, -4.5810546875, -4.4051513671875, -4.229248046875, -4.0533447265625, -3.87744140625, -3.7015380859375, -3.525634765625, -3.3497314453125, -3.173828125, -2.9979248046875, -2.822021484375, -2.6461181640625, -2.47021484375, -2.2943115234375, -2.118408203125, -1.9425048828125, -1.7666015625, -1.5906982421875, -1.414794921875, -1.2388916015625, -1.06298828125, -0.8870849609375, -0.711181640625, -0.5352783203125, -0.359375, -0.1834716796875, -0.007568359375, 0.1683349609375, 0.34423828125, 0.5201416015625, 0.696044921875, 0.8719482421875, 1.0478515625, 1.2237548828125, 1.399658203125, 1.5755615234375, 1.75146484375, 1.9273681640625, 2.103271484375, 2.2791748046875, 2.455078125, 2.6309814453125, 2.806884765625, 2.9827880859375, 3.15869140625, 3.3345947265625, 3.510498046875, 3.6864013671875, 3.8623046875, 4.0382080078125, 4.214111328125, 4.3900146484375, 4.56591796875, 4.7418212890625, 4.917724609375, 5.0936279296875, 5.26953125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 3.0, 6.0, 7.0, 13.0, 5.0, 10.0, 13.0, 10.0, 14.0, 25.0, 33.0, 28.0, 40.0, 19.0, 29.0, 37.0, 43.0, 42.0, 39.0, 40.0, 45.0, 37.0, 29.0, 41.0, 40.0, 29.0, 30.0, 31.0, 36.0, 41.0, 28.0, 27.0, 15.0, 19.0, 17.0, 18.0, 5.0, 13.0, 10.0, 9.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-12.4375, -12.0906982421875, -11.743896484375, -11.3970947265625, -11.05029296875, -10.7034912109375, -10.356689453125, -10.0098876953125, -9.6630859375, -9.3162841796875, -8.969482421875, -8.6226806640625, -8.27587890625, -7.9290771484375, -7.582275390625, -7.2354736328125, -6.888671875, -6.5418701171875, -6.195068359375, -5.8482666015625, -5.50146484375, -5.1546630859375, -4.807861328125, -4.4610595703125, -4.1142578125, -3.7674560546875, -3.420654296875, -3.0738525390625, -2.72705078125, -2.3802490234375, -2.033447265625, -1.6866455078125, -1.33984375, -0.9930419921875, -0.646240234375, -0.2994384765625, 0.04736328125, 0.3941650390625, 0.740966796875, 1.0877685546875, 1.4345703125, 1.7813720703125, 2.128173828125, 2.4749755859375, 2.82177734375, 3.1685791015625, 3.515380859375, 3.8621826171875, 4.208984375, 4.5557861328125, 4.902587890625, 5.2493896484375, 5.59619140625, 5.9429931640625, 6.289794921875, 6.6365966796875, 6.9833984375, 7.3302001953125, 7.677001953125, 8.0238037109375, 8.37060546875, 8.7174072265625, 9.064208984375, 9.4110107421875, 9.7578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 11.0, 20.0, 35.0, 52.0, 99.0, 167.0, 239.0, 363.0, 585.0, 874.0, 1322.0, 2087.0, 3267.0, 4856.0, 7297.0, 10642.0, 15497.0, 22173.0, 30738.0, 42048.0, 54661.0, 68227.0, 81555.0, 92062.0, 96981.0, 95494.0, 89409.0, 78964.0, 64925.0, 51651.0, 38945.0, 29048.0, 20662.0, 14155.0, 9813.0, 6720.0, 4424.0, 2986.0, 1948.0, 1250.0, 831.0, 553.0, 325.0, 220.0, 140.0, 77.0, 60.0, 40.0, 28.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.55859375, -5.38958740234375, -5.2205810546875, -5.05157470703125, -4.882568359375, -4.71356201171875, -4.5445556640625, -4.37554931640625, -4.20654296875, -4.03753662109375, -3.8685302734375, -3.69952392578125, -3.530517578125, -3.36151123046875, -3.1925048828125, -3.02349853515625, -2.8544921875, -2.68548583984375, -2.5164794921875, -2.34747314453125, -2.178466796875, -2.00946044921875, -1.8404541015625, -1.67144775390625, -1.50244140625, -1.33343505859375, -1.1644287109375, -0.99542236328125, -0.826416015625, -0.65740966796875, -0.4884033203125, -0.31939697265625, -0.150390625, 0.01861572265625, 0.1876220703125, 0.35662841796875, 0.525634765625, 0.69464111328125, 0.8636474609375, 1.03265380859375, 1.20166015625, 1.37066650390625, 1.5396728515625, 1.70867919921875, 1.877685546875, 2.04669189453125, 2.2156982421875, 2.38470458984375, 2.5537109375, 2.72271728515625, 2.8917236328125, 3.06072998046875, 3.229736328125, 3.39874267578125, 3.5677490234375, 3.73675537109375, 3.90576171875, 4.07476806640625, 4.2437744140625, 4.41278076171875, 4.581787109375, 4.75079345703125, 4.9197998046875, 5.08880615234375, 5.2578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 5.0, 9.0, 11.0, 14.0, 23.0, 26.0, 18.0, 17.0, 21.0, 37.0, 21.0, 34.0, 29.0, 48.0, 51.0, 41.0, 53.0, 53.0, 40.0, 43.0, 44.0, 35.0, 27.0, 31.0, 19.0, 25.0, 31.0, 15.0, 36.0, 15.0, 14.0, 20.0, 17.0, 15.0, 9.0, 6.0, 3.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.984375, -6.7545166015625, -6.524658203125, -6.2947998046875, -6.06494140625, -5.8350830078125, -5.605224609375, -5.3753662109375, -5.1455078125, -4.9156494140625, -4.685791015625, -4.4559326171875, -4.22607421875, -3.9962158203125, -3.766357421875, -3.5364990234375, -3.306640625, -3.0767822265625, -2.846923828125, -2.6170654296875, -2.38720703125, -2.1573486328125, -1.927490234375, -1.6976318359375, -1.4677734375, -1.2379150390625, -1.008056640625, -0.7781982421875, -0.54833984375, -0.3184814453125, -0.088623046875, 0.1412353515625, 0.37109375, 0.6009521484375, 0.830810546875, 1.0606689453125, 1.29052734375, 1.5203857421875, 1.750244140625, 1.9801025390625, 2.2099609375, 2.4398193359375, 2.669677734375, 2.8995361328125, 3.12939453125, 3.3592529296875, 3.589111328125, 3.8189697265625, 4.048828125, 4.2786865234375, 4.508544921875, 4.7384033203125, 4.96826171875, 5.1981201171875, 5.427978515625, 5.6578369140625, 5.8876953125, 6.1175537109375, 6.347412109375, 6.5772705078125, 6.80712890625, 7.0369873046875, 7.266845703125, 7.4967041015625, 7.7265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 13.0, 23.0, 38.0, 51.0, 79.0, 142.0, 212.0, 370.0, 576.0, 908.0, 1378.0, 2215.0, 3656.0, 5616.0, 8640.0, 12951.0, 19116.0, 27739.0, 39278.0, 52429.0, 68071.0, 82778.0, 95002.0, 101407.0, 102313.0, 95045.0, 83459.0, 68155.0, 53403.0, 39198.0, 28282.0, 19255.0, 12992.0, 8523.0, 5551.0, 3527.0, 2213.0, 1442.0, 906.0, 594.0, 337.0, 256.0, 141.0, 90.0, 68.0, 46.0, 33.0, 13.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.650390625, -1.5988311767578125, -1.547271728515625, -1.4957122802734375, -1.44415283203125, -1.3925933837890625, -1.341033935546875, -1.2894744873046875, -1.2379150390625, -1.1863555908203125, -1.134796142578125, -1.0832366943359375, -1.03167724609375, -0.9801177978515625, -0.928558349609375, -0.8769989013671875, -0.825439453125, -0.7738800048828125, -0.722320556640625, -0.6707611083984375, -0.61920166015625, -0.5676422119140625, -0.516082763671875, -0.4645233154296875, -0.4129638671875, -0.3614044189453125, -0.309844970703125, -0.2582855224609375, -0.20672607421875, -0.1551666259765625, -0.103607177734375, -0.0520477294921875, -0.00048828125, 0.0510711669921875, 0.102630615234375, 0.1541900634765625, 0.20574951171875, 0.2573089599609375, 0.308868408203125, 0.3604278564453125, 0.4119873046875, 0.4635467529296875, 0.515106201171875, 0.5666656494140625, 0.61822509765625, 0.6697845458984375, 0.721343994140625, 0.7729034423828125, 0.824462890625, 0.8760223388671875, 0.927581787109375, 0.9791412353515625, 1.03070068359375, 1.0822601318359375, 1.133819580078125, 1.1853790283203125, 1.2369384765625, 1.2884979248046875, 1.340057373046875, 1.3916168212890625, 1.44317626953125, 1.4947357177734375, 1.546295166015625, 1.5978546142578125, 1.6494140625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 13.0, 16.0, 13.0, 25.0, 20.0, 13.0, 24.0, 21.0, 28.0, 40.0, 34.0, 48.0, 34.0, 50.0, 48.0, 49.0, 41.0, 43.0, 34.0, 50.0, 46.0, 40.0, 30.0, 37.0, 21.0, 31.0, 27.0, 22.0, 11.0, 17.0, 1.0, 16.0, 6.0, 7.0, 4.0, 6.0, 3.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00021326541900634766, -0.00020721927285194397, -0.00020117312669754028, -0.0001951269805431366, -0.0001890808343887329, -0.00018303468823432922, -0.00017698854207992554, -0.00017094239592552185, -0.00016489624977111816, -0.00015885010361671448, -0.0001528039574623108, -0.0001467578113079071, -0.00014071166515350342, -0.00013466551899909973, -0.00012861937284469604, -0.00012257322669029236, -0.00011652708053588867, -0.00011048093438148499, -0.0001044347882270813, -9.838864207267761e-05, -9.234249591827393e-05, -8.629634976387024e-05, -8.025020360946655e-05, -7.420405745506287e-05, -6.815791130065918e-05, -6.211176514625549e-05, -5.606561899185181e-05, -5.001947283744812e-05, -4.3973326683044434e-05, -3.792718052864075e-05, -3.188103437423706e-05, -2.5834888219833374e-05, -1.9788742065429688e-05, -1.3742595911026001e-05, -7.696449756622314e-06, -1.650303602218628e-06, 4.395842552185059e-06, 1.0441988706588745e-05, 1.648813486099243e-05, 2.2534281015396118e-05, 2.8580427169799805e-05, 3.462657332420349e-05, 4.067271947860718e-05, 4.6718865633010864e-05, 5.276501178741455e-05, 5.881115794181824e-05, 6.485730409622192e-05, 7.090345025062561e-05, 7.69495964050293e-05, 8.299574255943298e-05, 8.904188871383667e-05, 9.508803486824036e-05, 0.00010113418102264404, 0.00010718032717704773, 0.00011322647333145142, 0.0001192726194858551, 0.0001253187656402588, 0.00013136491179466248, 0.00013741105794906616, 0.00014345720410346985, 0.00014950335025787354, 0.00015554949641227722, 0.0001615956425666809, 0.0001676417887210846, 0.00017368793487548828]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 12.0, 21.0, 36.0, 41.0, 57.0, 83.0, 145.0, 202.0, 315.0, 527.0, 788.0, 1345.0, 2213.0, 3652.0, 5695.0, 9017.0, 14664.0, 22627.0, 34232.0, 49693.0, 67897.0, 87182.0, 104790.0, 113912.0, 114509.0, 105527.0, 89225.0, 69913.0, 50979.0, 35355.0, 23416.0, 14911.0, 9705.0, 6029.0, 3748.0, 2302.0, 1426.0, 860.0, 521.0, 345.0, 216.0, 150.0, 97.0, 59.0, 31.0, 24.0, 12.0, 11.0, 7.0, 8.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-2.025390625, -1.9640960693359375, -1.902801513671875, -1.8415069580078125, -1.78021240234375, -1.7189178466796875, -1.657623291015625, -1.5963287353515625, -1.5350341796875, -1.4737396240234375, -1.412445068359375, -1.3511505126953125, -1.28985595703125, -1.2285614013671875, -1.167266845703125, -1.1059722900390625, -1.044677734375, -0.9833831787109375, -0.922088623046875, -0.8607940673828125, -0.79949951171875, -0.7382049560546875, -0.676910400390625, -0.6156158447265625, -0.5543212890625, -0.4930267333984375, -0.431732177734375, -0.3704376220703125, -0.30914306640625, -0.2478485107421875, -0.186553955078125, -0.1252593994140625, -0.06396484375, -0.0026702880859375, 0.058624267578125, 0.1199188232421875, 0.18121337890625, 0.2425079345703125, 0.303802490234375, 0.3650970458984375, 0.4263916015625, 0.4876861572265625, 0.548980712890625, 0.6102752685546875, 0.67156982421875, 0.7328643798828125, 0.794158935546875, 0.8554534912109375, 0.916748046875, 0.9780426025390625, 1.039337158203125, 1.1006317138671875, 1.16192626953125, 1.2232208251953125, 1.284515380859375, 1.3458099365234375, 1.4071044921875, 1.4683990478515625, 1.529693603515625, 1.5909881591796875, 1.65228271484375, 1.7135772705078125, 1.774871826171875, 1.8361663818359375, 1.8974609375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 18.0, 11.0, 21.0, 18.0, 32.0, 29.0, 30.0, 36.0, 46.0, 39.0, 44.0, 63.0, 43.0, 54.0, 54.0, 43.0, 46.0, 47.0, 45.0, 38.0, 42.0, 31.0, 32.0, 22.0, 24.0, 16.0, 11.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 6.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.991119384765625, -0.95684814453125, -0.922576904296875, -0.8883056640625, -0.854034423828125, -0.81976318359375, -0.785491943359375, -0.751220703125, -0.716949462890625, -0.68267822265625, -0.648406982421875, -0.6141357421875, -0.579864501953125, -0.54559326171875, -0.511322021484375, -0.47705078125, -0.442779541015625, -0.40850830078125, -0.374237060546875, -0.3399658203125, -0.305694580078125, -0.27142333984375, -0.237152099609375, -0.202880859375, -0.168609619140625, -0.13433837890625, -0.100067138671875, -0.0657958984375, -0.031524658203125, 0.00274658203125, 0.037017822265625, 0.0712890625, 0.105560302734375, 0.13983154296875, 0.174102783203125, 0.2083740234375, 0.242645263671875, 0.27691650390625, 0.311187744140625, 0.345458984375, 0.379730224609375, 0.41400146484375, 0.448272705078125, 0.4825439453125, 0.516815185546875, 0.55108642578125, 0.585357666015625, 0.61962890625, 0.653900146484375, 0.68817138671875, 0.722442626953125, 0.7567138671875, 0.790985107421875, 0.82525634765625, 0.859527587890625, 0.893798828125, 0.928070068359375, 0.96234130859375, 0.996612548828125, 1.0308837890625, 1.065155029296875, 1.09942626953125, 1.133697509765625, 1.16796875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 13.0, 10.0, 13.0, 10.0, 14.0, 19.0, 19.0, 26.0, 27.0, 31.0, 47.0, 55.0, 45.0, 37.0, 55.0, 62.0, 57.0, 55.0, 56.0, 47.0, 54.0, 43.0, 45.0, 36.0, 32.0, 22.0, 13.0, 8.0, 13.0, 12.0, 10.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.836583137512207, -10.50124740600586, -10.165910720825195, -9.830574989318848, -9.495238304138184, -9.159902572631836, -8.824565887451172, -8.489230155944824, -8.153894424438477, -7.818558216094971, -7.483222007751465, -7.147886276245117, -6.812549591064453, -6.4772138595581055, -6.1418776512146, -5.806541442871094, -5.47120475769043, -5.135868549346924, -4.800532341003418, -4.46519660949707, -4.129859924316406, -3.7945239543914795, -3.4591879844665527, -3.123851776123047, -2.788515567779541, -2.453179359436035, -2.1178431510925293, -1.7825071811676025, -1.4471709728240967, -1.1118347644805908, -0.7764987945556641, -0.4411625862121582, -0.10582637786865234, 0.22950977087020874, 0.5648459196090698, 0.9001820087432861, 1.235518217086792, 1.5708544254302979, 1.9061903953552246, 2.2415266036987305, 2.5768628120422363, 2.912199020385742, 3.247535228729248, 3.582871198654175, 3.9182074069976807, 4.253543853759766, 4.588879585266113, 4.924215793609619, 5.259552001953125, 5.594888210296631, 5.930224418640137, 6.265560150146484, 6.600896835327148, 6.936232566833496, 7.271568775177002, 7.606904983520508, 7.942241191864014, 8.27757740020752, 8.612913131713867, 8.948249816894531, 9.283585548400879, 9.618922233581543, 9.95425796508789, 10.289594650268555, 10.624930381774902]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 4.0, 3.0, 6.0, 8.0, 8.0, 12.0, 10.0, 15.0, 15.0, 17.0, 17.0, 16.0, 20.0, 25.0, 34.0, 35.0, 27.0, 25.0, 40.0, 40.0, 34.0, 42.0, 31.0, 34.0, 24.0, 30.0, 33.0, 41.0, 25.0, 19.0, 30.0, 30.0, 27.0, 27.0, 27.0, 30.0, 19.0, 18.0, 14.0, 19.0, 11.0, 15.0, 8.0, 5.0, 6.0, 5.0, 1.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0], "bins": [-11.285165786743164, -10.957624435424805, -10.630083084106445, -10.30254077911377, -9.97499942779541, -9.64745807647705, -9.319916725158691, -8.992375373840332, -8.664833068847656, -8.337291717529297, -8.009750366210938, -7.68220853805542, -7.354666709899902, -7.027125358581543, -6.699584007263184, -6.372042655944824, -6.044501304626465, -5.7169599533081055, -5.389418125152588, -5.0618767738342285, -4.734334945678711, -4.406793594360352, -4.079252243041992, -3.7517106533050537, -3.4241690635681152, -3.0966274738311768, -2.7690858840942383, -2.441544532775879, -2.1140029430389404, -1.786461353302002, -1.458919882774353, -1.131378412246704, -0.8038358688354492, -0.4762943387031555, -0.14875280857086182, 0.17878872156143188, 0.5063302516937256, 0.8338718414306641, 1.161413311958313, 1.488954782485962, 1.8164963722229004, 2.144037961959839, 2.4715795516967773, 2.7991209030151367, 3.126662492752075, 3.4542040824890137, 3.781745433807373, 4.109287261962891, 4.43682861328125, 4.764369964599609, 5.091911792755127, 5.419453144073486, 5.746994972229004, 6.074536323547363, 6.402077674865723, 6.729619026184082, 7.0571608543396, 7.384702205657959, 7.712244033813477, 8.039785385131836, 8.367326736450195, 8.694868087768555, 9.02241039276123, 9.34995174407959, 9.67749309539795]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 12.0, 30.0, 35.0, 87.0, 116.0, 201.0, 324.0, 516.0, 975.0, 1409.0, 2283.0, 3787.0, 5990.0, 9538.0, 15094.0, 23623.0, 36233.0, 55780.0, 83404.0, 121507.0, 169662.0, 233606.0, 300270.0, 363913.0, 412387.0, 432197.0, 418948.0, 375198.0, 313347.0, 245855.0, 183052.0, 130134.0, 89511.0, 59988.0, 39010.0, 25138.0, 16033.0, 9867.0, 6075.0, 3708.0, 2193.0, 1343.0, 795.0, 433.0, 268.0, 170.0, 94.0, 54.0, 39.0, 23.0, 11.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.0546875, -6.838134765625, -6.62158203125, -6.405029296875, -6.1884765625, -5.971923828125, -5.75537109375, -5.538818359375, -5.322265625, -5.105712890625, -4.88916015625, -4.672607421875, -4.4560546875, -4.239501953125, -4.02294921875, -3.806396484375, -3.58984375, -3.373291015625, -3.15673828125, -2.940185546875, -2.7236328125, -2.507080078125, -2.29052734375, -2.073974609375, -1.857421875, -1.640869140625, -1.42431640625, -1.207763671875, -0.9912109375, -0.774658203125, -0.55810546875, -0.341552734375, -0.125, 0.091552734375, 0.30810546875, 0.524658203125, 0.7412109375, 0.957763671875, 1.17431640625, 1.390869140625, 1.607421875, 1.823974609375, 2.04052734375, 2.257080078125, 2.4736328125, 2.690185546875, 2.90673828125, 3.123291015625, 3.33984375, 3.556396484375, 3.77294921875, 3.989501953125, 4.2060546875, 4.422607421875, 4.63916015625, 4.855712890625, 5.072265625, 5.288818359375, 5.50537109375, 5.721923828125, 5.9384765625, 6.155029296875, 6.37158203125, 6.588134765625, 6.8046875]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 10.0, 5.0, 8.0, 6.0, 13.0, 8.0, 12.0, 8.0, 15.0, 12.0, 20.0, 23.0, 11.0, 30.0, 29.0, 34.0, 29.0, 40.0, 28.0, 32.0, 40.0, 34.0, 30.0, 33.0, 33.0, 21.0, 33.0, 28.0, 29.0, 37.0, 22.0, 19.0, 23.0, 39.0, 31.0, 17.0, 18.0, 14.0, 24.0, 12.0, 12.0, 17.0, 8.0, 9.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0], "bins": [-8.703125, -8.44866943359375, -8.1942138671875, -7.93975830078125, -7.685302734375, -7.43084716796875, -7.1763916015625, -6.92193603515625, -6.66748046875, -6.41302490234375, -6.1585693359375, -5.90411376953125, -5.649658203125, -5.39520263671875, -5.1407470703125, -4.88629150390625, -4.6318359375, -4.37738037109375, -4.1229248046875, -3.86846923828125, -3.614013671875, -3.35955810546875, -3.1051025390625, -2.85064697265625, -2.59619140625, -2.34173583984375, -2.0872802734375, -1.83282470703125, -1.578369140625, -1.32391357421875, -1.0694580078125, -0.81500244140625, -0.560546875, -0.30609130859375, -0.0516357421875, 0.20281982421875, 0.457275390625, 0.71173095703125, 0.9661865234375, 1.22064208984375, 1.47509765625, 1.72955322265625, 1.9840087890625, 2.23846435546875, 2.492919921875, 2.74737548828125, 3.0018310546875, 3.25628662109375, 3.5107421875, 3.76519775390625, 4.0196533203125, 4.27410888671875, 4.528564453125, 4.78302001953125, 5.0374755859375, 5.29193115234375, 5.54638671875, 5.80084228515625, 6.0552978515625, 6.30975341796875, 6.564208984375, 6.81866455078125, 7.0731201171875, 7.32757568359375, 7.58203125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 17.0, 20.0, 33.0, 55.0, 88.0, 165.0, 251.0, 436.0, 756.0, 1210.0, 2085.0, 3366.0, 5548.0, 9022.0, 14432.0, 22866.0, 35037.0, 52455.0, 77524.0, 110122.0, 151330.0, 200169.0, 253683.0, 304197.0, 348351.0, 375881.0, 382625.0, 369006.0, 334711.0, 287948.0, 235974.0, 184660.0, 135985.0, 98217.0, 68437.0, 45953.0, 30135.0, 19457.0, 12466.0, 7726.0, 4702.0, 2817.0, 1739.0, 1071.0, 619.0, 383.0, 218.0, 141.0, 84.0, 42.0, 35.0, 18.0, 11.0, 5.0, 5.0, 3.0, 2.0], "bins": [-6.78515625, -6.58160400390625, -6.3780517578125, -6.17449951171875, -5.970947265625, -5.76739501953125, -5.5638427734375, -5.36029052734375, -5.15673828125, -4.95318603515625, -4.7496337890625, -4.54608154296875, -4.342529296875, -4.13897705078125, -3.9354248046875, -3.73187255859375, -3.5283203125, -3.32476806640625, -3.1212158203125, -2.91766357421875, -2.714111328125, -2.51055908203125, -2.3070068359375, -2.10345458984375, -1.89990234375, -1.69635009765625, -1.4927978515625, -1.28924560546875, -1.085693359375, -0.88214111328125, -0.6785888671875, -0.47503662109375, -0.271484375, -0.06793212890625, 0.1356201171875, 0.33917236328125, 0.542724609375, 0.74627685546875, 0.9498291015625, 1.15338134765625, 1.35693359375, 1.56048583984375, 1.7640380859375, 1.96759033203125, 2.171142578125, 2.37469482421875, 2.5782470703125, 2.78179931640625, 2.9853515625, 3.18890380859375, 3.3924560546875, 3.59600830078125, 3.799560546875, 4.00311279296875, 4.2066650390625, 4.41021728515625, 4.61376953125, 4.81732177734375, 5.0208740234375, 5.22442626953125, 5.427978515625, 5.63153076171875, 5.8350830078125, 6.03863525390625, 6.2421875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 11.0, 8.0, 16.0, 17.0, 25.0, 26.0, 40.0, 43.0, 43.0, 57.0, 72.0, 96.0, 84.0, 119.0, 118.0, 132.0, 146.0, 170.0, 180.0, 181.0, 201.0, 179.0, 195.0, 190.0, 175.0, 165.0, 168.0, 150.0, 152.0, 138.0, 122.0, 85.0, 100.0, 89.0, 67.0, 55.0, 50.0, 35.0, 36.0, 27.0, 34.0, 10.0, 12.0, 8.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.982421875, -3.850921630859375, -3.71942138671875, -3.587921142578125, -3.4564208984375, -3.324920654296875, -3.19342041015625, -3.061920166015625, -2.930419921875, -2.798919677734375, -2.66741943359375, -2.535919189453125, -2.4044189453125, -2.272918701171875, -2.14141845703125, -2.009918212890625, -1.87841796875, -1.746917724609375, -1.61541748046875, -1.483917236328125, -1.3524169921875, -1.220916748046875, -1.08941650390625, -0.957916259765625, -0.826416015625, -0.694915771484375, -0.56341552734375, -0.431915283203125, -0.3004150390625, -0.168914794921875, -0.03741455078125, 0.094085693359375, 0.2255859375, 0.357086181640625, 0.48858642578125, 0.620086669921875, 0.7515869140625, 0.883087158203125, 1.01458740234375, 1.146087646484375, 1.277587890625, 1.409088134765625, 1.54058837890625, 1.672088623046875, 1.8035888671875, 1.935089111328125, 2.06658935546875, 2.198089599609375, 2.32958984375, 2.461090087890625, 2.59259033203125, 2.724090576171875, 2.8555908203125, 2.987091064453125, 3.11859130859375, 3.250091552734375, 3.381591796875, 3.513092041015625, 3.64459228515625, 3.776092529296875, 3.9075927734375, 4.039093017578125, 4.17059326171875, 4.302093505859375, 4.43359375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 9.0, 14.0, 10.0, 8.0, 6.0, 15.0, 20.0, 18.0, 23.0, 28.0, 36.0, 34.0, 28.0, 37.0, 44.0, 38.0, 40.0, 51.0, 37.0, 55.0, 44.0, 40.0, 36.0, 48.0, 34.0, 34.0, 31.0, 31.0, 26.0, 14.0, 20.0, 14.0, 16.0, 5.0, 9.0, 9.0, 8.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.548234939575195, -9.264052391052246, -8.979869842529297, -8.695687294006348, -8.411504745483398, -8.12732219696045, -7.8431396484375, -7.558957099914551, -7.274774551391602, -6.990592002868652, -6.706409454345703, -6.422226905822754, -6.138044357299805, -5.8538618087768555, -5.569679260253906, -5.285496711730957, -5.001314163208008, -4.717131614685059, -4.432949066162109, -4.14876651763916, -3.864583969116211, -3.5804014205932617, -3.2962188720703125, -3.0120363235473633, -2.727853775024414, -2.443671226501465, -2.1594886779785156, -1.8753061294555664, -1.5911235809326172, -1.306941032409668, -1.0227584838867188, -0.7385759353637695, -0.4543924331665039, -0.1702098846435547, 0.11397266387939453, 0.39815521240234375, 0.682337760925293, 0.9665203094482422, 1.2507028579711914, 1.5348854064941406, 1.8190679550170898, 2.103250503540039, 2.3874330520629883, 2.6716156005859375, 2.9557981491088867, 3.239980697631836, 3.524163246154785, 3.8083457946777344, 4.092528343200684, 4.376710891723633, 4.660893440246582, 4.945075988769531, 5.2292585372924805, 5.51344108581543, 5.797623634338379, 6.081806182861328, 6.365988731384277, 6.650171279907227, 6.934353828430176, 7.218536376953125, 7.502718925476074, 7.786901473999023, 8.071084022521973, 8.355266571044922, 8.639449119567871]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 4.0, 5.0, 8.0, 7.0, 6.0, 16.0, 9.0, 5.0, 19.0, 14.0, 23.0, 30.0, 25.0, 22.0, 26.0, 42.0, 34.0, 36.0, 39.0, 32.0, 44.0, 31.0, 29.0, 36.0, 49.0, 33.0, 38.0, 41.0, 37.0, 29.0, 26.0, 27.0, 23.0, 23.0, 24.0, 12.0, 14.0, 14.0, 19.0, 12.0, 9.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.095965385437012, -11.732452392578125, -11.368940353393555, -11.005427360534668, -10.641915321350098, -10.278402328491211, -9.91489028930664, -9.551377296447754, -9.187864303588867, -8.82435131072998, -8.46083927154541, -8.097326278686523, -7.733814239501953, -7.370301246643066, -7.006788730621338, -6.643276214599609, -6.279764175415039, -5.9162516593933105, -5.552739143371582, -5.189226150512695, -4.825714111328125, -4.462201118469238, -4.09868860244751, -3.7351760864257812, -3.3716635704040527, -3.008151054382324, -2.6446385383605957, -2.281125783920288, -1.9176132678985596, -1.554100751876831, -1.1905879974365234, -0.8270754814147949, -0.4635639190673828, -0.10005134344100952, 0.26346123218536377, 0.6269738674163818, 0.9904863834381104, 1.3539988994598389, 1.7175116539001465, 2.081024169921875, 2.4445366859436035, 2.808049201965332, 3.1715617179870605, 3.535074472427368, 3.8985869884490967, 4.262099266052246, 4.625612258911133, 4.989124774932861, 5.35263729095459, 5.716149806976318, 6.079662322998047, 6.443175315856934, 6.806687355041504, 7.170200347900391, 7.533712863922119, 7.897225379943848, 8.260738372802734, 8.624251365661621, 8.987763404846191, 9.351276397705078, 9.714788436889648, 10.078301429748535, 10.441814422607422, 10.805326461791992, 11.168838500976562]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 8.0, 14.0, 17.0, 22.0, 21.0, 43.0, 57.0, 84.0, 94.0, 141.0, 255.0, 357.0, 584.0, 825.0, 1180.0, 1899.0, 2936.0, 4680.0, 7678.0, 12524.0, 21022.0, 36031.0, 64738.0, 120012.0, 214321.0, 236839.0, 142042.0, 76270.0, 41644.0, 24061.0, 14477.0, 8614.0, 5317.0, 3422.0, 2126.0, 1381.0, 913.0, 626.0, 426.0, 269.0, 172.0, 113.0, 72.0, 72.0, 42.0, 35.0, 19.0, 16.0, 16.0, 12.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0], "bins": [-2.685546875, -2.6044921875, -2.5234375, -2.4423828125, -2.361328125, -2.2802734375, -2.19921875, -2.1181640625, -2.037109375, -1.9560546875, -1.875, -1.7939453125, -1.712890625, -1.6318359375, -1.55078125, -1.4697265625, -1.388671875, -1.3076171875, -1.2265625, -1.1455078125, -1.064453125, -0.9833984375, -0.90234375, -0.8212890625, -0.740234375, -0.6591796875, -0.578125, -0.4970703125, -0.416015625, -0.3349609375, -0.25390625, -0.1728515625, -0.091796875, -0.0107421875, 0.0703125, 0.1513671875, 0.232421875, 0.3134765625, 0.39453125, 0.4755859375, 0.556640625, 0.6376953125, 0.71875, 0.7998046875, 0.880859375, 0.9619140625, 1.04296875, 1.1240234375, 1.205078125, 1.2861328125, 1.3671875, 1.4482421875, 1.529296875, 1.6103515625, 1.69140625, 1.7724609375, 1.853515625, 1.9345703125, 2.015625, 2.0966796875, 2.177734375, 2.2587890625, 2.33984375, 2.4208984375, 2.501953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 6.0, 9.0, 11.0, 10.0, 22.0, 11.0, 21.0, 16.0, 18.0, 37.0, 30.0, 29.0, 37.0, 27.0, 30.0, 42.0, 40.0, 42.0, 32.0, 38.0, 41.0, 42.0, 41.0, 36.0, 30.0, 40.0, 31.0, 36.0, 25.0, 23.0, 17.0, 19.0, 13.0, 14.0, 15.0, 8.0, 15.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-13.84375, -13.459228515625, -13.07470703125, -12.690185546875, -12.3056640625, -11.921142578125, -11.53662109375, -11.152099609375, -10.767578125, -10.383056640625, -9.99853515625, -9.614013671875, -9.2294921875, -8.844970703125, -8.46044921875, -8.075927734375, -7.69140625, -7.306884765625, -6.92236328125, -6.537841796875, -6.1533203125, -5.768798828125, -5.38427734375, -4.999755859375, -4.615234375, -4.230712890625, -3.84619140625, -3.461669921875, -3.0771484375, -2.692626953125, -2.30810546875, -1.923583984375, -1.5390625, -1.154541015625, -0.77001953125, -0.385498046875, -0.0009765625, 0.383544921875, 0.76806640625, 1.152587890625, 1.537109375, 1.921630859375, 2.30615234375, 2.690673828125, 3.0751953125, 3.459716796875, 3.84423828125, 4.228759765625, 4.61328125, 4.997802734375, 5.38232421875, 5.766845703125, 6.1513671875, 6.535888671875, 6.92041015625, 7.304931640625, 7.689453125, 8.073974609375, 8.45849609375, 8.843017578125, 9.2275390625, 9.612060546875, 9.99658203125, 10.381103515625, 10.765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 11.0, 9.0, 11.0, 13.0, 17.0, 26.0, 32.0, 51.0, 59.0, 87.0, 113.0, 134.0, 217.0, 295.0, 404.0, 648.0, 980.0, 1672.0, 2968.0, 6504.0, 16754.0, 52231.0, 901537.0, 38520.0, 13063.0, 5333.0, 2633.0, 1415.0, 838.0, 552.0, 413.0, 274.0, 202.0, 126.0, 110.0, 79.0, 60.0, 46.0, 35.0, 17.0, 13.0, 15.0, 16.0, 15.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.890625, -7.63916015625, -7.3876953125, -7.13623046875, -6.884765625, -6.63330078125, -6.3818359375, -6.13037109375, -5.87890625, -5.62744140625, -5.3759765625, -5.12451171875, -4.873046875, -4.62158203125, -4.3701171875, -4.11865234375, -3.8671875, -3.61572265625, -3.3642578125, -3.11279296875, -2.861328125, -2.60986328125, -2.3583984375, -2.10693359375, -1.85546875, -1.60400390625, -1.3525390625, -1.10107421875, -0.849609375, -0.59814453125, -0.3466796875, -0.09521484375, 0.15625, 0.40771484375, 0.6591796875, 0.91064453125, 1.162109375, 1.41357421875, 1.6650390625, 1.91650390625, 2.16796875, 2.41943359375, 2.6708984375, 2.92236328125, 3.173828125, 3.42529296875, 3.6767578125, 3.92822265625, 4.1796875, 4.43115234375, 4.6826171875, 4.93408203125, 5.185546875, 5.43701171875, 5.6884765625, 5.93994140625, 6.19140625, 6.44287109375, 6.6943359375, 6.94580078125, 7.197265625, 7.44873046875, 7.7001953125, 7.95166015625, 8.203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 12.0, 8.0, 11.0, 13.0, 20.0, 22.0, 26.0, 30.0, 32.0, 36.0, 24.0, 30.0, 40.0, 44.0, 52.0, 44.0, 47.0, 41.0, 47.0, 42.0, 34.0, 42.0, 47.0, 45.0, 29.0, 27.0, 22.0, 21.0, 19.0, 16.0, 13.0, 15.0, 11.0, 8.0, 8.0, 7.0, 1.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.88916015625, -9.5908203125, -9.29248046875, -8.994140625, -8.69580078125, -8.3974609375, -8.09912109375, -7.80078125, -7.50244140625, -7.2041015625, -6.90576171875, -6.607421875, -6.30908203125, -6.0107421875, -5.71240234375, -5.4140625, -5.11572265625, -4.8173828125, -4.51904296875, -4.220703125, -3.92236328125, -3.6240234375, -3.32568359375, -3.02734375, -2.72900390625, -2.4306640625, -2.13232421875, -1.833984375, -1.53564453125, -1.2373046875, -0.93896484375, -0.640625, -0.34228515625, -0.0439453125, 0.25439453125, 0.552734375, 0.85107421875, 1.1494140625, 1.44775390625, 1.74609375, 2.04443359375, 2.3427734375, 2.64111328125, 2.939453125, 3.23779296875, 3.5361328125, 3.83447265625, 4.1328125, 4.43115234375, 4.7294921875, 5.02783203125, 5.326171875, 5.62451171875, 5.9228515625, 6.22119140625, 6.51953125, 6.81787109375, 7.1162109375, 7.41455078125, 7.712890625, 8.01123046875, 8.3095703125, 8.60791015625, 8.90625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 5.0, 12.0, 6.0, 7.0, 11.0, 20.0, 26.0, 42.0, 35.0, 67.0, 86.0, 95.0, 143.0, 169.0, 255.0, 394.0, 509.0, 766.0, 1299.0, 2395.0, 4703.0, 11239.0, 38949.0, 929781.0, 36174.0, 10648.0, 4555.0, 2230.0, 1239.0, 827.0, 540.0, 356.0, 256.0, 173.0, 139.0, 99.0, 72.0, 53.0, 47.0, 37.0, 19.0, 16.0, 22.0, 9.0, 9.0, 9.0, 1.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.56640625, -0.5489654541015625, -0.531524658203125, -0.5140838623046875, -0.49664306640625, -0.4792022705078125, -0.461761474609375, -0.4443206787109375, -0.4268798828125, -0.4094390869140625, -0.391998291015625, -0.3745574951171875, -0.35711669921875, -0.3396759033203125, -0.322235107421875, -0.3047943115234375, -0.287353515625, -0.2699127197265625, -0.252471923828125, -0.2350311279296875, -0.21759033203125, -0.2001495361328125, -0.182708740234375, -0.1652679443359375, -0.1478271484375, -0.1303863525390625, -0.112945556640625, -0.0955047607421875, -0.07806396484375, -0.0606231689453125, -0.043182373046875, -0.0257415771484375, -0.00830078125, 0.0091400146484375, 0.026580810546875, 0.0440216064453125, 0.06146240234375, 0.0789031982421875, 0.096343994140625, 0.1137847900390625, 0.1312255859375, 0.1486663818359375, 0.166107177734375, 0.1835479736328125, 0.20098876953125, 0.2184295654296875, 0.235870361328125, 0.2533111572265625, 0.270751953125, 0.2881927490234375, 0.305633544921875, 0.3230743408203125, 0.34051513671875, 0.3579559326171875, 0.375396728515625, 0.3928375244140625, 0.4102783203125, 0.4277191162109375, 0.445159912109375, 0.4626007080078125, 0.48004150390625, 0.4974822998046875, 0.514923095703125, 0.5323638916015625, 0.5498046875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 3.0, 3.0, 5.0, 8.0, 10.0, 12.0, 9.0, 11.0, 10.0, 23.0, 26.0, 27.0, 23.0, 32.0, 29.0, 38.0, 34.0, 40.0, 41.0, 55.0, 47.0, 45.0, 39.0, 37.0, 46.0, 36.0, 42.0, 37.0, 35.0, 25.0, 29.0, 18.0, 25.0, 18.0, 18.0, 11.0, 11.0, 9.0, 7.0, 9.0, 4.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.020069122314453e-06, -5.813315510749817e-06, -5.606561899185181e-06, -5.3998082876205444e-06, -5.193054676055908e-06, -4.986301064491272e-06, -4.779547452926636e-06, -4.5727938413619995e-06, -4.366040229797363e-06, -4.159286618232727e-06, -3.952533006668091e-06, -3.7457793951034546e-06, -3.5390257835388184e-06, -3.332272171974182e-06, -3.125518560409546e-06, -2.9187649488449097e-06, -2.7120113372802734e-06, -2.505257725715637e-06, -2.298504114151001e-06, -2.0917505025863647e-06, -1.8849968910217285e-06, -1.6782432794570923e-06, -1.471489667892456e-06, -1.2647360563278198e-06, -1.0579824447631836e-06, -8.512288331985474e-07, -6.444752216339111e-07, -4.377216100692749e-07, -2.3096799850463867e-07, -2.421438694000244e-08, 1.825392246246338e-07, 3.8929283618927e-07, 5.960464477539062e-07, 8.028000593185425e-07, 1.0095536708831787e-06, 1.216307282447815e-06, 1.4230608940124512e-06, 1.6298145055770874e-06, 1.8365681171417236e-06, 2.04332172870636e-06, 2.250075340270996e-06, 2.4568289518356323e-06, 2.6635825634002686e-06, 2.8703361749649048e-06, 3.077089786529541e-06, 3.2838433980941772e-06, 3.4905970096588135e-06, 3.6973506212234497e-06, 3.904104232788086e-06, 4.110857844352722e-06, 4.317611455917358e-06, 4.524365067481995e-06, 4.731118679046631e-06, 4.937872290611267e-06, 5.144625902175903e-06, 5.3513795137405396e-06, 5.558133125305176e-06, 5.764886736869812e-06, 5.971640348434448e-06, 6.1783939599990845e-06, 6.385147571563721e-06, 6.591901183128357e-06, 6.798654794692993e-06, 7.005408406257629e-06, 7.212162017822266e-06]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 12.0, 15.0, 26.0, 33.0, 48.0, 65.0, 125.0, 176.0, 259.0, 411.0, 596.0, 899.0, 1472.0, 2405.0, 3857.0, 6202.0, 9885.0, 16020.0, 26588.0, 45187.0, 81824.0, 170866.0, 322751.0, 166310.0, 80064.0, 44411.0, 26268.0, 15741.0, 9721.0, 6116.0, 3615.0, 2358.0, 1500.0, 960.0, 581.0, 408.0, 258.0, 177.0, 122.0, 71.0, 53.0, 28.0, 25.0, 12.0, 10.0, 13.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.278564453125, -0.269989013671875, -0.26141357421875, -0.252838134765625, -0.2442626953125, -0.235687255859375, -0.22711181640625, -0.218536376953125, -0.2099609375, -0.201385498046875, -0.19281005859375, -0.184234619140625, -0.1756591796875, -0.167083740234375, -0.15850830078125, -0.149932861328125, -0.141357421875, -0.132781982421875, -0.12420654296875, -0.115631103515625, -0.1070556640625, -0.098480224609375, -0.08990478515625, -0.081329345703125, -0.07275390625, -0.064178466796875, -0.05560302734375, -0.047027587890625, -0.0384521484375, -0.029876708984375, -0.02130126953125, -0.012725830078125, -0.004150390625, 0.004425048828125, 0.01300048828125, 0.021575927734375, 0.0301513671875, 0.038726806640625, 0.04730224609375, 0.055877685546875, 0.064453125, 0.073028564453125, 0.08160400390625, 0.090179443359375, 0.0987548828125, 0.107330322265625, 0.11590576171875, 0.124481201171875, 0.133056640625, 0.141632080078125, 0.15020751953125, 0.158782958984375, 0.1673583984375, 0.175933837890625, 0.18450927734375, 0.193084716796875, 0.20166015625, 0.210235595703125, 0.21881103515625, 0.227386474609375, 0.2359619140625, 0.244537353515625, 0.25311279296875, 0.261688232421875, 0.270263671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 13.0, 6.0, 14.0, 12.0, 15.0, 9.0, 26.0, 29.0, 27.0, 43.0, 70.0, 100.0, 220.0, 95.0, 72.0, 36.0, 32.0, 26.0, 21.0, 16.0, 16.0, 20.0, 11.0, 6.0, 10.0, 6.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.222412109375, -0.21557235717773438, -0.20873260498046875, -0.20189285278320312, -0.1950531005859375, -0.18821334838867188, -0.18137359619140625, -0.17453384399414062, -0.167694091796875, -0.16085433959960938, -0.15401458740234375, -0.14717483520507812, -0.1403350830078125, -0.13349533081054688, -0.12665557861328125, -0.11981582641601562, -0.11297607421875, -0.10613632202148438, -0.09929656982421875, -0.09245681762695312, -0.0856170654296875, -0.07877731323242188, -0.07193756103515625, -0.06509780883789062, -0.058258056640625, -0.051418304443359375, -0.04457855224609375, -0.037738800048828125, -0.0308990478515625, -0.024059295654296875, -0.01721954345703125, -0.010379791259765625, -0.0035400390625, 0.003299713134765625, 0.01013946533203125, 0.016979217529296875, 0.0238189697265625, 0.030658721923828125, 0.03749847412109375, 0.044338226318359375, 0.051177978515625, 0.058017730712890625, 0.06485748291015625, 0.07169723510742188, 0.0785369873046875, 0.08537673950195312, 0.09221649169921875, 0.09905624389648438, 0.10589599609375, 0.11273574829101562, 0.11957550048828125, 0.12641525268554688, 0.1332550048828125, 0.14009475708007812, 0.14693450927734375, 0.15377426147460938, 0.160614013671875, 0.16745376586914062, 0.17429351806640625, 0.18113327026367188, 0.1879730224609375, 0.19481277465820312, 0.20165252685546875, 0.20849227905273438, 0.21533203125]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 1.0, 8.0, 15.0, 12.0, 8.0, 2.0, 15.0, 22.0, 12.0, 21.0, 27.0, 41.0, 25.0, 34.0, 33.0, 38.0, 40.0, 38.0, 53.0, 41.0, 46.0, 48.0, 45.0, 39.0, 38.0, 37.0, 37.0, 40.0, 26.0, 29.0, 19.0, 15.0, 15.0, 17.0, 10.0, 10.0, 7.0, 8.0, 6.0, 4.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.347816467285156, -9.064899444580078, -8.781982421875, -8.499066352844238, -8.21614933013916, -7.933232307434082, -7.650315284729004, -7.367398738861084, -7.084482192993164, -6.801565170288086, -6.518648624420166, -6.235731601715088, -5.952815055847168, -5.66989803314209, -5.386981010437012, -5.104064464569092, -4.821147441864014, -4.5382304191589355, -4.255313873291016, -3.9723968505859375, -3.6894803047180176, -3.4065632820129395, -3.1236464977264404, -2.8407297134399414, -2.5578129291534424, -2.2748961448669434, -1.9919793605804443, -1.7090624570846558, -1.4261456727981567, -1.1432288885116577, -0.8603119850158691, -0.5773952007293701, -0.2944784164428711, -0.011561602354049683, 0.27135521173477173, 0.5542720556259155, 0.8371888399124146, 1.1201056241989136, 1.4030225276947021, 1.6859393119812012, 1.9688560962677002, 2.251772880554199, 2.5346896648406982, 2.8176064491271973, 3.1005234718322754, 3.3834400177001953, 3.6663570404052734, 3.9492738246917725, 4.2321906089782715, 4.51510763168335, 4.7980241775512695, 5.080941200256348, 5.363857746124268, 5.646774768829346, 5.929691314697266, 6.212608337402344, 6.495525360107422, 6.7784423828125, 7.06135892868042, 7.344275951385498, 7.627192497253418, 7.910109519958496, 8.193026542663574, 8.475942611694336, 8.758859634399414]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 6.0, 4.0, 9.0, 6.0, 7.0, 15.0, 9.0, 6.0, 20.0, 19.0, 24.0, 24.0, 24.0, 26.0, 28.0, 44.0, 30.0, 40.0, 35.0, 35.0, 43.0, 26.0, 33.0, 41.0, 43.0, 38.0, 31.0, 42.0, 42.0, 24.0, 28.0, 23.0, 28.0, 20.0, 23.0, 12.0, 12.0, 16.0, 17.0, 10.0, 10.0, 5.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.002235412597656, -11.638401985168457, -11.274567604064941, -10.910734176635742, -10.546900749206543, -10.183067321777344, -9.819232940673828, -9.455399513244629, -9.09156608581543, -8.72773265838623, -8.363898277282715, -8.000064849853516, -7.636231422424316, -7.272397518157959, -6.908563613891602, -6.544730186462402, -6.180895805358887, -5.817061901092529, -5.45322847366333, -5.089394569396973, -4.725561141967773, -4.361727237701416, -3.9978933334350586, -3.6340596675872803, -3.270226001739502, -2.9063923358917236, -2.5425586700439453, -2.178724765777588, -1.8148910999298096, -1.4510574340820312, -1.0872235298156738, -0.7233898639678955, -0.3595552444458008, 0.0042784810066223145, 0.3681122064590454, 0.7319459915161133, 1.0957796573638916, 1.45961332321167, 1.8234472274780273, 2.1872808933258057, 2.551114559173584, 2.9149482250213623, 3.2787818908691406, 3.642615795135498, 4.0064496994018555, 4.370283126831055, 4.734117031097412, 5.0979509353637695, 5.461784362792969, 5.825618267059326, 6.189451694488525, 6.553285598754883, 6.917119026184082, 7.2809529304504395, 7.644786834716797, 8.008620262145996, 8.372453689575195, 8.736287117004395, 9.10012149810791, 9.46395492553711, 9.827788352966309, 10.191621780395508, 10.555456161499023, 10.919289588928223, 11.283123970031738]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 9.0, 14.0, 25.0, 37.0, 37.0, 75.0, 140.0, 202.0, 336.0, 494.0, 855.0, 1308.0, 2115.0, 3344.0, 5088.0, 7862.0, 12356.0, 18194.0, 26767.0, 38296.0, 51154.0, 67356.0, 81915.0, 95243.0, 102354.0, 103207.0, 96817.0, 84893.0, 69606.0, 53748.0, 39805.0, 28334.0, 19574.0, 12992.0, 8763.0, 5652.0, 3525.0, 2346.0, 1400.0, 887.0, 538.0, 353.0, 187.0, 151.0, 86.0, 51.0, 29.0, 16.0, 12.0, 11.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-6.16796875, -5.98699951171875, -5.8060302734375, -5.62506103515625, -5.444091796875, -5.26312255859375, -5.0821533203125, -4.90118408203125, -4.72021484375, -4.53924560546875, -4.3582763671875, -4.17730712890625, -3.996337890625, -3.81536865234375, -3.6343994140625, -3.45343017578125, -3.2724609375, -3.09149169921875, -2.9105224609375, -2.72955322265625, -2.548583984375, -2.36761474609375, -2.1866455078125, -2.00567626953125, -1.82470703125, -1.64373779296875, -1.4627685546875, -1.28179931640625, -1.100830078125, -0.91986083984375, -0.7388916015625, -0.55792236328125, -0.376953125, -0.19598388671875, -0.0150146484375, 0.16595458984375, 0.346923828125, 0.52789306640625, 0.7088623046875, 0.88983154296875, 1.07080078125, 1.25177001953125, 1.4327392578125, 1.61370849609375, 1.794677734375, 1.97564697265625, 2.1566162109375, 2.33758544921875, 2.5185546875, 2.69952392578125, 2.8804931640625, 3.06146240234375, 3.242431640625, 3.42340087890625, 3.6043701171875, 3.78533935546875, 3.96630859375, 4.14727783203125, 4.3282470703125, 4.50921630859375, 4.690185546875, 4.87115478515625, 5.0521240234375, 5.23309326171875, 5.4140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 9.0, 5.0, 8.0, 7.0, 7.0, 10.0, 14.0, 12.0, 14.0, 10.0, 19.0, 24.0, 28.0, 24.0, 30.0, 28.0, 25.0, 32.0, 23.0, 33.0, 29.0, 39.0, 34.0, 37.0, 28.0, 36.0, 36.0, 34.0, 41.0, 34.0, 31.0, 27.0, 24.0, 25.0, 20.0, 21.0, 14.0, 20.0, 19.0, 9.0, 17.0, 7.0, 11.0, 11.0, 8.0, 2.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-11.5, -11.1644287109375, -10.828857421875, -10.4932861328125, -10.15771484375, -9.8221435546875, -9.486572265625, -9.1510009765625, -8.8154296875, -8.4798583984375, -8.144287109375, -7.8087158203125, -7.47314453125, -7.1375732421875, -6.802001953125, -6.4664306640625, -6.130859375, -5.7952880859375, -5.459716796875, -5.1241455078125, -4.78857421875, -4.4530029296875, -4.117431640625, -3.7818603515625, -3.4462890625, -3.1107177734375, -2.775146484375, -2.4395751953125, -2.10400390625, -1.7684326171875, -1.432861328125, -1.0972900390625, -0.76171875, -0.4261474609375, -0.090576171875, 0.2449951171875, 0.58056640625, 0.9161376953125, 1.251708984375, 1.5872802734375, 1.9228515625, 2.2584228515625, 2.593994140625, 2.9295654296875, 3.26513671875, 3.6007080078125, 3.936279296875, 4.2718505859375, 4.607421875, 4.9429931640625, 5.278564453125, 5.6141357421875, 5.94970703125, 6.2852783203125, 6.620849609375, 6.9564208984375, 7.2919921875, 7.6275634765625, 7.963134765625, 8.2987060546875, 8.63427734375, 8.9698486328125, 9.305419921875, 9.6409912109375, 9.9765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 10.0, 16.0, 20.0, 28.0, 37.0, 62.0, 125.0, 192.0, 263.0, 389.0, 610.0, 960.0, 1464.0, 2161.0, 3417.0, 5123.0, 7484.0, 11527.0, 17011.0, 24228.0, 33993.0, 46188.0, 61010.0, 74941.0, 88285.0, 96830.0, 99516.0, 96698.0, 87142.0, 74638.0, 60064.0, 46084.0, 33861.0, 24136.0, 16652.0, 11402.0, 7586.0, 4864.0, 3236.0, 2221.0, 1405.0, 925.0, 595.0, 423.0, 267.0, 167.0, 100.0, 73.0, 51.0, 26.0, 22.0, 17.0, 12.0, 6.0, 1.0, 2.0, 1.0], "bins": [-5.91015625, -5.733642578125, -5.55712890625, -5.380615234375, -5.2041015625, -5.027587890625, -4.85107421875, -4.674560546875, -4.498046875, -4.321533203125, -4.14501953125, -3.968505859375, -3.7919921875, -3.615478515625, -3.43896484375, -3.262451171875, -3.0859375, -2.909423828125, -2.73291015625, -2.556396484375, -2.3798828125, -2.203369140625, -2.02685546875, -1.850341796875, -1.673828125, -1.497314453125, -1.32080078125, -1.144287109375, -0.9677734375, -0.791259765625, -0.61474609375, -0.438232421875, -0.26171875, -0.085205078125, 0.09130859375, 0.267822265625, 0.4443359375, 0.620849609375, 0.79736328125, 0.973876953125, 1.150390625, 1.326904296875, 1.50341796875, 1.679931640625, 1.8564453125, 2.032958984375, 2.20947265625, 2.385986328125, 2.5625, 2.739013671875, 2.91552734375, 3.092041015625, 3.2685546875, 3.445068359375, 3.62158203125, 3.798095703125, 3.974609375, 4.151123046875, 4.32763671875, 4.504150390625, 4.6806640625, 4.857177734375, 5.03369140625, 5.210205078125, 5.38671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 12.0, 12.0, 14.0, 17.0, 13.0, 17.0, 28.0, 32.0, 30.0, 32.0, 24.0, 35.0, 34.0, 45.0, 39.0, 40.0, 43.0, 42.0, 36.0, 35.0, 33.0, 42.0, 27.0, 39.0, 19.0, 30.0, 31.0, 24.0, 20.0, 23.0, 20.0, 17.0, 13.0, 15.0, 9.0, 5.0, 8.0, 5.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.81494140625, -6.5673828125, -6.31982421875, -6.072265625, -5.82470703125, -5.5771484375, -5.32958984375, -5.08203125, -4.83447265625, -4.5869140625, -4.33935546875, -4.091796875, -3.84423828125, -3.5966796875, -3.34912109375, -3.1015625, -2.85400390625, -2.6064453125, -2.35888671875, -2.111328125, -1.86376953125, -1.6162109375, -1.36865234375, -1.12109375, -0.87353515625, -0.6259765625, -0.37841796875, -0.130859375, 0.11669921875, 0.3642578125, 0.61181640625, 0.859375, 1.10693359375, 1.3544921875, 1.60205078125, 1.849609375, 2.09716796875, 2.3447265625, 2.59228515625, 2.83984375, 3.08740234375, 3.3349609375, 3.58251953125, 3.830078125, 4.07763671875, 4.3251953125, 4.57275390625, 4.8203125, 5.06787109375, 5.3154296875, 5.56298828125, 5.810546875, 6.05810546875, 6.3056640625, 6.55322265625, 6.80078125, 7.04833984375, 7.2958984375, 7.54345703125, 7.791015625, 8.03857421875, 8.2861328125, 8.53369140625, 8.78125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 16.0, 26.0, 42.0, 64.0, 85.0, 181.0, 287.0, 414.0, 730.0, 1125.0, 1852.0, 3097.0, 5308.0, 8545.0, 14064.0, 22627.0, 34583.0, 51232.0, 71293.0, 91697.0, 109573.0, 119153.0, 118216.0, 106898.0, 87698.0, 67012.0, 47155.0, 32176.0, 20585.0, 12907.0, 7951.0, 4730.0, 2879.0, 1688.0, 1016.0, 636.0, 364.0, 233.0, 162.0, 101.0, 47.0, 40.0, 17.0, 24.0, 10.0, 7.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.9931640625, -1.9286651611328125, -1.864166259765625, -1.7996673583984375, -1.73516845703125, -1.6706695556640625, -1.606170654296875, -1.5416717529296875, -1.4771728515625, -1.4126739501953125, -1.348175048828125, -1.2836761474609375, -1.21917724609375, -1.1546783447265625, -1.090179443359375, -1.0256805419921875, -0.961181640625, -0.8966827392578125, -0.832183837890625, -0.7676849365234375, -0.70318603515625, -0.6386871337890625, -0.574188232421875, -0.5096893310546875, -0.4451904296875, -0.3806915283203125, -0.316192626953125, -0.2516937255859375, -0.18719482421875, -0.1226959228515625, -0.058197021484375, 0.0063018798828125, 0.07080078125, 0.1352996826171875, 0.199798583984375, 0.2642974853515625, 0.32879638671875, 0.3932952880859375, 0.457794189453125, 0.5222930908203125, 0.5867919921875, 0.6512908935546875, 0.715789794921875, 0.7802886962890625, 0.84478759765625, 0.9092864990234375, 0.973785400390625, 1.0382843017578125, 1.102783203125, 1.1672821044921875, 1.231781005859375, 1.2962799072265625, 1.36077880859375, 1.4252777099609375, 1.489776611328125, 1.5542755126953125, 1.6187744140625, 1.6832733154296875, 1.747772216796875, 1.8122711181640625, 1.87677001953125, 1.9412689208984375, 2.005767822265625, 2.0702667236328125, 2.134765625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 11.0, 8.0, 13.0, 13.0, 23.0, 17.0, 30.0, 31.0, 28.0, 35.0, 38.0, 24.0, 46.0, 36.0, 45.0, 56.0, 38.0, 51.0, 48.0, 49.0, 39.0, 33.0, 40.0, 37.0, 34.0, 33.0, 27.0, 15.0, 25.0, 14.0, 17.0, 7.0, 11.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0002510547637939453, -0.00024380162358283997, -0.00023654848337173462, -0.00022929534316062927, -0.00022204220294952393, -0.00021478906273841858, -0.00020753592252731323, -0.00020028278231620789, -0.00019302964210510254, -0.0001857765018939972, -0.00017852336168289185, -0.0001712702214717865, -0.00016401708126068115, -0.0001567639410495758, -0.00014951080083847046, -0.0001422576606273651, -0.00013500452041625977, -0.00012775138020515442, -0.00012049823999404907, -0.00011324509978294373, -0.00010599195957183838, -9.873881936073303e-05, -9.148567914962769e-05, -8.423253893852234e-05, -7.697939872741699e-05, -6.972625851631165e-05, -6.24731183052063e-05, -5.521997809410095e-05, -4.7966837882995605e-05, -4.071369767189026e-05, -3.346055746078491e-05, -2.6207417249679565e-05, -1.895427703857422e-05, -1.1701136827468872e-05, -4.447996616363525e-06, 2.8051435947418213e-06, 1.0058283805847168e-05, 1.7311424016952515e-05, 2.456456422805786e-05, 3.181770443916321e-05, 3.9070844650268555e-05, 4.63239848613739e-05, 5.357712507247925e-05, 6.0830265283584595e-05, 6.808340549468994e-05, 7.533654570579529e-05, 8.258968591690063e-05, 8.984282612800598e-05, 9.709596633911133e-05, 0.00010434910655021667, 0.00011160224676132202, 0.00011885538697242737, 0.00012610852718353271, 0.00013336166739463806, 0.0001406148076057434, 0.00014786794781684875, 0.0001551210880279541, 0.00016237422823905945, 0.0001696273684501648, 0.00017688050866127014, 0.0001841336488723755, 0.00019138678908348083, 0.00019863992929458618, 0.00020589306950569153, 0.00021314620971679688]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 6.0, 11.0, 8.0, 22.0, 21.0, 45.0, 81.0, 105.0, 174.0, 287.0, 486.0, 755.0, 1326.0, 2269.0, 4134.0, 7198.0, 12489.0, 22469.0, 38458.0, 62296.0, 92274.0, 122818.0, 144004.0, 146261.0, 126898.0, 98001.0, 66827.0, 41921.0, 24530.0, 14032.0, 7751.0, 4478.0, 2526.0, 1448.0, 848.0, 500.0, 319.0, 176.0, 112.0, 67.0, 41.0, 28.0, 18.0, 9.0, 11.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.3310546875, -2.248046875, -2.1650390625, -2.08203125, -1.9990234375, -1.916015625, -1.8330078125, -1.75, -1.6669921875, -1.583984375, -1.5009765625, -1.41796875, -1.3349609375, -1.251953125, -1.1689453125, -1.0859375, -1.0029296875, -0.919921875, -0.8369140625, -0.75390625, -0.6708984375, -0.587890625, -0.5048828125, -0.421875, -0.3388671875, -0.255859375, -0.1728515625, -0.08984375, -0.0068359375, 0.076171875, 0.1591796875, 0.2421875, 0.3251953125, 0.408203125, 0.4912109375, 0.57421875, 0.6572265625, 0.740234375, 0.8232421875, 0.90625, 0.9892578125, 1.072265625, 1.1552734375, 1.23828125, 1.3212890625, 1.404296875, 1.4873046875, 1.5703125, 1.6533203125, 1.736328125, 1.8193359375, 1.90234375, 1.9853515625, 2.068359375, 2.1513671875, 2.234375, 2.3173828125, 2.400390625, 2.4833984375, 2.56640625, 2.6494140625, 2.732421875, 2.8154296875, 2.8984375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 9.0, 10.0, 11.0, 14.0, 11.0, 15.0, 20.0, 17.0, 23.0, 28.0, 26.0, 43.0, 53.0, 38.0, 49.0, 53.0, 54.0, 67.0, 55.0, 56.0, 44.0, 43.0, 41.0, 40.0, 26.0, 29.0, 23.0, 20.0, 21.0, 14.0, 9.0, 6.0, 9.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.140625, -1.10284423828125, -1.0650634765625, -1.02728271484375, -0.989501953125, -0.95172119140625, -0.9139404296875, -0.87615966796875, -0.83837890625, -0.80059814453125, -0.7628173828125, -0.72503662109375, -0.687255859375, -0.64947509765625, -0.6116943359375, -0.57391357421875, -0.5361328125, -0.49835205078125, -0.4605712890625, -0.42279052734375, -0.385009765625, -0.34722900390625, -0.3094482421875, -0.27166748046875, -0.23388671875, -0.19610595703125, -0.1583251953125, -0.12054443359375, -0.082763671875, -0.04498291015625, -0.0072021484375, 0.03057861328125, 0.068359375, 0.10614013671875, 0.1439208984375, 0.18170166015625, 0.219482421875, 0.25726318359375, 0.2950439453125, 0.33282470703125, 0.37060546875, 0.40838623046875, 0.4461669921875, 0.48394775390625, 0.521728515625, 0.55950927734375, 0.5972900390625, 0.63507080078125, 0.6728515625, 0.71063232421875, 0.7484130859375, 0.78619384765625, 0.823974609375, 0.86175537109375, 0.8995361328125, 0.93731689453125, 0.97509765625, 1.01287841796875, 1.0506591796875, 1.08843994140625, 1.126220703125, 1.16400146484375, 1.2017822265625, 1.23956298828125, 1.27734375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 10.0, 8.0, 14.0, 9.0, 9.0, 15.0, 17.0, 15.0, 29.0, 31.0, 39.0, 40.0, 36.0, 41.0, 48.0, 40.0, 41.0, 62.0, 53.0, 48.0, 43.0, 38.0, 42.0, 30.0, 26.0, 29.0, 27.0, 30.0, 22.0, 25.0, 19.0, 14.0, 10.0, 6.0, 4.0, 9.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.04843807220459, -9.7426118850708, -9.436785697937012, -9.130959510803223, -8.825133323669434, -8.519307136535645, -8.213480949401855, -7.907654762268066, -7.601828575134277, -7.296002388000488, -6.990176200866699, -6.68435001373291, -6.378523826599121, -6.072697639465332, -5.766871452331543, -5.461045265197754, -5.155219078063965, -4.849392890930176, -4.543566703796387, -4.237740516662598, -3.9319143295288086, -3.6260881423950195, -3.3202619552612305, -3.0144357681274414, -2.7086095809936523, -2.4027833938598633, -2.096957206726074, -1.7911310195922852, -1.485304832458496, -1.179478645324707, -0.873652458190918, -0.5678262710571289, -0.26200008392333984, 0.04382610321044922, 0.3496522903442383, 0.6554784774780273, 0.9613046646118164, 1.2671308517456055, 1.5729570388793945, 1.8787832260131836, 2.1846094131469727, 2.4904356002807617, 2.796261787414551, 3.10208797454834, 3.407914161682129, 3.713740348815918, 4.019566535949707, 4.325392723083496, 4.631218910217285, 4.937045097351074, 5.242871284484863, 5.548697471618652, 5.854523658752441, 6.1603498458862305, 6.4661760330200195, 6.772002220153809, 7.077828407287598, 7.383654594421387, 7.689480781555176, 7.995306968688965, 8.301133155822754, 8.606959342956543, 8.912785530090332, 9.218611717224121, 9.52443790435791]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 4.0, 5.0, 6.0, 6.0, 5.0, 8.0, 12.0, 18.0, 13.0, 18.0, 17.0, 14.0, 23.0, 27.0, 17.0, 23.0, 22.0, 31.0, 33.0, 31.0, 29.0, 45.0, 31.0, 39.0, 31.0, 21.0, 36.0, 34.0, 37.0, 33.0, 29.0, 31.0, 35.0, 30.0, 21.0, 23.0, 26.0, 22.0, 17.0, 14.0, 11.0, 13.0, 7.0, 7.0, 11.0, 7.0, 4.0, 7.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.000290870666504, -10.64266586303711, -10.285040855407715, -9.92741584777832, -9.56978988647461, -9.212164878845215, -8.85453987121582, -8.496914863586426, -8.139289855957031, -7.781664848327637, -7.424039363861084, -7.0664143562316895, -6.708788871765137, -6.351163864135742, -5.993538856506348, -5.635913848876953, -5.278287887573242, -4.920662879943848, -4.563037395477295, -4.2054123878479, -3.8477871417999268, -3.490161895751953, -3.1325368881225586, -2.774911642074585, -2.4172863960266113, -2.0596611499786377, -1.7020360231399536, -1.3444108963012695, -0.9867856502532959, -0.6291604042053223, -0.27153539657592773, 0.0860898494720459, 0.4437141418457031, 0.801339328289032, 1.1589645147323608, 1.516589641571045, 1.8742148876190186, 2.231840133666992, 2.5894651412963867, 2.9470903873443604, 3.304715633392334, 3.6623408794403076, 4.019966125488281, 4.377591133117676, 4.73521614074707, 5.092841625213623, 5.450466632843018, 5.80809211730957, 6.165717124938965, 6.523342132568359, 6.880967617034912, 7.238592624664307, 7.596218109130859, 7.953843116760254, 8.311468124389648, 8.669093132019043, 9.026718139648438, 9.384343147277832, 9.741968154907227, 10.099594116210938, 10.457219123840332, 10.814844131469727, 11.172469139099121, 11.530094146728516, 11.887720108032227]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 7.0, 20.0, 31.0, 50.0, 93.0, 173.0, 224.0, 388.0, 612.0, 1022.0, 1676.0, 2827.0, 4520.0, 6984.0, 11146.0, 17672.0, 27112.0, 41269.0, 62278.0, 90230.0, 128382.0, 176532.0, 231658.0, 290754.0, 346089.0, 387984.0, 405011.0, 396340.0, 361814.0, 311317.0, 251018.0, 193575.0, 142783.0, 101961.0, 70579.0, 46542.0, 30951.0, 20145.0, 12581.0, 7822.0, 4790.0, 2958.0, 1826.0, 1075.0, 612.0, 382.0, 192.0, 108.0, 80.0, 45.0, 23.0, 11.0, 7.0, 4.0, 1.0, 0.0, 3.0], "bins": [-7.78125, -7.5501708984375, -7.319091796875, -7.0880126953125, -6.85693359375, -6.6258544921875, -6.394775390625, -6.1636962890625, -5.9326171875, -5.7015380859375, -5.470458984375, -5.2393798828125, -5.00830078125, -4.7772216796875, -4.546142578125, -4.3150634765625, -4.083984375, -3.8529052734375, -3.621826171875, -3.3907470703125, -3.15966796875, -2.9285888671875, -2.697509765625, -2.4664306640625, -2.2353515625, -2.0042724609375, -1.773193359375, -1.5421142578125, -1.31103515625, -1.0799560546875, -0.848876953125, -0.6177978515625, -0.38671875, -0.1556396484375, 0.075439453125, 0.3065185546875, 0.53759765625, 0.7686767578125, 0.999755859375, 1.2308349609375, 1.4619140625, 1.6929931640625, 1.924072265625, 2.1551513671875, 2.38623046875, 2.6173095703125, 2.848388671875, 3.0794677734375, 3.310546875, 3.5416259765625, 3.772705078125, 4.0037841796875, 4.23486328125, 4.4659423828125, 4.697021484375, 4.9281005859375, 5.1591796875, 5.3902587890625, 5.621337890625, 5.8524169921875, 6.08349609375, 6.3145751953125, 6.545654296875, 6.7767333984375, 7.0078125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 5.0, 8.0, 5.0, 9.0, 18.0, 12.0, 11.0, 20.0, 23.0, 17.0, 21.0, 22.0, 20.0, 26.0, 32.0, 24.0, 38.0, 35.0, 40.0, 36.0, 43.0, 38.0, 34.0, 35.0, 32.0, 31.0, 42.0, 30.0, 31.0, 27.0, 23.0, 18.0, 25.0, 24.0, 23.0, 20.0, 17.0, 15.0, 11.0, 5.0, 10.0, 2.0, 6.0, 9.0, 1.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.8359375, -9.5245361328125, -9.213134765625, -8.9017333984375, -8.59033203125, -8.2789306640625, -7.967529296875, -7.6561279296875, -7.3447265625, -7.0333251953125, -6.721923828125, -6.4105224609375, -6.09912109375, -5.7877197265625, -5.476318359375, -5.1649169921875, -4.853515625, -4.5421142578125, -4.230712890625, -3.9193115234375, -3.60791015625, -3.2965087890625, -2.985107421875, -2.6737060546875, -2.3623046875, -2.0509033203125, -1.739501953125, -1.4281005859375, -1.11669921875, -0.8052978515625, -0.493896484375, -0.1824951171875, 0.12890625, 0.4403076171875, 0.751708984375, 1.0631103515625, 1.37451171875, 1.6859130859375, 1.997314453125, 2.3087158203125, 2.6201171875, 2.9315185546875, 3.242919921875, 3.5543212890625, 3.86572265625, 4.1771240234375, 4.488525390625, 4.7999267578125, 5.111328125, 5.4227294921875, 5.734130859375, 6.0455322265625, 6.35693359375, 6.6683349609375, 6.979736328125, 7.2911376953125, 7.6025390625, 7.9139404296875, 8.225341796875, 8.5367431640625, 8.84814453125, 9.1595458984375, 9.470947265625, 9.7823486328125, 10.09375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 14.0, 23.0, 30.0, 61.0, 82.0, 158.0, 242.0, 479.0, 828.0, 1310.0, 2153.0, 3778.0, 6380.0, 10595.0, 16881.0, 26930.0, 42391.0, 64065.0, 95351.0, 134480.0, 183292.0, 241291.0, 297232.0, 347798.0, 383806.0, 397416.0, 388058.0, 356146.0, 307505.0, 251905.0, 195101.0, 143942.0, 102071.0, 69729.0, 46479.0, 29516.0, 18441.0, 11241.0, 6971.0, 4216.0, 2475.0, 1449.0, 840.0, 496.0, 271.0, 157.0, 98.0, 53.0, 27.0, 21.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.89453125, -7.65234375, -7.41015625, -7.16796875, -6.92578125, -6.68359375, -6.44140625, -6.19921875, -5.95703125, -5.71484375, -5.47265625, -5.23046875, -4.98828125, -4.74609375, -4.50390625, -4.26171875, -4.01953125, -3.77734375, -3.53515625, -3.29296875, -3.05078125, -2.80859375, -2.56640625, -2.32421875, -2.08203125, -1.83984375, -1.59765625, -1.35546875, -1.11328125, -0.87109375, -0.62890625, -0.38671875, -0.14453125, 0.09765625, 0.33984375, 0.58203125, 0.82421875, 1.06640625, 1.30859375, 1.55078125, 1.79296875, 2.03515625, 2.27734375, 2.51953125, 2.76171875, 3.00390625, 3.24609375, 3.48828125, 3.73046875, 3.97265625, 4.21484375, 4.45703125, 4.69921875, 4.94140625, 5.18359375, 5.42578125, 5.66796875, 5.91015625, 6.15234375, 6.39453125, 6.63671875, 6.87890625, 7.12109375, 7.36328125, 7.60546875]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 11.0, 12.0, 16.0, 18.0, 17.0, 31.0, 32.0, 38.0, 55.0, 53.0, 61.0, 90.0, 116.0, 113.0, 121.0, 144.0, 168.0, 148.0, 199.0, 181.0, 191.0, 226.0, 208.0, 190.0, 170.0, 195.0, 162.0, 154.0, 140.0, 121.0, 104.0, 80.0, 84.0, 91.0, 68.0, 47.0, 50.0, 34.0, 34.0, 23.0, 16.0, 21.0, 9.0, 8.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-4.69140625, -4.53472900390625, -4.3780517578125, -4.22137451171875, -4.064697265625, -3.90802001953125, -3.7513427734375, -3.59466552734375, -3.43798828125, -3.28131103515625, -3.1246337890625, -2.96795654296875, -2.811279296875, -2.65460205078125, -2.4979248046875, -2.34124755859375, -2.1845703125, -2.02789306640625, -1.8712158203125, -1.71453857421875, -1.557861328125, -1.40118408203125, -1.2445068359375, -1.08782958984375, -0.93115234375, -0.77447509765625, -0.6177978515625, -0.46112060546875, -0.304443359375, -0.14776611328125, 0.0089111328125, 0.16558837890625, 0.322265625, 0.47894287109375, 0.6356201171875, 0.79229736328125, 0.948974609375, 1.10565185546875, 1.2623291015625, 1.41900634765625, 1.57568359375, 1.73236083984375, 1.8890380859375, 2.04571533203125, 2.202392578125, 2.35906982421875, 2.5157470703125, 2.67242431640625, 2.8291015625, 2.98577880859375, 3.1424560546875, 3.29913330078125, 3.455810546875, 3.61248779296875, 3.7691650390625, 3.92584228515625, 4.08251953125, 4.23919677734375, 4.3958740234375, 4.55255126953125, 4.709228515625, 4.86590576171875, 5.0225830078125, 5.17926025390625, 5.3359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 9.0, 5.0, 13.0, 13.0, 22.0, 20.0, 35.0, 30.0, 34.0, 32.0, 45.0, 42.0, 51.0, 64.0, 41.0, 46.0, 42.0, 48.0, 49.0, 49.0, 22.0, 31.0, 28.0, 41.0, 24.0, 33.0, 20.0, 18.0, 20.0, 12.0, 13.0, 8.0, 7.0, 3.0, 3.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.385276794433594, -13.01187515258789, -12.638473510742188, -12.265071868896484, -11.891670227050781, -11.518268585205078, -11.144866943359375, -10.771465301513672, -10.398063659667969, -10.024662017822266, -9.651260375976562, -9.27785873413086, -8.904457092285156, -8.531055450439453, -8.15765380859375, -7.784252643585205, -7.41085147857666, -7.037449836730957, -6.664048194885254, -6.290646553039551, -5.917244911193848, -5.5438432693481445, -5.1704421043396, -4.7970404624938965, -4.423638820648193, -4.05023717880249, -3.676835536956787, -3.303434133529663, -2.93003249168396, -2.556630849838257, -2.183229446411133, -1.8098278045654297, -1.4364261627197266, -1.0630245208740234, -0.6896229982376099, -0.3162214756011963, 0.057180166244506836, 0.43058180809020996, 0.803983211517334, 1.177384853363037, 1.5507864952087402, 1.9241881370544434, 2.2975897789001465, 2.6709911823272705, 3.0443928241729736, 3.4177944660186768, 3.791195869445801, 4.164597511291504, 4.537999153137207, 4.91140079498291, 5.284802436828613, 5.658204078674316, 6.0316057205200195, 6.405007362365723, 6.778408527374268, 7.151810169219971, 7.525211811065674, 7.898613452911377, 8.272014617919922, 8.645416259765625, 9.018817901611328, 9.392219543457031, 9.765621185302734, 10.139022827148438, 10.51242446899414]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 3.0, 7.0, 5.0, 9.0, 14.0, 10.0, 10.0, 13.0, 15.0, 16.0, 21.0, 27.0, 20.0, 20.0, 27.0, 26.0, 38.0, 28.0, 35.0, 43.0, 30.0, 46.0, 53.0, 40.0, 42.0, 39.0, 34.0, 39.0, 27.0, 25.0, 25.0, 30.0, 19.0, 18.0, 19.0, 21.0, 15.0, 16.0, 7.0, 9.0, 14.0, 8.0, 5.0, 4.0, 10.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-14.16443920135498, -13.749457359313965, -13.334474563598633, -12.919492721557617, -12.504510879516602, -12.089529037475586, -11.67454719543457, -11.259564399719238, -10.844582557678223, -10.429600715637207, -10.014617919921875, -9.59963607788086, -9.184654235839844, -8.769672393798828, -8.354690551757812, -7.9397077560424805, -7.524725914001465, -7.109744071960449, -6.694761753082275, -6.279779434204102, -5.864797592163086, -5.44981575012207, -5.0348334312438965, -4.619851112365723, -4.204869270324707, -3.7898871898651123, -3.3749051094055176, -2.959923028945923, -2.544940948486328, -2.1299588680267334, -1.7149767875671387, -1.299994707107544, -0.8850126266479492, -0.4700305461883545, -0.055048465728759766, 0.35993361473083496, 0.7749156951904297, 1.1898977756500244, 1.6048798561096191, 2.019861936569214, 2.4348440170288086, 2.8498260974884033, 3.264808177947998, 3.6797902584075928, 4.0947723388671875, 4.509754180908203, 4.924736499786377, 5.339718818664551, 5.754700660705566, 6.169682502746582, 6.584664821624756, 6.99964714050293, 7.414628982543945, 7.829610824584961, 8.244592666625977, 8.659575462341309, 9.074557304382324, 9.48953914642334, 9.904521942138672, 10.319503784179688, 10.734485626220703, 11.149467468261719, 11.564449310302734, 11.979432106018066, 12.394413948059082]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 10.0, 15.0, 20.0, 21.0, 37.0, 76.0, 90.0, 150.0, 208.0, 244.0, 406.0, 565.0, 846.0, 1198.0, 1719.0, 2514.0, 3663.0, 5646.0, 8112.0, 12116.0, 18272.0, 28204.0, 44706.0, 72149.0, 120289.0, 185565.0, 194308.0, 129626.0, 79440.0, 48115.0, 30619.0, 19558.0, 12909.0, 8545.0, 5809.0, 3999.0, 2742.0, 1824.0, 1304.0, 905.0, 666.0, 420.0, 312.0, 214.0, 125.0, 96.0, 66.0, 37.0, 18.0, 26.0, 16.0, 12.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.26171875, -2.19122314453125, -2.1207275390625, -2.05023193359375, -1.979736328125, -1.90924072265625, -1.8387451171875, -1.76824951171875, -1.69775390625, -1.62725830078125, -1.5567626953125, -1.48626708984375, -1.415771484375, -1.34527587890625, -1.2747802734375, -1.20428466796875, -1.1337890625, -1.06329345703125, -0.9927978515625, -0.92230224609375, -0.851806640625, -0.78131103515625, -0.7108154296875, -0.64031982421875, -0.56982421875, -0.49932861328125, -0.4288330078125, -0.35833740234375, -0.287841796875, -0.21734619140625, -0.1468505859375, -0.07635498046875, -0.005859375, 0.06463623046875, 0.1351318359375, 0.20562744140625, 0.276123046875, 0.34661865234375, 0.4171142578125, 0.48760986328125, 0.55810546875, 0.62860107421875, 0.6990966796875, 0.76959228515625, 0.840087890625, 0.91058349609375, 0.9810791015625, 1.05157470703125, 1.1220703125, 1.19256591796875, 1.2630615234375, 1.33355712890625, 1.404052734375, 1.47454833984375, 1.5450439453125, 1.61553955078125, 1.68603515625, 1.75653076171875, 1.8270263671875, 1.89752197265625, 1.968017578125, 2.03851318359375, 2.1090087890625, 2.17950439453125, 2.25]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 7.0, 2.0, 8.0, 10.0, 13.0, 13.0, 18.0, 14.0, 11.0, 17.0, 16.0, 19.0, 17.0, 31.0, 28.0, 30.0, 40.0, 34.0, 50.0, 41.0, 45.0, 34.0, 51.0, 44.0, 41.0, 42.0, 32.0, 26.0, 26.0, 37.0, 28.0, 20.0, 18.0, 17.0, 22.0, 20.0, 15.0, 10.0, 15.0, 7.0, 8.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9921875, -13.54833984375, -13.1044921875, -12.66064453125, -12.216796875, -11.77294921875, -11.3291015625, -10.88525390625, -10.44140625, -9.99755859375, -9.5537109375, -9.10986328125, -8.666015625, -8.22216796875, -7.7783203125, -7.33447265625, -6.890625, -6.44677734375, -6.0029296875, -5.55908203125, -5.115234375, -4.67138671875, -4.2275390625, -3.78369140625, -3.33984375, -2.89599609375, -2.4521484375, -2.00830078125, -1.564453125, -1.12060546875, -0.6767578125, -0.23291015625, 0.2109375, 0.65478515625, 1.0986328125, 1.54248046875, 1.986328125, 2.43017578125, 2.8740234375, 3.31787109375, 3.76171875, 4.20556640625, 4.6494140625, 5.09326171875, 5.537109375, 5.98095703125, 6.4248046875, 6.86865234375, 7.3125, 7.75634765625, 8.2001953125, 8.64404296875, 9.087890625, 9.53173828125, 9.9755859375, 10.41943359375, 10.86328125, 11.30712890625, 11.7509765625, 12.19482421875, 12.638671875, 13.08251953125, 13.5263671875, 13.97021484375, 14.4140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 5.0, 8.0, 7.0, 9.0, 13.0, 20.0, 23.0, 20.0, 34.0, 24.0, 52.0, 60.0, 69.0, 104.0, 152.0, 203.0, 239.0, 345.0, 461.0, 702.0, 1005.0, 1572.0, 2819.0, 5386.0, 12167.0, 32233.0, 887775.0, 63845.0, 20390.0, 8495.0, 3945.0, 2124.0, 1283.0, 826.0, 569.0, 365.0, 282.0, 209.0, 165.0, 135.0, 93.0, 79.0, 41.0, 42.0, 33.0, 23.0, 30.0, 22.0, 13.0, 10.0, 5.0, 11.0, 4.0, 3.0, 9.0, 2.0, 1.0, 2.0], "bins": [-8.515625, -8.255859375, -7.99609375, -7.736328125, -7.4765625, -7.216796875, -6.95703125, -6.697265625, -6.4375, -6.177734375, -5.91796875, -5.658203125, -5.3984375, -5.138671875, -4.87890625, -4.619140625, -4.359375, -4.099609375, -3.83984375, -3.580078125, -3.3203125, -3.060546875, -2.80078125, -2.541015625, -2.28125, -2.021484375, -1.76171875, -1.501953125, -1.2421875, -0.982421875, -0.72265625, -0.462890625, -0.203125, 0.056640625, 0.31640625, 0.576171875, 0.8359375, 1.095703125, 1.35546875, 1.615234375, 1.875, 2.134765625, 2.39453125, 2.654296875, 2.9140625, 3.173828125, 3.43359375, 3.693359375, 3.953125, 4.212890625, 4.47265625, 4.732421875, 4.9921875, 5.251953125, 5.51171875, 5.771484375, 6.03125, 6.291015625, 6.55078125, 6.810546875, 7.0703125, 7.330078125, 7.58984375, 7.849609375, 8.109375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 3.0, 6.0, 3.0, 5.0, 13.0, 9.0, 16.0, 11.0, 14.0, 15.0, 23.0, 20.0, 19.0, 18.0, 25.0, 23.0, 30.0, 31.0, 32.0, 48.0, 40.0, 34.0, 45.0, 57.0, 46.0, 37.0, 30.0, 26.0, 42.0, 25.0, 30.0, 24.0, 34.0, 20.0, 19.0, 23.0, 18.0, 19.0, 12.0, 13.0, 11.0, 2.0, 4.0, 5.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.8125, -8.5220947265625, -8.231689453125, -7.9412841796875, -7.65087890625, -7.3604736328125, -7.070068359375, -6.7796630859375, -6.4892578125, -6.1988525390625, -5.908447265625, -5.6180419921875, -5.32763671875, -5.0372314453125, -4.746826171875, -4.4564208984375, -4.166015625, -3.8756103515625, -3.585205078125, -3.2947998046875, -3.00439453125, -2.7139892578125, -2.423583984375, -2.1331787109375, -1.8427734375, -1.5523681640625, -1.261962890625, -0.9715576171875, -0.68115234375, -0.3907470703125, -0.100341796875, 0.1900634765625, 0.48046875, 0.7708740234375, 1.061279296875, 1.3516845703125, 1.64208984375, 1.9324951171875, 2.222900390625, 2.5133056640625, 2.8037109375, 3.0941162109375, 3.384521484375, 3.6749267578125, 3.96533203125, 4.2557373046875, 4.546142578125, 4.8365478515625, 5.126953125, 5.4173583984375, 5.707763671875, 5.9981689453125, 6.28857421875, 6.5789794921875, 6.869384765625, 7.1597900390625, 7.4501953125, 7.7406005859375, 8.031005859375, 8.3214111328125, 8.61181640625, 8.9022216796875, 9.192626953125, 9.4830322265625, 9.7734375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 10.0, 11.0, 13.0, 14.0, 23.0, 21.0, 40.0, 38.0, 63.0, 95.0, 114.0, 139.0, 189.0, 300.0, 426.0, 643.0, 1016.0, 1769.0, 3541.0, 8115.0, 25336.0, 923479.0, 57927.0, 13685.0, 5213.0, 2396.0, 1361.0, 778.0, 552.0, 349.0, 235.0, 185.0, 114.0, 109.0, 69.0, 39.0, 39.0, 21.0, 20.0, 23.0, 13.0, 12.0, 2.0, 6.0, 7.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.66796875, -0.6481781005859375, -0.628387451171875, -0.6085968017578125, -0.58880615234375, -0.5690155029296875, -0.549224853515625, -0.5294342041015625, -0.5096435546875, -0.4898529052734375, -0.470062255859375, -0.4502716064453125, -0.43048095703125, -0.4106903076171875, -0.390899658203125, -0.3711090087890625, -0.351318359375, -0.3315277099609375, -0.311737060546875, -0.2919464111328125, -0.27215576171875, -0.2523651123046875, -0.232574462890625, -0.2127838134765625, -0.1929931640625, -0.1732025146484375, -0.153411865234375, -0.1336212158203125, -0.11383056640625, -0.0940399169921875, -0.074249267578125, -0.0544586181640625, -0.03466796875, -0.0148773193359375, 0.004913330078125, 0.0247039794921875, 0.04449462890625, 0.0642852783203125, 0.084075927734375, 0.1038665771484375, 0.1236572265625, 0.1434478759765625, 0.163238525390625, 0.1830291748046875, 0.20281982421875, 0.2226104736328125, 0.242401123046875, 0.2621917724609375, 0.281982421875, 0.3017730712890625, 0.321563720703125, 0.3413543701171875, 0.36114501953125, 0.3809356689453125, 0.400726318359375, 0.4205169677734375, 0.4403076171875, 0.4600982666015625, 0.479888916015625, 0.4996795654296875, 0.51947021484375, 0.5392608642578125, 0.559051513671875, 0.5788421630859375, 0.5986328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 9.0, 14.0, 12.0, 14.0, 23.0, 17.0, 31.0, 33.0, 33.0, 43.0, 53.0, 43.0, 44.0, 45.0, 44.0, 46.0, 60.0, 42.0, 49.0, 44.0, 50.0, 34.0, 30.0, 26.0, 37.0, 20.0, 20.0, 14.0, 8.0, 22.0, 6.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9141387939453125e-06, -6.662681698799133e-06, -6.411224603652954e-06, -6.159767508506775e-06, -5.908310413360596e-06, -5.6568533182144165e-06, -5.405396223068237e-06, -5.153939127922058e-06, -4.902482032775879e-06, -4.6510249376297e-06, -4.3995678424835205e-06, -4.148110747337341e-06, -3.896653652191162e-06, -3.645196557044983e-06, -3.3937394618988037e-06, -3.1422823667526245e-06, -2.8908252716064453e-06, -2.639368176460266e-06, -2.387911081314087e-06, -2.1364539861679077e-06, -1.8849968910217285e-06, -1.6335397958755493e-06, -1.3820827007293701e-06, -1.130625605583191e-06, -8.791685104370117e-07, -6.277114152908325e-07, -3.762543201446533e-07, -1.2479722499847412e-07, 1.2665987014770508e-07, 3.781169652938843e-07, 6.295740604400635e-07, 8.810311555862427e-07, 1.1324882507324219e-06, 1.383945345878601e-06, 1.6354024410247803e-06, 1.8868595361709595e-06, 2.1383166313171387e-06, 2.389773726463318e-06, 2.641230821609497e-06, 2.8926879167556763e-06, 3.1441450119018555e-06, 3.3956021070480347e-06, 3.647059202194214e-06, 3.898516297340393e-06, 4.149973392486572e-06, 4.4014304876327515e-06, 4.652887582778931e-06, 4.90434467792511e-06, 5.155801773071289e-06, 5.407258868217468e-06, 5.6587159633636475e-06, 5.910173058509827e-06, 6.161630153656006e-06, 6.413087248802185e-06, 6.664544343948364e-06, 6.9160014390945435e-06, 7.167458534240723e-06, 7.418915629386902e-06, 7.670372724533081e-06, 7.92182981967926e-06, 8.17328691482544e-06, 8.424744009971619e-06, 8.676201105117798e-06, 8.927658200263977e-06, 9.179115295410156e-06]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 2.0, 14.0, 18.0, 19.0, 24.0, 31.0, 75.0, 109.0, 153.0, 222.0, 350.0, 553.0, 758.0, 1221.0, 1893.0, 2794.0, 4421.0, 6829.0, 10536.0, 16605.0, 26607.0, 42735.0, 72795.0, 136480.0, 279317.0, 200039.0, 97156.0, 55325.0, 33414.0, 20667.0, 13219.0, 8602.0, 5436.0, 3453.0, 2304.0, 1458.0, 1061.0, 597.0, 419.0, 243.0, 203.0, 135.0, 84.0, 45.0, 50.0, 28.0, 12.0, 12.0, 4.0, 9.0, 3.0, 5.0, 3.0, 1.0, 4.0, 2.0], "bins": [-0.294921875, -0.2859153747558594, -0.27690887451171875, -0.2679023742675781, -0.2588958740234375, -0.24988937377929688, -0.24088287353515625, -0.23187637329101562, -0.222869873046875, -0.21386337280273438, -0.20485687255859375, -0.19585037231445312, -0.1868438720703125, -0.17783737182617188, -0.16883087158203125, -0.15982437133789062, -0.15081787109375, -0.14181137084960938, -0.13280487060546875, -0.12379837036132812, -0.1147918701171875, -0.10578536987304688, -0.09677886962890625, -0.08777236938476562, -0.078765869140625, -0.06975936889648438, -0.06075286865234375, -0.051746368408203125, -0.0427398681640625, -0.033733367919921875, -0.02472686767578125, -0.015720367431640625, -0.0067138671875, 0.002292633056640625, 0.01129913330078125, 0.020305633544921875, 0.0293121337890625, 0.038318634033203125, 0.04732513427734375, 0.056331634521484375, 0.065338134765625, 0.07434463500976562, 0.08335113525390625, 0.09235763549804688, 0.1013641357421875, 0.11037063598632812, 0.11937713623046875, 0.12838363647460938, 0.13739013671875, 0.14639663696289062, 0.15540313720703125, 0.16440963745117188, 0.1734161376953125, 0.18242263793945312, 0.19142913818359375, 0.20043563842773438, 0.209442138671875, 0.21844863891601562, 0.22745513916015625, 0.23646163940429688, 0.2454681396484375, 0.2544746398925781, 0.26348114013671875, 0.2724876403808594, 0.281494140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 11.0, 7.0, 6.0, 15.0, 14.0, 8.0, 17.0, 12.0, 21.0, 32.0, 27.0, 30.0, 46.0, 78.0, 61.0, 88.0, 93.0, 65.0, 79.0, 55.0, 48.0, 30.0, 26.0, 23.0, 15.0, 8.0, 10.0, 8.0, 14.0, 2.0, 8.0, 8.0, 11.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.2301025390625, -0.2231578826904297, -0.21621322631835938, -0.20926856994628906, -0.20232391357421875, -0.19537925720214844, -0.18843460083007812, -0.1814899444580078, -0.1745452880859375, -0.1676006317138672, -0.16065597534179688, -0.15371131896972656, -0.14676666259765625, -0.13982200622558594, -0.13287734985351562, -0.1259326934814453, -0.118988037109375, -0.11204338073730469, -0.10509872436523438, -0.09815406799316406, -0.09120941162109375, -0.08426475524902344, -0.07732009887695312, -0.07037544250488281, -0.0634307861328125, -0.05648612976074219, -0.049541473388671875, -0.04259681701660156, -0.03565216064453125, -0.028707504272460938, -0.021762847900390625, -0.014818191528320312, -0.00787353515625, -0.0009288787841796875, 0.006015777587890625, 0.012960433959960938, 0.01990509033203125, 0.026849746704101562, 0.033794403076171875, 0.04073905944824219, 0.0476837158203125, 0.05462837219238281, 0.061573028564453125, 0.06851768493652344, 0.07546234130859375, 0.08240699768066406, 0.08935165405273438, 0.09629631042480469, 0.103240966796875, 0.11018562316894531, 0.11713027954101562, 0.12407493591308594, 0.13101959228515625, 0.13796424865722656, 0.14490890502929688, 0.1518535614013672, 0.1587982177734375, 0.1657428741455078, 0.17268753051757812, 0.17963218688964844, 0.18657684326171875, 0.19352149963378906, 0.20046615600585938, 0.2074108123779297, 0.21435546875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 4.0, 12.0, 5.0, 14.0, 14.0, 18.0, 24.0, 32.0, 26.0, 38.0, 34.0, 38.0, 52.0, 49.0, 55.0, 46.0, 44.0, 39.0, 55.0, 50.0, 42.0, 26.0, 36.0, 34.0, 29.0, 31.0, 29.0, 23.0, 14.0, 21.0, 11.0, 12.0, 11.0, 7.0, 3.0, 2.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.446080207824707, -13.072214126586914, -12.698347091674805, -12.324481010437012, -11.950614929199219, -11.576748847961426, -11.202882766723633, -10.829015731811523, -10.45514965057373, -10.081283569335938, -9.707416534423828, -9.333550453186035, -8.959684371948242, -8.58581829071045, -8.211952209472656, -7.838085174560547, -7.464219093322754, -7.090353012084961, -6.71648645401001, -6.342619895935059, -5.968753814697266, -5.594887733459473, -5.2210211753845215, -4.84715461730957, -4.473288536071777, -4.099422454833984, -3.725555896759033, -3.351689577102661, -2.977823257446289, -2.603956937789917, -2.230090618133545, -1.8562242984771729, -1.4823570251464844, -1.1084907054901123, -0.7346243858337402, -0.36075806617736816, 0.013108253479003906, 0.386974573135376, 0.760840892791748, 1.1347072124481201, 1.5085735321044922, 1.8824398517608643, 2.2563061714172363, 2.6301724910736084, 3.0040388107299805, 3.3779051303863525, 3.7517714500427246, 4.125638008117676, 4.499504089355469, 4.873370170593262, 5.247236728668213, 5.621103286743164, 5.994969367980957, 6.36883544921875, 6.742702007293701, 7.116568565368652, 7.490434646606445, 7.864300727844238, 8.238166809082031, 8.61203384399414, 8.985899925231934, 9.359766006469727, 9.733633041381836, 10.107499122619629, 10.481365203857422]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 7.0, 6.0, 9.0, 14.0, 8.0, 13.0, 12.0, 17.0, 20.0, 12.0, 28.0, 25.0, 17.0, 32.0, 25.0, 33.0, 33.0, 41.0, 36.0, 35.0, 41.0, 53.0, 41.0, 40.0, 41.0, 40.0, 34.0, 23.0, 31.0, 27.0, 24.0, 19.0, 16.0, 24.0, 15.0, 17.0, 15.0, 8.0, 10.0, 14.0, 5.0, 6.0, 6.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.201780319213867, -13.784958839416504, -13.36813735961914, -12.951315879821777, -12.534494400024414, -12.117673873901367, -11.700852394104004, -11.28403091430664, -10.867209434509277, -10.450387954711914, -10.03356647491455, -9.616744995117188, -9.19992446899414, -8.783102035522461, -8.366281509399414, -7.949460029602051, -7.5326385498046875, -7.115817070007324, -6.698995590209961, -6.282174587249756, -5.865353107452393, -5.448531627655029, -5.031710624694824, -4.614889144897461, -4.198067665100098, -3.7812461853027344, -3.36442494392395, -2.947603702545166, -2.5307822227478027, -2.1139607429504395, -1.6971395015716553, -1.280318260192871, -0.8634967803955078, -0.4466754198074341, -0.02985405921936035, 0.3869673013687134, 0.8037886619567871, 1.2206101417541504, 1.6374313831329346, 2.0542526245117188, 2.471074104309082, 2.8878955841064453, 3.3047168254852295, 3.7215380668640137, 4.138359546661377, 4.55518102645874, 4.972002029418945, 5.388823509216309, 5.805644989013672, 6.222466468811035, 6.639287948608398, 7.0561089515686035, 7.472930431365967, 7.88975191116333, 8.306572914123535, 8.723394393920898, 9.140215873718262, 9.557037353515625, 9.973858833312988, 10.390680313110352, 10.807500839233398, 11.224323272705078, 11.641143798828125, 12.057965278625488, 12.474786758422852]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 16.0, 15.0, 34.0, 63.0, 83.0, 148.0, 215.0, 317.0, 469.0, 718.0, 1204.0, 1675.0, 2496.0, 3849.0, 5623.0, 8212.0, 12107.0, 16905.0, 23375.0, 31645.0, 41698.0, 52747.0, 64171.0, 75244.0, 83300.0, 88197.0, 89541.0, 84666.0, 77251.0, 66826.0, 55349.0, 43605.0, 33292.0, 25035.0, 18074.0, 12992.0, 8963.0, 6151.0, 4062.0, 2789.0, 1856.0, 1257.0, 803.0, 567.0, 356.0, 224.0, 125.0, 103.0, 55.0, 39.0, 22.0, 5.0, 11.0, 6.0, 9.0, 3.0, 0.0, 1.0], "bins": [-5.37109375, -5.20379638671875, -5.0364990234375, -4.86920166015625, -4.701904296875, -4.53460693359375, -4.3673095703125, -4.20001220703125, -4.03271484375, -3.86541748046875, -3.6981201171875, -3.53082275390625, -3.363525390625, -3.19622802734375, -3.0289306640625, -2.86163330078125, -2.6943359375, -2.52703857421875, -2.3597412109375, -2.19244384765625, -2.025146484375, -1.85784912109375, -1.6905517578125, -1.52325439453125, -1.35595703125, -1.18865966796875, -1.0213623046875, -0.85406494140625, -0.686767578125, -0.51947021484375, -0.3521728515625, -0.18487548828125, -0.017578125, 0.14971923828125, 0.3170166015625, 0.48431396484375, 0.651611328125, 0.81890869140625, 0.9862060546875, 1.15350341796875, 1.32080078125, 1.48809814453125, 1.6553955078125, 1.82269287109375, 1.989990234375, 2.15728759765625, 2.3245849609375, 2.49188232421875, 2.6591796875, 2.82647705078125, 2.9937744140625, 3.16107177734375, 3.328369140625, 3.49566650390625, 3.6629638671875, 3.83026123046875, 3.99755859375, 4.16485595703125, 4.3321533203125, 4.49945068359375, 4.666748046875, 4.83404541015625, 5.0013427734375, 5.16864013671875, 5.3359375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 0.0, 3.0, 5.0, 5.0, 6.0, 11.0, 14.0, 17.0, 6.0, 11.0, 16.0, 21.0, 14.0, 27.0, 29.0, 27.0, 33.0, 28.0, 30.0, 27.0, 36.0, 41.0, 45.0, 50.0, 39.0, 45.0, 41.0, 31.0, 31.0, 32.0, 32.0, 25.0, 17.0, 28.0, 19.0, 26.0, 22.0, 18.0, 8.0, 20.0, 9.0, 8.0, 7.0, 8.0, 8.0, 2.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0], "bins": [-14.5546875, -14.1370849609375, -13.719482421875, -13.3018798828125, -12.88427734375, -12.4666748046875, -12.049072265625, -11.6314697265625, -11.2138671875, -10.7962646484375, -10.378662109375, -9.9610595703125, -9.54345703125, -9.1258544921875, -8.708251953125, -8.2906494140625, -7.873046875, -7.4554443359375, -7.037841796875, -6.6202392578125, -6.20263671875, -5.7850341796875, -5.367431640625, -4.9498291015625, -4.5322265625, -4.1146240234375, -3.697021484375, -3.2794189453125, -2.86181640625, -2.4442138671875, -2.026611328125, -1.6090087890625, -1.19140625, -0.7738037109375, -0.356201171875, 0.0614013671875, 0.47900390625, 0.8966064453125, 1.314208984375, 1.7318115234375, 2.1494140625, 2.5670166015625, 2.984619140625, 3.4022216796875, 3.81982421875, 4.2374267578125, 4.655029296875, 5.0726318359375, 5.490234375, 5.9078369140625, 6.325439453125, 6.7430419921875, 7.16064453125, 7.5782470703125, 7.995849609375, 8.4134521484375, 8.8310546875, 9.2486572265625, 9.666259765625, 10.0838623046875, 10.50146484375, 10.9190673828125, 11.336669921875, 11.7542724609375, 12.171875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 6.0, 9.0, 12.0, 25.0, 24.0, 67.0, 110.0, 188.0, 315.0, 497.0, 812.0, 1336.0, 2111.0, 3554.0, 5675.0, 8692.0, 13457.0, 20366.0, 30038.0, 41866.0, 56532.0, 72977.0, 88000.0, 100095.0, 105950.0, 102889.0, 94078.0, 80679.0, 64034.0, 48911.0, 35139.0, 24664.0, 16547.0, 10686.0, 6784.0, 4473.0, 2601.0, 1676.0, 1044.0, 629.0, 384.0, 256.0, 163.0, 80.0, 48.0, 36.0, 21.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.3515625, -6.15142822265625, -5.9512939453125, -5.75115966796875, -5.551025390625, -5.35089111328125, -5.1507568359375, -4.95062255859375, -4.75048828125, -4.55035400390625, -4.3502197265625, -4.15008544921875, -3.949951171875, -3.74981689453125, -3.5496826171875, -3.34954833984375, -3.1494140625, -2.94927978515625, -2.7491455078125, -2.54901123046875, -2.348876953125, -2.14874267578125, -1.9486083984375, -1.74847412109375, -1.54833984375, -1.34820556640625, -1.1480712890625, -0.94793701171875, -0.747802734375, -0.54766845703125, -0.3475341796875, -0.14739990234375, 0.052734375, 0.25286865234375, 0.4530029296875, 0.65313720703125, 0.853271484375, 1.05340576171875, 1.2535400390625, 1.45367431640625, 1.65380859375, 1.85394287109375, 2.0540771484375, 2.25421142578125, 2.454345703125, 2.65447998046875, 2.8546142578125, 3.05474853515625, 3.2548828125, 3.45501708984375, 3.6551513671875, 3.85528564453125, 4.055419921875, 4.25555419921875, 4.4556884765625, 4.65582275390625, 4.85595703125, 5.05609130859375, 5.2562255859375, 5.45635986328125, 5.656494140625, 5.85662841796875, 6.0567626953125, 6.25689697265625, 6.45703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 5.0, 6.0, 11.0, 6.0, 3.0, 13.0, 14.0, 18.0, 10.0, 17.0, 21.0, 26.0, 25.0, 29.0, 29.0, 27.0, 50.0, 30.0, 27.0, 31.0, 47.0, 34.0, 36.0, 39.0, 48.0, 45.0, 36.0, 40.0, 39.0, 34.0, 32.0, 23.0, 16.0, 39.0, 17.0, 22.0, 11.0, 9.0, 7.0, 1.0, 6.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5078125, -8.212890625, -7.91796875, -7.623046875, -7.328125, -7.033203125, -6.73828125, -6.443359375, -6.1484375, -5.853515625, -5.55859375, -5.263671875, -4.96875, -4.673828125, -4.37890625, -4.083984375, -3.7890625, -3.494140625, -3.19921875, -2.904296875, -2.609375, -2.314453125, -2.01953125, -1.724609375, -1.4296875, -1.134765625, -0.83984375, -0.544921875, -0.25, 0.044921875, 0.33984375, 0.634765625, 0.9296875, 1.224609375, 1.51953125, 1.814453125, 2.109375, 2.404296875, 2.69921875, 2.994140625, 3.2890625, 3.583984375, 3.87890625, 4.173828125, 4.46875, 4.763671875, 5.05859375, 5.353515625, 5.6484375, 5.943359375, 6.23828125, 6.533203125, 6.828125, 7.123046875, 7.41796875, 7.712890625, 8.0078125, 8.302734375, 8.59765625, 8.892578125, 9.1875, 9.482421875, 9.77734375, 10.072265625, 10.3671875]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 7.0, 4.0, 10.0, 24.0, 34.0, 40.0, 59.0, 102.0, 158.0, 235.0, 401.0, 593.0, 1028.0, 1670.0, 2632.0, 4356.0, 6834.0, 10973.0, 16742.0, 24991.0, 36255.0, 50170.0, 65236.0, 81782.0, 94513.0, 103248.0, 104533.0, 98860.0, 87270.0, 72667.0, 56322.0, 42003.0, 29335.0, 19933.0, 13134.0, 8483.0, 5331.0, 3364.0, 1971.0, 1245.0, 772.0, 473.0, 284.0, 169.0, 107.0, 78.0, 45.0, 26.0, 23.0, 10.0, 8.0, 4.0, 5.0, 3.0, 3.0, 5.0, 2.0], "bins": [-2.166015625, -2.100799560546875, -2.03558349609375, -1.970367431640625, -1.9051513671875, -1.839935302734375, -1.77471923828125, -1.709503173828125, -1.644287109375, -1.579071044921875, -1.51385498046875, -1.448638916015625, -1.3834228515625, -1.318206787109375, -1.25299072265625, -1.187774658203125, -1.12255859375, -1.057342529296875, -0.99212646484375, -0.926910400390625, -0.8616943359375, -0.796478271484375, -0.73126220703125, -0.666046142578125, -0.600830078125, -0.535614013671875, -0.47039794921875, -0.405181884765625, -0.3399658203125, -0.274749755859375, -0.20953369140625, -0.144317626953125, -0.0791015625, -0.013885498046875, 0.05133056640625, 0.116546630859375, 0.1817626953125, 0.246978759765625, 0.31219482421875, 0.377410888671875, 0.442626953125, 0.507843017578125, 0.57305908203125, 0.638275146484375, 0.7034912109375, 0.768707275390625, 0.83392333984375, 0.899139404296875, 0.96435546875, 1.029571533203125, 1.09478759765625, 1.160003662109375, 1.2252197265625, 1.290435791015625, 1.35565185546875, 1.420867919921875, 1.486083984375, 1.551300048828125, 1.61651611328125, 1.681732177734375, 1.7469482421875, 1.812164306640625, 1.87738037109375, 1.942596435546875, 2.0078125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 14.0, 2.0, 6.0, 10.0, 9.0, 12.0, 17.0, 24.0, 28.0, 25.0, 26.0, 30.0, 27.0, 23.0, 32.0, 38.0, 50.0, 43.0, 29.0, 48.0, 38.0, 42.0, 37.0, 52.0, 35.0, 34.0, 36.0, 23.0, 32.0, 24.0, 20.0, 21.0, 22.0, 23.0, 12.0, 6.0, 11.0, 10.0, 5.0, 2.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002301931381225586, -0.00022248364984989166, -0.00021477416157722473, -0.0002070646733045578, -0.00019935518503189087, -0.00019164569675922394, -0.000183936208486557, -0.00017622672021389008, -0.00016851723194122314, -0.0001608077436685562, -0.00015309825539588928, -0.00014538876712322235, -0.00013767927885055542, -0.0001299697905778885, -0.00012226030230522156, -0.00011455081403255463, -0.0001068413257598877, -9.913183748722076e-05, -9.142234921455383e-05, -8.37128609418869e-05, -7.600337266921997e-05, -6.829388439655304e-05, -6.058439612388611e-05, -5.287490785121918e-05, -4.5165419578552246e-05, -3.7455931305885315e-05, -2.9746443033218384e-05, -2.2036954760551453e-05, -1.4327466487884521e-05, -6.61797821521759e-06, 1.0915100574493408e-06, 8.800998330116272e-06, 1.6510486602783203e-05, 2.4219974875450134e-05, 3.1929463148117065e-05, 3.9638951420783997e-05, 4.734843969345093e-05, 5.505792796611786e-05, 6.276741623878479e-05, 7.047690451145172e-05, 7.818639278411865e-05, 8.589588105678558e-05, 9.360536932945251e-05, 0.00010131485760211945, 0.00010902434587478638, 0.00011673383414745331, 0.00012444332242012024, 0.00013215281069278717, 0.0001398622989654541, 0.00014757178723812103, 0.00015528127551078796, 0.0001629907637834549, 0.00017070025205612183, 0.00017840974032878876, 0.0001861192286014557, 0.00019382871687412262, 0.00020153820514678955, 0.00020924769341945648, 0.0002169571816921234, 0.00022466666996479034, 0.00023237615823745728, 0.0002400856465101242, 0.00024779513478279114, 0.00025550462305545807, 0.000263214111328125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 6.0, 13.0, 15.0, 14.0, 45.0, 46.0, 81.0, 91.0, 128.0, 189.0, 316.0, 472.0, 632.0, 1068.0, 1532.0, 2289.0, 3603.0, 5483.0, 8440.0, 12560.0, 18484.0, 26839.0, 37626.0, 50201.0, 64501.0, 78421.0, 90693.0, 98203.0, 99412.0, 93861.0, 84990.0, 71152.0, 56532.0, 43031.0, 31211.0, 21970.0, 14866.0, 10036.0, 6736.0, 4317.0, 2824.0, 1830.0, 1264.0, 852.0, 539.0, 374.0, 260.0, 156.0, 120.0, 75.0, 59.0, 39.0, 31.0, 16.0, 5.0, 8.0, 5.0, 2.0, 4.0, 2.0], "bins": [-2.095703125, -2.030670166015625, -1.96563720703125, -1.900604248046875, -1.8355712890625, -1.770538330078125, -1.70550537109375, -1.640472412109375, -1.575439453125, -1.510406494140625, -1.44537353515625, -1.380340576171875, -1.3153076171875, -1.250274658203125, -1.18524169921875, -1.120208740234375, -1.05517578125, -0.990142822265625, -0.92510986328125, -0.860076904296875, -0.7950439453125, -0.730010986328125, -0.66497802734375, -0.599945068359375, -0.534912109375, -0.469879150390625, -0.40484619140625, -0.339813232421875, -0.2747802734375, -0.209747314453125, -0.14471435546875, -0.079681396484375, -0.0146484375, 0.050384521484375, 0.11541748046875, 0.180450439453125, 0.2454833984375, 0.310516357421875, 0.37554931640625, 0.440582275390625, 0.505615234375, 0.570648193359375, 0.63568115234375, 0.700714111328125, 0.7657470703125, 0.830780029296875, 0.89581298828125, 0.960845947265625, 1.02587890625, 1.090911865234375, 1.15594482421875, 1.220977783203125, 1.2860107421875, 1.351043701171875, 1.41607666015625, 1.481109619140625, 1.546142578125, 1.611175537109375, 1.67620849609375, 1.741241455078125, 1.8062744140625, 1.871307373046875, 1.93634033203125, 2.001373291015625, 2.06640625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 10.0, 13.0, 10.0, 13.0, 14.0, 8.0, 12.0, 23.0, 15.0, 26.0, 24.0, 27.0, 39.0, 36.0, 36.0, 46.0, 52.0, 46.0, 54.0, 42.0, 48.0, 31.0, 30.0, 42.0, 38.0, 44.0, 35.0, 22.0, 26.0, 21.0, 27.0, 17.0, 13.0, 12.0, 11.0, 12.0, 3.0, 2.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.0884246826171875, -1.049896240234375, -1.0113677978515625, -0.97283935546875, -0.9343109130859375, -0.895782470703125, -0.8572540283203125, -0.8187255859375, -0.7801971435546875, -0.741668701171875, -0.7031402587890625, -0.66461181640625, -0.6260833740234375, -0.587554931640625, -0.5490264892578125, -0.510498046875, -0.4719696044921875, -0.433441162109375, -0.3949127197265625, -0.35638427734375, -0.3178558349609375, -0.279327392578125, -0.2407989501953125, -0.2022705078125, -0.1637420654296875, -0.125213623046875, -0.0866851806640625, -0.04815673828125, -0.0096282958984375, 0.028900146484375, 0.0674285888671875, 0.10595703125, 0.1444854736328125, 0.183013916015625, 0.2215423583984375, 0.26007080078125, 0.2985992431640625, 0.337127685546875, 0.3756561279296875, 0.4141845703125, 0.4527130126953125, 0.491241455078125, 0.5297698974609375, 0.56829833984375, 0.6068267822265625, 0.645355224609375, 0.6838836669921875, 0.722412109375, 0.7609405517578125, 0.799468994140625, 0.8379974365234375, 0.87652587890625, 0.9150543212890625, 0.953582763671875, 0.9921112060546875, 1.0306396484375, 1.0691680908203125, 1.107696533203125, 1.1462249755859375, 1.18475341796875, 1.2232818603515625, 1.261810302734375, 1.3003387451171875, 1.3388671875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 10.0, 11.0, 20.0, 15.0, 14.0, 15.0, 30.0, 32.0, 38.0, 36.0, 39.0, 39.0, 54.0, 52.0, 47.0, 43.0, 39.0, 55.0, 43.0, 35.0, 36.0, 28.0, 34.0, 28.0, 29.0, 32.0, 25.0, 22.0, 18.0, 14.0, 8.0, 5.0, 11.0, 13.0, 8.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.715560913085938, -12.352931022644043, -11.990301132202148, -11.627670288085938, -11.265040397644043, -10.902410507202148, -10.539780616760254, -10.17715072631836, -9.814519882202148, -9.451889991760254, -9.08926010131836, -8.726629257202148, -8.363999366760254, -8.00136947631836, -7.638739585876465, -7.27610969543457, -6.913479804992676, -6.550849914550781, -6.1882195472717285, -5.825589656829834, -5.462959289550781, -5.100329399108887, -4.737699508666992, -4.375069618225098, -4.012439250946045, -3.6498091220855713, -3.2871789932250977, -2.924549102783203, -2.5619189739227295, -2.199288845062256, -1.8366589546203613, -1.4740288257598877, -1.1113977432250977, -0.7487676739692688, -0.38613760471343994, -0.02350759506225586, 0.3391225337982178, 0.7017526626586914, 1.064382553100586, 1.4270126819610596, 1.7896428108215332, 2.152272939682007, 2.5149030685424805, 2.877532958984375, 3.2401630878448486, 3.6027932167053223, 3.965423107147217, 4.3280534744262695, 4.690683364868164, 5.053313255310059, 5.415943622589111, 5.778573513031006, 6.141203880310059, 6.503833770751953, 6.866463661193848, 7.229093551635742, 7.591723918914795, 7.9543538093566895, 8.316984176635742, 8.679614067077637, 9.042243957519531, 9.404874801635742, 9.76750373840332, 10.130134582519531, 10.492764472961426]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 9.0, 3.0, 10.0, 6.0, 7.0, 6.0, 11.0, 14.0, 12.0, 13.0, 17.0, 16.0, 17.0, 19.0, 23.0, 33.0, 30.0, 33.0, 41.0, 31.0, 44.0, 43.0, 38.0, 35.0, 34.0, 36.0, 31.0, 43.0, 45.0, 24.0, 41.0, 34.0, 35.0, 23.0, 16.0, 23.0, 17.0, 9.0, 16.0, 6.0, 10.0, 11.0, 7.0, 12.0, 7.0, 1.0, 6.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-15.29019546508789, -14.823490142822266, -14.356783866882324, -13.890077590942383, -13.423372268676758, -12.956666946411133, -12.489960670471191, -12.02325439453125, -11.556549072265625, -11.08984375, -10.623137474060059, -10.156431198120117, -9.689725875854492, -9.223020553588867, -8.756314277648926, -8.289608001708984, -7.822902679443359, -7.356196880340576, -6.889491081237793, -6.42278528213501, -5.956079483032227, -5.489373683929443, -5.02266788482666, -4.555962085723877, -4.089256286621094, -3.6225504875183105, -3.1558446884155273, -2.689138889312744, -2.222433090209961, -1.7557272911071777, -1.2890214920043945, -0.8223156929016113, -0.3556089401245117, 0.11109685897827148, 0.5778026580810547, 1.044508457183838, 1.511214256286621, 1.9779200553894043, 2.4446258544921875, 2.9113316535949707, 3.378037452697754, 3.844743251800537, 4.31144905090332, 4.7781548500061035, 5.244860649108887, 5.71156644821167, 6.178272247314453, 6.644978046417236, 7.1116838455200195, 7.578389644622803, 8.045095443725586, 8.511800765991211, 8.978507041931152, 9.445213317871094, 9.911918640136719, 10.378623962402344, 10.845330238342285, 11.312036514282227, 11.778741836547852, 12.245447158813477, 12.712153434753418, 13.17885971069336, 13.645565032958984, 14.11227035522461, 14.57897663116455]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 11.0, 29.0, 36.0, 65.0, 142.0, 193.0, 301.0, 509.0, 806.0, 1265.0, 1979.0, 3272.0, 5028.0, 7823.0, 12502.0, 19039.0, 28899.0, 43132.0, 63437.0, 90254.0, 127202.0, 171571.0, 223740.0, 280121.0, 331583.0, 371452.0, 388341.0, 385499.0, 357012.0, 312229.0, 258733.0, 204162.0, 154178.0, 111811.0, 79888.0, 54393.0, 36663.0, 24112.0, 15805.0, 10106.0, 6448.0, 3988.0, 2533.0, 1519.0, 969.0, 592.0, 352.0, 222.0, 143.0, 85.0, 41.0, 35.0, 11.0, 10.0, 10.0, 6.0, 1.0, 4.0], "bins": [-8.9296875, -8.657470703125, -8.38525390625, -8.113037109375, -7.8408203125, -7.568603515625, -7.29638671875, -7.024169921875, -6.751953125, -6.479736328125, -6.20751953125, -5.935302734375, -5.6630859375, -5.390869140625, -5.11865234375, -4.846435546875, -4.57421875, -4.302001953125, -4.02978515625, -3.757568359375, -3.4853515625, -3.213134765625, -2.94091796875, -2.668701171875, -2.396484375, -2.124267578125, -1.85205078125, -1.579833984375, -1.3076171875, -1.035400390625, -0.76318359375, -0.490966796875, -0.21875, 0.053466796875, 0.32568359375, 0.597900390625, 0.8701171875, 1.142333984375, 1.41455078125, 1.686767578125, 1.958984375, 2.231201171875, 2.50341796875, 2.775634765625, 3.0478515625, 3.320068359375, 3.59228515625, 3.864501953125, 4.13671875, 4.408935546875, 4.68115234375, 4.953369140625, 5.2255859375, 5.497802734375, 5.77001953125, 6.042236328125, 6.314453125, 6.586669921875, 6.85888671875, 7.131103515625, 7.4033203125, 7.675537109375, 7.94775390625, 8.219970703125, 8.4921875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 11.0, 7.0, 11.0, 13.0, 17.0, 13.0, 19.0, 8.0, 17.0, 25.0, 21.0, 16.0, 42.0, 29.0, 31.0, 29.0, 28.0, 45.0, 37.0, 48.0, 43.0, 41.0, 41.0, 32.0, 38.0, 32.0, 27.0, 37.0, 28.0, 28.0, 27.0, 24.0, 12.0, 11.0, 16.0, 12.0, 10.0, 8.0, 13.0, 8.0, 4.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-13.0, -12.5941162109375, -12.188232421875, -11.7823486328125, -11.37646484375, -10.9705810546875, -10.564697265625, -10.1588134765625, -9.7529296875, -9.3470458984375, -8.941162109375, -8.5352783203125, -8.12939453125, -7.7235107421875, -7.317626953125, -6.9117431640625, -6.505859375, -6.0999755859375, -5.694091796875, -5.2882080078125, -4.88232421875, -4.4764404296875, -4.070556640625, -3.6646728515625, -3.2587890625, -2.8529052734375, -2.447021484375, -2.0411376953125, -1.63525390625, -1.2293701171875, -0.823486328125, -0.4176025390625, -0.01171875, 0.3941650390625, 0.800048828125, 1.2059326171875, 1.61181640625, 2.0177001953125, 2.423583984375, 2.8294677734375, 3.2353515625, 3.6412353515625, 4.047119140625, 4.4530029296875, 4.85888671875, 5.2647705078125, 5.670654296875, 6.0765380859375, 6.482421875, 6.8883056640625, 7.294189453125, 7.7000732421875, 8.10595703125, 8.5118408203125, 8.917724609375, 9.3236083984375, 9.7294921875, 10.1353759765625, 10.541259765625, 10.9471435546875, 11.35302734375, 11.7589111328125, 12.164794921875, 12.5706787109375, 12.9765625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 5.0, 8.0, 25.0, 36.0, 44.0, 83.0, 186.0, 293.0, 593.0, 971.0, 1684.0, 3001.0, 4894.0, 8164.0, 13512.0, 22238.0, 36169.0, 56136.0, 84596.0, 124043.0, 173420.0, 233267.0, 293663.0, 352287.0, 395229.0, 412496.0, 405891.0, 372511.0, 319331.0, 258365.0, 197040.0, 144177.0, 100294.0, 66998.0, 43488.0, 27296.0, 16993.0, 10091.0, 6176.0, 3546.0, 2204.0, 1182.0, 715.0, 401.0, 219.0, 142.0, 78.0, 41.0, 26.0, 18.0, 11.0, 6.0, 5.0, 1.0, 2.0], "bins": [-10.8046875, -10.493408203125, -10.18212890625, -9.870849609375, -9.5595703125, -9.248291015625, -8.93701171875, -8.625732421875, -8.314453125, -8.003173828125, -7.69189453125, -7.380615234375, -7.0693359375, -6.758056640625, -6.44677734375, -6.135498046875, -5.82421875, -5.512939453125, -5.20166015625, -4.890380859375, -4.5791015625, -4.267822265625, -3.95654296875, -3.645263671875, -3.333984375, -3.022705078125, -2.71142578125, -2.400146484375, -2.0888671875, -1.777587890625, -1.46630859375, -1.155029296875, -0.84375, -0.532470703125, -0.22119140625, 0.090087890625, 0.4013671875, 0.712646484375, 1.02392578125, 1.335205078125, 1.646484375, 1.957763671875, 2.26904296875, 2.580322265625, 2.8916015625, 3.202880859375, 3.51416015625, 3.825439453125, 4.13671875, 4.447998046875, 4.75927734375, 5.070556640625, 5.3818359375, 5.693115234375, 6.00439453125, 6.315673828125, 6.626953125, 6.938232421875, 7.24951171875, 7.560791015625, 7.8720703125, 8.183349609375, 8.49462890625, 8.805908203125, 9.1171875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 12.0, 5.0, 18.0, 23.0, 16.0, 18.0, 28.0, 36.0, 44.0, 57.0, 79.0, 93.0, 99.0, 110.0, 122.0, 142.0, 153.0, 180.0, 174.0, 189.0, 171.0, 222.0, 204.0, 202.0, 192.0, 202.0, 193.0, 183.0, 138.0, 130.0, 117.0, 113.0, 86.0, 64.0, 52.0, 42.0, 41.0, 33.0, 18.0, 15.0, 17.0, 13.0, 11.0, 7.0, 1.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.63104248046875, -5.4222412109375, -5.21343994140625, -5.004638671875, -4.79583740234375, -4.5870361328125, -4.37823486328125, -4.16943359375, -3.96063232421875, -3.7518310546875, -3.54302978515625, -3.334228515625, -3.12542724609375, -2.9166259765625, -2.70782470703125, -2.4990234375, -2.29022216796875, -2.0814208984375, -1.87261962890625, -1.663818359375, -1.45501708984375, -1.2462158203125, -1.03741455078125, -0.82861328125, -0.61981201171875, -0.4110107421875, -0.20220947265625, 0.006591796875, 0.21539306640625, 0.4241943359375, 0.63299560546875, 0.841796875, 1.05059814453125, 1.2593994140625, 1.46820068359375, 1.677001953125, 1.88580322265625, 2.0946044921875, 2.30340576171875, 2.51220703125, 2.72100830078125, 2.9298095703125, 3.13861083984375, 3.347412109375, 3.55621337890625, 3.7650146484375, 3.97381591796875, 4.1826171875, 4.39141845703125, 4.6002197265625, 4.80902099609375, 5.017822265625, 5.22662353515625, 5.4354248046875, 5.64422607421875, 5.85302734375, 6.06182861328125, 6.2706298828125, 6.47943115234375, 6.688232421875, 6.89703369140625, 7.1058349609375, 7.31463623046875, 7.5234375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 6.0, 5.0, 5.0, 15.0, 18.0, 18.0, 20.0, 14.0, 15.0, 24.0, 31.0, 28.0, 32.0, 64.0, 36.0, 45.0, 59.0, 50.0, 60.0, 44.0, 39.0, 49.0, 44.0, 50.0, 32.0, 36.0, 26.0, 27.0, 16.0, 19.0, 17.0, 18.0, 8.0, 7.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.104876518249512, -14.599799156188965, -14.094720840454102, -13.589643478393555, -13.084566116333008, -12.579488754272461, -12.074411392211914, -11.56933307647705, -11.064255714416504, -10.559178352355957, -10.054100036621094, -9.549022674560547, -9.0439453125, -8.538867950439453, -8.033790588378906, -7.528712272644043, -7.023634910583496, -6.518557548522949, -6.013479709625244, -5.508401870727539, -5.003324508666992, -4.498247146606445, -3.9931693077087402, -3.4880917072296143, -2.9830141067504883, -2.4779365062713623, -1.9728589057922363, -1.4677813053131104, -0.9627037048339844, -0.4576261043548584, 0.04745149612426758, 0.5525290966033936, 1.0576057434082031, 1.562683343887329, 2.067760944366455, 2.572838544845581, 3.077916145324707, 3.582993745803833, 4.088071346282959, 4.593149185180664, 5.098226547241211, 5.603303909301758, 6.108381748199463, 6.613459587097168, 7.118536949157715, 7.623614311218262, 8.128692626953125, 8.633769989013672, 9.138847351074219, 9.643924713134766, 10.149002075195312, 10.654080390930176, 11.159157752990723, 11.66423511505127, 12.169313430786133, 12.67439079284668, 13.179468154907227, 13.684545516967773, 14.18962287902832, 14.694701194763184, 15.19977855682373, 15.704855918884277, 16.20993423461914, 16.715011596679688, 17.220088958740234]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 8.0, 5.0, 7.0, 11.0, 13.0, 16.0, 14.0, 17.0, 14.0, 17.0, 23.0, 33.0, 26.0, 33.0, 36.0, 35.0, 39.0, 40.0, 28.0, 35.0, 38.0, 38.0, 37.0, 38.0, 43.0, 27.0, 42.0, 37.0, 37.0, 26.0, 38.0, 20.0, 19.0, 16.0, 18.0, 9.0, 8.0, 9.0, 9.0, 4.0, 9.0, 8.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-19.51291847229004, -18.950393676757812, -18.387868881225586, -17.82534408569336, -17.262821197509766, -16.70029640197754, -16.137771606445312, -15.575246810913086, -15.01272201538086, -14.450197219848633, -13.887672424316406, -13.325148582458496, -12.76262378692627, -12.200098991394043, -11.637575149536133, -11.075050354003906, -10.51252555847168, -9.950000762939453, -9.387475967407227, -8.824952125549316, -8.26242733001709, -7.699902534484863, -7.137378215789795, -6.574853897094727, -6.0123291015625, -5.449804306030273, -4.887279987335205, -4.324755668640137, -3.76223087310791, -3.1997063159942627, -2.6371817588806152, -2.0746572017669678, -1.5121326446533203, -0.9496080875396729, -0.3870835304260254, 0.17544102668762207, 0.7379655838012695, 1.300490140914917, 1.8630146980285645, 2.425539255142212, 2.9880638122558594, 3.550588369369507, 4.113112926483154, 4.675637245178223, 5.238162040710449, 5.800686836242676, 6.363211154937744, 6.9257354736328125, 7.488260269165039, 8.050785064697266, 8.613309860229492, 9.175833702087402, 9.738358497619629, 10.300883293151855, 10.863407135009766, 11.425931930541992, 11.988456726074219, 12.550981521606445, 13.113506317138672, 13.676030158996582, 14.238554954528809, 14.801079750061035, 15.363603591918945, 15.926128387451172, 16.4886531829834]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 4.0, 10.0, 15.0, 11.0, 27.0, 50.0, 80.0, 132.0, 174.0, 244.0, 448.0, 698.0, 1200.0, 2033.0, 3467.0, 5940.0, 10527.0, 18757.0, 35177.0, 68784.0, 143086.0, 280489.0, 240670.0, 114493.0, 56007.0, 28951.0, 15738.0, 8791.0, 5023.0, 3016.0, 1749.0, 1034.0, 659.0, 384.0, 231.0, 157.0, 97.0, 66.0, 54.0, 30.0, 23.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.91192626953125, -3.7808837890625, -3.64984130859375, -3.518798828125, -3.38775634765625, -3.2567138671875, -3.12567138671875, -2.99462890625, -2.86358642578125, -2.7325439453125, -2.60150146484375, -2.470458984375, -2.33941650390625, -2.2083740234375, -2.07733154296875, -1.9462890625, -1.81524658203125, -1.6842041015625, -1.55316162109375, -1.422119140625, -1.29107666015625, -1.1600341796875, -1.02899169921875, -0.89794921875, -0.76690673828125, -0.6358642578125, -0.50482177734375, -0.373779296875, -0.24273681640625, -0.1116943359375, 0.01934814453125, 0.150390625, 0.28143310546875, 0.4124755859375, 0.54351806640625, 0.674560546875, 0.80560302734375, 0.9366455078125, 1.06768798828125, 1.19873046875, 1.32977294921875, 1.4608154296875, 1.59185791015625, 1.722900390625, 1.85394287109375, 1.9849853515625, 2.11602783203125, 2.2470703125, 2.37811279296875, 2.5091552734375, 2.64019775390625, 2.771240234375, 2.90228271484375, 3.0333251953125, 3.16436767578125, 3.29541015625, 3.42645263671875, 3.5574951171875, 3.68853759765625, 3.819580078125, 3.95062255859375, 4.0816650390625, 4.21270751953125, 4.34375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 10.0, 13.0, 17.0, 17.0, 14.0, 15.0, 24.0, 21.0, 21.0, 25.0, 32.0, 28.0, 41.0, 46.0, 34.0, 45.0, 25.0, 43.0, 27.0, 39.0, 35.0, 55.0, 41.0, 46.0, 30.0, 27.0, 23.0, 31.0, 27.0, 23.0, 19.0, 18.0, 15.0, 20.0, 2.0, 7.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-20.515625, -19.914794921875, -19.31396484375, -18.713134765625, -18.1123046875, -17.511474609375, -16.91064453125, -16.309814453125, -15.708984375, -15.108154296875, -14.50732421875, -13.906494140625, -13.3056640625, -12.704833984375, -12.10400390625, -11.503173828125, -10.90234375, -10.301513671875, -9.70068359375, -9.099853515625, -8.4990234375, -7.898193359375, -7.29736328125, -6.696533203125, -6.095703125, -5.494873046875, -4.89404296875, -4.293212890625, -3.6923828125, -3.091552734375, -2.49072265625, -1.889892578125, -1.2890625, -0.688232421875, -0.08740234375, 0.513427734375, 1.1142578125, 1.715087890625, 2.31591796875, 2.916748046875, 3.517578125, 4.118408203125, 4.71923828125, 5.320068359375, 5.9208984375, 6.521728515625, 7.12255859375, 7.723388671875, 8.32421875, 8.925048828125, 9.52587890625, 10.126708984375, 10.7275390625, 11.328369140625, 11.92919921875, 12.530029296875, 13.130859375, 13.731689453125, 14.33251953125, 14.933349609375, 15.5341796875, 16.135009765625, 16.73583984375, 17.336669921875, 17.9375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 7.0, 11.0, 18.0, 10.0, 17.0, 23.0, 25.0, 41.0, 45.0, 66.0, 82.0, 120.0, 149.0, 194.0, 266.0, 372.0, 503.0, 729.0, 1128.0, 1855.0, 3268.0, 6796.0, 16035.0, 45178.0, 896421.0, 44195.0, 15609.0, 6631.0, 3186.0, 1796.0, 1091.0, 760.0, 517.0, 356.0, 257.0, 185.0, 129.0, 108.0, 93.0, 58.0, 48.0, 30.0, 32.0, 18.0, 21.0, 19.0, 11.0, 7.0, 8.0, 10.0, 3.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-10.03125, -9.712646484375, -9.39404296875, -9.075439453125, -8.7568359375, -8.438232421875, -8.11962890625, -7.801025390625, -7.482421875, -7.163818359375, -6.84521484375, -6.526611328125, -6.2080078125, -5.889404296875, -5.57080078125, -5.252197265625, -4.93359375, -4.614990234375, -4.29638671875, -3.977783203125, -3.6591796875, -3.340576171875, -3.02197265625, -2.703369140625, -2.384765625, -2.066162109375, -1.74755859375, -1.428955078125, -1.1103515625, -0.791748046875, -0.47314453125, -0.154541015625, 0.1640625, 0.482666015625, 0.80126953125, 1.119873046875, 1.4384765625, 1.757080078125, 2.07568359375, 2.394287109375, 2.712890625, 3.031494140625, 3.35009765625, 3.668701171875, 3.9873046875, 4.305908203125, 4.62451171875, 4.943115234375, 5.26171875, 5.580322265625, 5.89892578125, 6.217529296875, 6.5361328125, 6.854736328125, 7.17333984375, 7.491943359375, 7.810546875, 8.129150390625, 8.44775390625, 8.766357421875, 9.0849609375, 9.403564453125, 9.72216796875, 10.040771484375, 10.359375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 4.0, 6.0, 9.0, 19.0, 12.0, 12.0, 26.0, 30.0, 14.0, 24.0, 20.0, 36.0, 39.0, 27.0, 35.0, 30.0, 38.0, 28.0, 30.0, 48.0, 31.0, 33.0, 35.0, 35.0, 35.0, 37.0, 42.0, 23.0, 30.0, 18.0, 21.0, 22.0, 26.0, 16.0, 17.0, 16.0, 8.0, 6.0, 8.0, 6.0, 7.0, 2.0, 2.0, 3.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-11.3046875, -10.9471435546875, -10.589599609375, -10.2320556640625, -9.87451171875, -9.5169677734375, -9.159423828125, -8.8018798828125, -8.4443359375, -8.0867919921875, -7.729248046875, -7.3717041015625, -7.01416015625, -6.6566162109375, -6.299072265625, -5.9415283203125, -5.583984375, -5.2264404296875, -4.868896484375, -4.5113525390625, -4.15380859375, -3.7962646484375, -3.438720703125, -3.0811767578125, -2.7236328125, -2.3660888671875, -2.008544921875, -1.6510009765625, -1.29345703125, -0.9359130859375, -0.578369140625, -0.2208251953125, 0.13671875, 0.4942626953125, 0.851806640625, 1.2093505859375, 1.56689453125, 1.9244384765625, 2.281982421875, 2.6395263671875, 2.9970703125, 3.3546142578125, 3.712158203125, 4.0697021484375, 4.42724609375, 4.7847900390625, 5.142333984375, 5.4998779296875, 5.857421875, 6.2149658203125, 6.572509765625, 6.9300537109375, 7.28759765625, 7.6451416015625, 8.002685546875, 8.3602294921875, 8.7177734375, 9.0753173828125, 9.432861328125, 9.7904052734375, 10.14794921875, 10.5054931640625, 10.863037109375, 11.2205810546875, 11.578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 2.0, 12.0, 5.0, 11.0, 18.0, 19.0, 24.0, 43.0, 44.0, 59.0, 73.0, 113.0, 169.0, 248.0, 316.0, 498.0, 796.0, 1252.0, 2358.0, 5138.0, 14367.0, 70633.0, 917193.0, 20956.0, 6881.0, 3043.0, 1532.0, 894.0, 602.0, 338.0, 249.0, 187.0, 127.0, 88.0, 74.0, 56.0, 33.0, 31.0, 17.0, 14.0, 11.0, 9.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.9453125, -0.917633056640625, -0.88995361328125, -0.862274169921875, -0.8345947265625, -0.806915283203125, -0.77923583984375, -0.751556396484375, -0.723876953125, -0.696197509765625, -0.66851806640625, -0.640838623046875, -0.6131591796875, -0.585479736328125, -0.55780029296875, -0.530120849609375, -0.50244140625, -0.474761962890625, -0.44708251953125, -0.419403076171875, -0.3917236328125, -0.364044189453125, -0.33636474609375, -0.308685302734375, -0.281005859375, -0.253326416015625, -0.22564697265625, -0.197967529296875, -0.1702880859375, -0.142608642578125, -0.11492919921875, -0.087249755859375, -0.0595703125, -0.031890869140625, -0.00421142578125, 0.023468017578125, 0.0511474609375, 0.078826904296875, 0.10650634765625, 0.134185791015625, 0.161865234375, 0.189544677734375, 0.21722412109375, 0.244903564453125, 0.2725830078125, 0.300262451171875, 0.32794189453125, 0.355621337890625, 0.38330078125, 0.410980224609375, 0.43865966796875, 0.466339111328125, 0.4940185546875, 0.521697998046875, 0.54937744140625, 0.577056884765625, 0.604736328125, 0.632415771484375, 0.66009521484375, 0.687774658203125, 0.7154541015625, 0.743133544921875, 0.77081298828125, 0.798492431640625, 0.826171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 11.0, 3.0, 1.0, 9.0, 9.0, 11.0, 14.0, 19.0, 14.0, 20.0, 23.0, 17.0, 27.0, 37.0, 30.0, 37.0, 31.0, 38.0, 34.0, 33.0, 52.0, 47.0, 37.0, 31.0, 33.0, 48.0, 27.0, 42.0, 35.0, 27.0, 33.0, 24.0, 19.0, 20.0, 16.0, 14.0, 21.0, 7.0, 13.0, 11.0, 2.0, 10.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.106231689453125e-06, -7.871538400650024e-06, -7.636845111846924e-06, -7.402151823043823e-06, -7.167458534240723e-06, -6.932765245437622e-06, -6.6980719566345215e-06, -6.463378667831421e-06, -6.22868537902832e-06, -5.99399209022522e-06, -5.759298801422119e-06, -5.5246055126190186e-06, -5.289912223815918e-06, -5.055218935012817e-06, -4.820525646209717e-06, -4.585832357406616e-06, -4.351139068603516e-06, -4.116445779800415e-06, -3.8817524909973145e-06, -3.647059202194214e-06, -3.4123659133911133e-06, -3.1776726245880127e-06, -2.942979335784912e-06, -2.7082860469818115e-06, -2.473592758178711e-06, -2.2388994693756104e-06, -2.0042061805725098e-06, -1.7695128917694092e-06, -1.5348196029663086e-06, -1.300126314163208e-06, -1.0654330253601074e-06, -8.307397365570068e-07, -5.960464477539062e-07, -3.6135315895080566e-07, -1.2665987014770508e-07, 1.0803341865539551e-07, 3.427267074584961e-07, 5.774199962615967e-07, 8.121132850646973e-07, 1.0468065738677979e-06, 1.2814998626708984e-06, 1.516193151473999e-06, 1.7508864402770996e-06, 1.9855797290802e-06, 2.2202730178833008e-06, 2.4549663066864014e-06, 2.689659595489502e-06, 2.9243528842926025e-06, 3.159046173095703e-06, 3.3937394618988037e-06, 3.6284327507019043e-06, 3.863126039505005e-06, 4.0978193283081055e-06, 4.332512617111206e-06, 4.567205905914307e-06, 4.801899194717407e-06, 5.036592483520508e-06, 5.271285772323608e-06, 5.505979061126709e-06, 5.7406723499298096e-06, 5.97536563873291e-06, 6.210058927536011e-06, 6.444752216339111e-06, 6.679445505142212e-06, 6.9141387939453125e-06]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 11.0, 14.0, 19.0, 34.0, 53.0, 75.0, 108.0, 176.0, 210.0, 300.0, 439.0, 660.0, 970.0, 1447.0, 2167.0, 3136.0, 4752.0, 6838.0, 10245.0, 15181.0, 22889.0, 35139.0, 56136.0, 95160.0, 188817.0, 260858.0, 135202.0, 74707.0, 45800.0, 28927.0, 19163.0, 12581.0, 8525.0, 5750.0, 3877.0, 2564.0, 1860.0, 1219.0, 840.0, 591.0, 350.0, 228.0, 190.0, 112.0, 70.0, 54.0, 32.0, 20.0, 21.0, 19.0, 11.0, 3.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2978515625, -0.2876777648925781, -0.27750396728515625, -0.2673301696777344, -0.2571563720703125, -0.24698257446289062, -0.23680877685546875, -0.22663497924804688, -0.216461181640625, -0.20628738403320312, -0.19611358642578125, -0.18593978881835938, -0.1757659912109375, -0.16559219360351562, -0.15541839599609375, -0.14524459838867188, -0.13507080078125, -0.12489700317382812, -0.11472320556640625, -0.10454940795898438, -0.0943756103515625, -0.08420181274414062, -0.07402801513671875, -0.06385421752929688, -0.053680419921875, -0.043506622314453125, -0.03333282470703125, -0.023159027099609375, -0.0129852294921875, -0.002811431884765625, 0.00736236572265625, 0.017536163330078125, 0.0277099609375, 0.037883758544921875, 0.04805755615234375, 0.058231353759765625, 0.0684051513671875, 0.07857894897460938, 0.08875274658203125, 0.09892654418945312, 0.109100341796875, 0.11927413940429688, 0.12944793701171875, 0.13962173461914062, 0.1497955322265625, 0.15996932983398438, 0.17014312744140625, 0.18031692504882812, 0.19049072265625, 0.20066452026367188, 0.21083831787109375, 0.22101211547851562, 0.2311859130859375, 0.24135971069335938, 0.25153350830078125, 0.2617073059082031, 0.271881103515625, 0.2820549011230469, 0.29222869873046875, 0.3024024963378906, 0.3125762939453125, 0.3227500915527344, 0.33292388916015625, 0.3430976867675781, 0.353271484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 6.0, 5.0, 9.0, 5.0, 13.0, 7.0, 10.0, 16.0, 16.0, 19.0, 28.0, 43.0, 56.0, 49.0, 53.0, 71.0, 60.0, 65.0, 61.0, 65.0, 56.0, 43.0, 45.0, 42.0, 25.0, 21.0, 20.0, 8.0, 13.0, 9.0, 7.0, 13.0, 7.0, 4.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.2215576171875, -0.21425819396972656, -0.20695877075195312, -0.1996593475341797, -0.19235992431640625, -0.1850605010986328, -0.17776107788085938, -0.17046165466308594, -0.1631622314453125, -0.15586280822753906, -0.14856338500976562, -0.1412639617919922, -0.13396453857421875, -0.1266651153564453, -0.11936569213867188, -0.11206626892089844, -0.104766845703125, -0.09746742248535156, -0.09016799926757812, -0.08286857604980469, -0.07556915283203125, -0.06826972961425781, -0.060970306396484375, -0.05367088317871094, -0.0463714599609375, -0.03907203674316406, -0.031772613525390625, -0.024473190307617188, -0.01717376708984375, -0.009874343872070312, -0.002574920654296875, 0.0047245025634765625, 0.01202392578125, 0.019323348999023438, 0.026622772216796875, 0.03392219543457031, 0.04122161865234375, 0.04852104187011719, 0.055820465087890625, 0.06311988830566406, 0.0704193115234375, 0.07771873474121094, 0.08501815795898438, 0.09231758117675781, 0.09961700439453125, 0.10691642761230469, 0.11421585083007812, 0.12151527404785156, 0.128814697265625, 0.13611412048339844, 0.14341354370117188, 0.1507129669189453, 0.15801239013671875, 0.1653118133544922, 0.17261123657226562, 0.17991065979003906, 0.1872100830078125, 0.19450950622558594, 0.20180892944335938, 0.2091083526611328, 0.21640777587890625, 0.2237071990966797, 0.23100662231445312, 0.23830604553222656, 0.24560546875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 4.0, 5.0, 4.0, 10.0, 23.0, 14.0, 18.0, 15.0, 19.0, 18.0, 31.0, 28.0, 35.0, 55.0, 45.0, 44.0, 48.0, 62.0, 57.0, 49.0, 35.0, 51.0, 42.0, 45.0, 43.0, 36.0, 27.0, 27.0, 17.0, 19.0, 18.0, 18.0, 9.0, 6.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.551993370056152, -15.039097785949707, -14.526201248168945, -14.0133056640625, -13.500410079956055, -12.98751449584961, -12.474618911743164, -11.961722373962402, -11.448826789855957, -10.935931205749512, -10.42303466796875, -9.910139083862305, -9.39724349975586, -8.884347915649414, -8.371452331542969, -7.858555793762207, -7.345660209655762, -6.832764625549316, -6.319868564605713, -5.806972503662109, -5.294076919555664, -4.781181335449219, -4.268285274505615, -3.755389451980591, -3.2424936294555664, -2.729597806930542, -2.2167019844055176, -1.7038061618804932, -1.1909103393554688, -0.6780145168304443, -0.16511869430541992, 0.3477771282196045, 0.8606719970703125, 1.373567819595337, 1.8864636421203613, 2.3993594646453857, 2.91225528717041, 3.4251511096954346, 3.938046932220459, 4.4509429931640625, 4.963838577270508, 5.476734161376953, 5.989630222320557, 6.50252628326416, 7.0154218673706055, 7.528317451477051, 8.041213989257812, 8.554109573364258, 9.067005157470703, 9.579900741577148, 10.092796325683594, 10.605692863464355, 11.1185884475708, 11.631484031677246, 12.144380569458008, 12.657276153564453, 13.170171737670898, 13.683067321777344, 14.195962905883789, 14.70885944366455, 15.221755027770996, 15.734650611877441, 16.247547149658203, 16.76044273376465, 17.273338317871094]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 5.0, 9.0, 10.0, 11.0, 18.0, 13.0, 19.0, 15.0, 14.0, 27.0, 30.0, 30.0, 33.0, 36.0, 34.0, 40.0, 34.0, 33.0, 35.0, 37.0, 36.0, 36.0, 41.0, 40.0, 30.0, 47.0, 35.0, 35.0, 29.0, 31.0, 21.0, 22.0, 13.0, 18.0, 9.0, 7.0, 10.0, 9.0, 4.0, 9.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-19.511669158935547, -18.949382781982422, -18.387096405029297, -17.824811935424805, -17.26252555847168, -16.700239181518555, -16.137954711914062, -15.575668334960938, -15.013381958007812, -14.451095581054688, -13.888810157775879, -13.32652473449707, -12.764238357543945, -12.20195198059082, -11.639666557312012, -11.077381134033203, -10.515094757080078, -9.952808380126953, -9.390522956848145, -8.828237533569336, -8.265951156616211, -7.703665256500244, -7.141379356384277, -6.5790934562683105, -6.016807556152344, -5.454521656036377, -4.89223575592041, -4.329949855804443, -3.7676639556884766, -3.2053780555725098, -2.643092155456543, -2.080806255340576, -1.5185222625732422, -0.9562363624572754, -0.3939504623413086, 0.1683354377746582, 0.730621337890625, 1.2929072380065918, 1.8551931381225586, 2.4174790382385254, 2.979764938354492, 3.542050838470459, 4.104336738586426, 4.666622638702393, 5.228908538818359, 5.791194438934326, 6.353480339050293, 6.91576623916626, 7.478052139282227, 8.040338516235352, 8.60262393951416, 9.164909362792969, 9.727195739746094, 10.289482116699219, 10.851767539978027, 11.414052963256836, 11.976339340209961, 12.538625717163086, 13.100911140441895, 13.663196563720703, 14.225482940673828, 14.787769317626953, 15.350054740905762, 15.91234016418457, 16.474626541137695]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 7.0, 18.0, 21.0, 55.0, 84.0, 118.0, 195.0, 278.0, 466.0, 753.0, 1197.0, 1852.0, 2924.0, 4713.0, 7094.0, 10872.0, 16573.0, 24077.0, 34274.0, 46794.0, 61726.0, 77122.0, 90926.0, 100445.0, 102600.0, 99030.0, 88611.0, 73698.0, 58790.0, 45339.0, 32033.0, 22334.0, 15197.0, 9968.0, 6653.0, 4269.0, 2679.0, 1759.0, 1077.0, 736.0, 442.0, 298.0, 176.0, 112.0, 61.0, 48.0, 24.0, 18.0, 10.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.9127197265625, -6.692626953125, -6.4725341796875, -6.25244140625, -6.0323486328125, -5.812255859375, -5.5921630859375, -5.3720703125, -5.1519775390625, -4.931884765625, -4.7117919921875, -4.49169921875, -4.2716064453125, -4.051513671875, -3.8314208984375, -3.611328125, -3.3912353515625, -3.171142578125, -2.9510498046875, -2.73095703125, -2.5108642578125, -2.290771484375, -2.0706787109375, -1.8505859375, -1.6304931640625, -1.410400390625, -1.1903076171875, -0.97021484375, -0.7501220703125, -0.530029296875, -0.3099365234375, -0.08984375, 0.1302490234375, 0.350341796875, 0.5704345703125, 0.79052734375, 1.0106201171875, 1.230712890625, 1.4508056640625, 1.6708984375, 1.8909912109375, 2.111083984375, 2.3311767578125, 2.55126953125, 2.7713623046875, 2.991455078125, 3.2115478515625, 3.431640625, 3.6517333984375, 3.871826171875, 4.0919189453125, 4.31201171875, 4.5321044921875, 4.752197265625, 4.9722900390625, 5.1923828125, 5.4124755859375, 5.632568359375, 5.8526611328125, 6.07275390625, 6.2928466796875, 6.512939453125, 6.7330322265625, 6.953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 3.0, 11.0, 6.0, 15.0, 19.0, 9.0, 13.0, 24.0, 15.0, 27.0, 29.0, 26.0, 39.0, 39.0, 36.0, 46.0, 41.0, 32.0, 35.0, 42.0, 57.0, 48.0, 34.0, 30.0, 33.0, 31.0, 38.0, 29.0, 31.0, 16.0, 30.0, 26.0, 8.0, 17.0, 9.0, 7.0, 10.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.375, -18.775390625, -18.17578125, -17.576171875, -16.9765625, -16.376953125, -15.77734375, -15.177734375, -14.578125, -13.978515625, -13.37890625, -12.779296875, -12.1796875, -11.580078125, -10.98046875, -10.380859375, -9.78125, -9.181640625, -8.58203125, -7.982421875, -7.3828125, -6.783203125, -6.18359375, -5.583984375, -4.984375, -4.384765625, -3.78515625, -3.185546875, -2.5859375, -1.986328125, -1.38671875, -0.787109375, -0.1875, 0.412109375, 1.01171875, 1.611328125, 2.2109375, 2.810546875, 3.41015625, 4.009765625, 4.609375, 5.208984375, 5.80859375, 6.408203125, 7.0078125, 7.607421875, 8.20703125, 8.806640625, 9.40625, 10.005859375, 10.60546875, 11.205078125, 11.8046875, 12.404296875, 13.00390625, 13.603515625, 14.203125, 14.802734375, 15.40234375, 16.001953125, 16.6015625, 17.201171875, 17.80078125, 18.400390625, 19.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 20.0, 23.0, 40.0, 66.0, 118.0, 193.0, 300.0, 475.0, 713.0, 1273.0, 1976.0, 3249.0, 5237.0, 8080.0, 12460.0, 18667.0, 27733.0, 39658.0, 53738.0, 70659.0, 86808.0, 99279.0, 106576.0, 105660.0, 96854.0, 82927.0, 66250.0, 49872.0, 36345.0, 25341.0, 17162.0, 11298.0, 7202.0, 4651.0, 2846.0, 1799.0, 1141.0, 735.0, 420.0, 252.0, 174.0, 104.0, 61.0, 44.0, 24.0, 14.0, 12.0, 7.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.6796875, -7.43878173828125, -7.1978759765625, -6.95697021484375, -6.716064453125, -6.47515869140625, -6.2342529296875, -5.99334716796875, -5.75244140625, -5.51153564453125, -5.2706298828125, -5.02972412109375, -4.788818359375, -4.54791259765625, -4.3070068359375, -4.06610107421875, -3.8251953125, -3.58428955078125, -3.3433837890625, -3.10247802734375, -2.861572265625, -2.62066650390625, -2.3797607421875, -2.13885498046875, -1.89794921875, -1.65704345703125, -1.4161376953125, -1.17523193359375, -0.934326171875, -0.69342041015625, -0.4525146484375, -0.21160888671875, 0.029296875, 0.27020263671875, 0.5111083984375, 0.75201416015625, 0.992919921875, 1.23382568359375, 1.4747314453125, 1.71563720703125, 1.95654296875, 2.19744873046875, 2.4383544921875, 2.67926025390625, 2.920166015625, 3.16107177734375, 3.4019775390625, 3.64288330078125, 3.8837890625, 4.12469482421875, 4.3656005859375, 4.60650634765625, 4.847412109375, 5.08831787109375, 5.3292236328125, 5.57012939453125, 5.81103515625, 6.05194091796875, 6.2928466796875, 6.53375244140625, 6.774658203125, 7.01556396484375, 7.2564697265625, 7.49737548828125, 7.73828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 6.0, 6.0, 13.0, 14.0, 21.0, 20.0, 18.0, 25.0, 18.0, 30.0, 36.0, 25.0, 41.0, 46.0, 38.0, 40.0, 51.0, 38.0, 42.0, 33.0, 37.0, 34.0, 28.0, 34.0, 35.0, 38.0, 36.0, 34.0, 20.0, 13.0, 15.0, 15.0, 18.0, 15.0, 8.0, 12.0, 7.0, 8.0, 4.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.8046875, -11.427001953125, -11.04931640625, -10.671630859375, -10.2939453125, -9.916259765625, -9.53857421875, -9.160888671875, -8.783203125, -8.405517578125, -8.02783203125, -7.650146484375, -7.2724609375, -6.894775390625, -6.51708984375, -6.139404296875, -5.76171875, -5.384033203125, -5.00634765625, -4.628662109375, -4.2509765625, -3.873291015625, -3.49560546875, -3.117919921875, -2.740234375, -2.362548828125, -1.98486328125, -1.607177734375, -1.2294921875, -0.851806640625, -0.47412109375, -0.096435546875, 0.28125, 0.658935546875, 1.03662109375, 1.414306640625, 1.7919921875, 2.169677734375, 2.54736328125, 2.925048828125, 3.302734375, 3.680419921875, 4.05810546875, 4.435791015625, 4.8134765625, 5.191162109375, 5.56884765625, 5.946533203125, 6.32421875, 6.701904296875, 7.07958984375, 7.457275390625, 7.8349609375, 8.212646484375, 8.59033203125, 8.968017578125, 9.345703125, 9.723388671875, 10.10107421875, 10.478759765625, 10.8564453125, 11.234130859375, 11.61181640625, 11.989501953125, 12.3671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 13.0, 14.0, 26.0, 35.0, 52.0, 65.0, 118.0, 179.0, 289.0, 443.0, 661.0, 1108.0, 1871.0, 2948.0, 4843.0, 7638.0, 12146.0, 18729.0, 27966.0, 39569.0, 53501.0, 69558.0, 84578.0, 97543.0, 103852.0, 103154.0, 96350.0, 83738.0, 69031.0, 53419.0, 38505.0, 26887.0, 18047.0, 11873.0, 7473.0, 4700.0, 2857.0, 1722.0, 1144.0, 729.0, 413.0, 266.0, 192.0, 101.0, 78.0, 42.0, 33.0, 15.0, 13.0, 12.0, 4.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.580078125, -2.49676513671875, -2.4134521484375, -2.33013916015625, -2.246826171875, -2.16351318359375, -2.0802001953125, -1.99688720703125, -1.91357421875, -1.83026123046875, -1.7469482421875, -1.66363525390625, -1.580322265625, -1.49700927734375, -1.4136962890625, -1.33038330078125, -1.2470703125, -1.16375732421875, -1.0804443359375, -0.99713134765625, -0.913818359375, -0.83050537109375, -0.7471923828125, -0.66387939453125, -0.58056640625, -0.49725341796875, -0.4139404296875, -0.33062744140625, -0.247314453125, -0.16400146484375, -0.0806884765625, 0.00262451171875, 0.0859375, 0.16925048828125, 0.2525634765625, 0.33587646484375, 0.419189453125, 0.50250244140625, 0.5858154296875, 0.66912841796875, 0.75244140625, 0.83575439453125, 0.9190673828125, 1.00238037109375, 1.085693359375, 1.16900634765625, 1.2523193359375, 1.33563232421875, 1.4189453125, 1.50225830078125, 1.5855712890625, 1.66888427734375, 1.752197265625, 1.83551025390625, 1.9188232421875, 2.00213623046875, 2.08544921875, 2.16876220703125, 2.2520751953125, 2.33538818359375, 2.418701171875, 2.50201416015625, 2.5853271484375, 2.66864013671875, 2.751953125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 15.0, 10.0, 16.0, 14.0, 28.0, 26.0, 29.0, 39.0, 25.0, 28.0, 28.0, 26.0, 34.0, 31.0, 45.0, 47.0, 35.0, 34.0, 31.0, 36.0, 41.0, 41.0, 38.0, 41.0, 37.0, 28.0, 25.0, 25.0, 19.0, 14.0, 10.0, 8.0, 8.0, 9.0, 13.0, 8.0, 6.0, 12.0, 5.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-0.000308990478515625, -0.0002996101975440979, -0.0002902299165725708, -0.0002808496356010437, -0.0002714693546295166, -0.0002620890736579895, -0.0002527087926864624, -0.0002433285117149353, -0.0002339482307434082, -0.0002245679497718811, -0.000215187668800354, -0.0002058073878288269, -0.0001964271068572998, -0.0001870468258857727, -0.0001776665449142456, -0.0001682862639427185, -0.0001589059829711914, -0.0001495257019996643, -0.0001401454210281372, -0.0001307651400566101, -0.00012138485908508301, -0.00011200457811355591, -0.00010262429714202881, -9.324401617050171e-05, -8.386373519897461e-05, -7.448345422744751e-05, -6.510317325592041e-05, -5.572289228439331e-05, -4.634261131286621e-05, -3.696233034133911e-05, -2.7582049369812012e-05, -1.8201768398284912e-05, -8.821487426757812e-06, 5.587935447692871e-07, 9.939074516296387e-06, 1.9319355487823486e-05, 2.8699636459350586e-05, 3.8079917430877686e-05, 4.7460198402404785e-05, 5.6840479373931885e-05, 6.622076034545898e-05, 7.560104131698608e-05, 8.498132228851318e-05, 9.436160326004028e-05, 0.00010374188423156738, 0.00011312216520309448, 0.00012250244617462158, 0.00013188272714614868, 0.00014126300811767578, 0.00015064328908920288, 0.00016002357006072998, 0.00016940385103225708, 0.00017878413200378418, 0.00018816441297531128, 0.00019754469394683838, 0.00020692497491836548, 0.00021630525588989258, 0.00022568553686141968, 0.00023506581783294678, 0.0002444460988044739, 0.000253826379776001, 0.0002632066607475281, 0.0002725869417190552, 0.0002819672226905823, 0.0002913475036621094]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 7.0, 16.0, 13.0, 28.0, 47.0, 73.0, 126.0, 208.0, 371.0, 704.0, 1299.0, 2467.0, 4702.0, 9260.0, 17897.0, 33171.0, 57640.0, 92139.0, 128476.0, 154918.0, 157320.0, 137190.0, 101653.0, 66173.0, 38210.0, 21265.0, 11030.0, 5561.0, 2980.0, 1623.0, 851.0, 442.0, 301.0, 159.0, 99.0, 50.0, 36.0, 16.0, 15.0, 8.0, 5.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.61859130859375, -4.4832763671875, -4.34796142578125, -4.212646484375, -4.07733154296875, -3.9420166015625, -3.80670166015625, -3.67138671875, -3.53607177734375, -3.4007568359375, -3.26544189453125, -3.130126953125, -2.99481201171875, -2.8594970703125, -2.72418212890625, -2.5888671875, -2.45355224609375, -2.3182373046875, -2.18292236328125, -2.047607421875, -1.91229248046875, -1.7769775390625, -1.64166259765625, -1.50634765625, -1.37103271484375, -1.2357177734375, -1.10040283203125, -0.965087890625, -0.82977294921875, -0.6944580078125, -0.55914306640625, -0.423828125, -0.28851318359375, -0.1531982421875, -0.01788330078125, 0.117431640625, 0.25274658203125, 0.3880615234375, 0.52337646484375, 0.65869140625, 0.79400634765625, 0.9293212890625, 1.06463623046875, 1.199951171875, 1.33526611328125, 1.4705810546875, 1.60589599609375, 1.7412109375, 1.87652587890625, 2.0118408203125, 2.14715576171875, 2.282470703125, 2.41778564453125, 2.5531005859375, 2.68841552734375, 2.82373046875, 2.95904541015625, 3.0943603515625, 3.22967529296875, 3.364990234375, 3.50030517578125, 3.6356201171875, 3.77093505859375, 3.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 11.0, 9.0, 4.0, 8.0, 17.0, 11.0, 17.0, 20.0, 25.0, 16.0, 28.0, 31.0, 43.0, 28.0, 32.0, 51.0, 43.0, 45.0, 41.0, 46.0, 34.0, 37.0, 35.0, 33.0, 38.0, 30.0, 40.0, 30.0, 32.0, 18.0, 20.0, 19.0, 20.0, 15.0, 15.0, 16.0, 3.0, 13.0, 3.0, 6.0, 4.0, 2.0, 0.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.306640625, -1.266998291015625, -1.22735595703125, -1.187713623046875, -1.1480712890625, -1.108428955078125, -1.06878662109375, -1.029144287109375, -0.989501953125, -0.949859619140625, -0.91021728515625, -0.870574951171875, -0.8309326171875, -0.791290283203125, -0.75164794921875, -0.712005615234375, -0.67236328125, -0.632720947265625, -0.59307861328125, -0.553436279296875, -0.5137939453125, -0.474151611328125, -0.43450927734375, -0.394866943359375, -0.355224609375, -0.315582275390625, -0.27593994140625, -0.236297607421875, -0.1966552734375, -0.157012939453125, -0.11737060546875, -0.077728271484375, -0.0380859375, 0.001556396484375, 0.04119873046875, 0.080841064453125, 0.1204833984375, 0.160125732421875, 0.19976806640625, 0.239410400390625, 0.279052734375, 0.318695068359375, 0.35833740234375, 0.397979736328125, 0.4376220703125, 0.477264404296875, 0.51690673828125, 0.556549072265625, 0.59619140625, 0.635833740234375, 0.67547607421875, 0.715118408203125, 0.7547607421875, 0.794403076171875, 0.83404541015625, 0.873687744140625, 0.913330078125, 0.952972412109375, 0.99261474609375, 1.032257080078125, 1.0718994140625, 1.111541748046875, 1.15118408203125, 1.190826416015625, 1.23046875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 5.0, 7.0, 8.0, 11.0, 16.0, 15.0, 17.0, 16.0, 26.0, 24.0, 33.0, 31.0, 45.0, 48.0, 56.0, 52.0, 54.0, 62.0, 52.0, 50.0, 42.0, 53.0, 44.0, 31.0, 44.0, 40.0, 22.0, 20.0, 19.0, 16.0, 10.0, 14.0, 8.0, 3.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.918413162231445, -16.36451530456543, -15.81061840057373, -15.256721496582031, -14.702824592590332, -14.148927688598633, -13.595029830932617, -13.041132926940918, -12.487236022949219, -11.93333911895752, -11.379441261291504, -10.825544357299805, -10.271647453308105, -9.717750549316406, -9.16385269165039, -8.609955787658691, -8.056057929992676, -7.502160549163818, -6.948263645172119, -6.394366264343262, -5.8404693603515625, -5.286571979522705, -4.732674598693848, -4.178777694702148, -3.624880313873291, -3.0709831714630127, -2.5170860290527344, -1.963188648223877, -1.4092915058135986, -0.8553943634033203, -0.3014969825744629, 0.25240015983581543, 0.8062973022460938, 1.360194444656372, 1.91409170627594, 2.467988967895508, 3.021886110305786, 3.5757832527160645, 4.129680633544922, 4.683577537536621, 5.2374749183654785, 5.791372299194336, 6.345269203186035, 6.899166584014893, 7.45306396484375, 8.00696086883545, 8.560857772827148, 9.114755630493164, 9.668652534484863, 10.222549438476562, 10.776447296142578, 11.330344200134277, 11.884241104125977, 12.438138961791992, 12.992035865783691, 13.54593276977539, 14.099830627441406, 14.653727531433105, 15.207625389099121, 15.76152229309082, 16.315420150756836, 16.86931610107422, 17.423213958740234, 17.97711181640625, 18.531007766723633]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 5.0, 6.0, 12.0, 10.0, 18.0, 16.0, 15.0, 16.0, 15.0, 17.0, 18.0, 29.0, 37.0, 43.0, 33.0, 37.0, 37.0, 36.0, 34.0, 47.0, 43.0, 47.0, 37.0, 27.0, 40.0, 42.0, 35.0, 43.0, 30.0, 23.0, 23.0, 13.0, 14.0, 15.0, 12.0, 12.0, 12.0, 10.0, 9.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-21.1395320892334, -20.482078552246094, -19.824623107910156, -19.16716957092285, -18.509716033935547, -17.852262496948242, -17.194808959960938, -16.537353515625, -15.879899978637695, -15.22244644165039, -14.56499195098877, -13.907537460327148, -13.250083923339844, -12.592630386352539, -11.935175895690918, -11.277721405029297, -10.620267868041992, -9.962814331054688, -9.305359840393066, -8.647905349731445, -7.990451812744141, -7.332997798919678, -6.675543785095215, -6.018089771270752, -5.360635757446289, -4.703181743621826, -4.045727729797363, -3.3882737159729004, -2.7308197021484375, -2.0733656883239746, -1.4159116744995117, -0.7584576606750488, -0.10100364685058594, 0.556450366973877, 1.2139043807983398, 1.8713583946228027, 2.5288124084472656, 3.1862664222717285, 3.8437204360961914, 4.501174449920654, 5.158628463745117, 5.81608247756958, 6.473536491394043, 7.130990505218506, 7.788444519042969, 8.445898056030273, 9.103352546691895, 9.760807037353516, 10.41826057434082, 11.075714111328125, 11.733168601989746, 12.390623092651367, 13.048076629638672, 13.705530166625977, 14.362984657287598, 15.020439147949219, 15.677892684936523, 16.335346221923828, 16.992801666259766, 17.65025520324707, 18.307708740234375, 18.96516227722168, 19.622615814208984, 20.280071258544922, 20.937524795532227]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 27.0, 27.0, 55.0, 86.0, 133.0, 235.0, 339.0, 579.0, 895.0, 1434.0, 2330.0, 3736.0, 5669.0, 9027.0, 13783.0, 21994.0, 33594.0, 50828.0, 76109.0, 111081.0, 156787.0, 214106.0, 275785.0, 337144.0, 386609.0, 415719.0, 412167.0, 382265.0, 329188.0, 269554.0, 207396.0, 152803.0, 107590.0, 74575.0, 49834.0, 32484.0, 21207.0, 13598.0, 8784.0, 5456.0, 3430.0, 2185.0, 1409.0, 869.0, 515.0, 321.0, 201.0, 128.0, 76.0, 61.0, 27.0, 23.0, 11.0, 5.0, 3.0, 3.0, 2.0], "bins": [-12.71875, -12.332763671875, -11.94677734375, -11.560791015625, -11.1748046875, -10.788818359375, -10.40283203125, -10.016845703125, -9.630859375, -9.244873046875, -8.85888671875, -8.472900390625, -8.0869140625, -7.700927734375, -7.31494140625, -6.928955078125, -6.54296875, -6.156982421875, -5.77099609375, -5.385009765625, -4.9990234375, -4.613037109375, -4.22705078125, -3.841064453125, -3.455078125, -3.069091796875, -2.68310546875, -2.297119140625, -1.9111328125, -1.525146484375, -1.13916015625, -0.753173828125, -0.3671875, 0.018798828125, 0.40478515625, 0.790771484375, 1.1767578125, 1.562744140625, 1.94873046875, 2.334716796875, 2.720703125, 3.106689453125, 3.49267578125, 3.878662109375, 4.2646484375, 4.650634765625, 5.03662109375, 5.422607421875, 5.80859375, 6.194580078125, 6.58056640625, 6.966552734375, 7.3525390625, 7.738525390625, 8.12451171875, 8.510498046875, 8.896484375, 9.282470703125, 9.66845703125, 10.054443359375, 10.4404296875, 10.826416015625, 11.21240234375, 11.598388671875, 11.984375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 8.0, 19.0, 14.0, 14.0, 17.0, 14.0, 17.0, 22.0, 28.0, 24.0, 38.0, 41.0, 34.0, 32.0, 44.0, 36.0, 25.0, 42.0, 65.0, 44.0, 36.0, 36.0, 43.0, 35.0, 24.0, 42.0, 28.0, 23.0, 26.0, 16.0, 14.0, 15.0, 15.0, 12.0, 5.0, 7.0, 9.0, 7.0, 9.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.546875, -18.935791015625, -18.32470703125, -17.713623046875, -17.1025390625, -16.491455078125, -15.88037109375, -15.269287109375, -14.658203125, -14.047119140625, -13.43603515625, -12.824951171875, -12.2138671875, -11.602783203125, -10.99169921875, -10.380615234375, -9.76953125, -9.158447265625, -8.54736328125, -7.936279296875, -7.3251953125, -6.714111328125, -6.10302734375, -5.491943359375, -4.880859375, -4.269775390625, -3.65869140625, -3.047607421875, -2.4365234375, -1.825439453125, -1.21435546875, -0.603271484375, 0.0078125, 0.618896484375, 1.22998046875, 1.841064453125, 2.4521484375, 3.063232421875, 3.67431640625, 4.285400390625, 4.896484375, 5.507568359375, 6.11865234375, 6.729736328125, 7.3408203125, 7.951904296875, 8.56298828125, 9.174072265625, 9.78515625, 10.396240234375, 11.00732421875, 11.618408203125, 12.2294921875, 12.840576171875, 13.45166015625, 14.062744140625, 14.673828125, 15.284912109375, 15.89599609375, 16.507080078125, 17.1181640625, 17.729248046875, 18.34033203125, 18.951416015625, 19.5625]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [4.0, 5.0, 7.0, 7.0, 19.0, 20.0, 39.0, 50.0, 81.0, 150.0, 223.0, 353.0, 576.0, 1038.0, 1639.0, 2604.0, 4261.0, 6663.0, 10715.0, 17382.0, 27021.0, 42725.0, 64296.0, 94821.0, 135919.0, 186175.0, 245868.0, 305640.0, 360754.0, 398701.0, 410971.0, 395941.0, 357058.0, 302744.0, 240142.0, 182225.0, 131810.0, 91975.0, 62160.0, 40586.0, 26470.0, 16905.0, 10426.0, 6383.0, 4155.0, 2548.0, 1544.0, 927.0, 600.0, 364.0, 234.0, 137.0, 83.0, 54.0, 34.0, 25.0, 16.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0], "bins": [-12.90625, -12.4825439453125, -12.058837890625, -11.6351318359375, -11.21142578125, -10.7877197265625, -10.364013671875, -9.9403076171875, -9.5166015625, -9.0928955078125, -8.669189453125, -8.2454833984375, -7.82177734375, -7.3980712890625, -6.974365234375, -6.5506591796875, -6.126953125, -5.7032470703125, -5.279541015625, -4.8558349609375, -4.43212890625, -4.0084228515625, -3.584716796875, -3.1610107421875, -2.7373046875, -2.3135986328125, -1.889892578125, -1.4661865234375, -1.04248046875, -0.6187744140625, -0.195068359375, 0.2286376953125, 0.65234375, 1.0760498046875, 1.499755859375, 1.9234619140625, 2.34716796875, 2.7708740234375, 3.194580078125, 3.6182861328125, 4.0419921875, 4.4656982421875, 4.889404296875, 5.3131103515625, 5.73681640625, 6.1605224609375, 6.584228515625, 7.0079345703125, 7.431640625, 7.8553466796875, 8.279052734375, 8.7027587890625, 9.12646484375, 9.5501708984375, 9.973876953125, 10.3975830078125, 10.8212890625, 11.2449951171875, 11.668701171875, 12.0924072265625, 12.51611328125, 12.9398193359375, 13.363525390625, 13.7872314453125, 14.2109375]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 8.0, 9.0, 12.0, 22.0, 26.0, 29.0, 36.0, 48.0, 58.0, 70.0, 91.0, 92.0, 118.0, 117.0, 141.0, 159.0, 151.0, 191.0, 176.0, 205.0, 213.0, 186.0, 206.0, 174.0, 180.0, 183.0, 161.0, 154.0, 151.0, 119.0, 105.0, 87.0, 61.0, 68.0, 53.0, 47.0, 38.0, 28.0, 22.0, 19.0, 14.0, 9.0, 11.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.890625, -8.6051025390625, -8.319580078125, -8.0340576171875, -7.74853515625, -7.4630126953125, -7.177490234375, -6.8919677734375, -6.6064453125, -6.3209228515625, -6.035400390625, -5.7498779296875, -5.46435546875, -5.1788330078125, -4.893310546875, -4.6077880859375, -4.322265625, -4.0367431640625, -3.751220703125, -3.4656982421875, -3.18017578125, -2.8946533203125, -2.609130859375, -2.3236083984375, -2.0380859375, -1.7525634765625, -1.467041015625, -1.1815185546875, -0.89599609375, -0.6104736328125, -0.324951171875, -0.0394287109375, 0.24609375, 0.5316162109375, 0.817138671875, 1.1026611328125, 1.38818359375, 1.6737060546875, 1.959228515625, 2.2447509765625, 2.5302734375, 2.8157958984375, 3.101318359375, 3.3868408203125, 3.67236328125, 3.9578857421875, 4.243408203125, 4.5289306640625, 4.814453125, 5.0999755859375, 5.385498046875, 5.6710205078125, 5.95654296875, 6.2420654296875, 6.527587890625, 6.8131103515625, 7.0986328125, 7.3841552734375, 7.669677734375, 7.9552001953125, 8.24072265625, 8.5262451171875, 8.811767578125, 9.0972900390625, 9.3828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 7.0, 2.0, 3.0, 0.0, 7.0, 7.0, 15.0, 10.0, 16.0, 20.0, 28.0, 26.0, 44.0, 58.0, 37.0, 45.0, 59.0, 65.0, 55.0, 74.0, 74.0, 51.0, 57.0, 46.0, 28.0, 38.0, 31.0, 29.0, 19.0, 20.0, 13.0, 6.0, 4.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.66039276123047, -21.780624389648438, -20.900856018066406, -20.021087646484375, -19.14131736755371, -18.26154899597168, -17.38178062438965, -16.502012252807617, -15.62224292755127, -14.742474555969238, -13.86270523071289, -12.98293685913086, -12.103168487548828, -11.22339916229248, -10.34363079071045, -9.463861465454102, -8.58409309387207, -7.704324245452881, -6.824555397033691, -5.94478702545166, -5.065018177032471, -4.185249328613281, -3.30548095703125, -2.4257121086120605, -1.545943260192871, -0.6661745309829712, 0.2135941982269287, 1.093362808227539, 1.9731316566467285, 2.852900505065918, 3.732668876647949, 4.612437725067139, 5.492206573486328, 6.371975421905518, 7.251744270324707, 8.131512641906738, 9.011281967163086, 9.891050338745117, 10.770818710327148, 11.65058708190918, 12.530356407165527, 13.410124778747559, 14.289894104003906, 15.169662475585938, 16.04943084716797, 16.92919921875, 17.80896759033203, 18.688737869262695, 19.568506240844727, 20.448274612426758, 21.32804298400879, 22.207813262939453, 23.087581634521484, 23.967350006103516, 24.847118377685547, 25.726886749267578, 26.60665512084961, 27.48642349243164, 28.366191864013672, 29.245960235595703, 30.125730514526367, 31.0054988861084, 31.88526725769043, 32.765037536621094, 33.644805908203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 6.0, 5.0, 9.0, 15.0, 12.0, 28.0, 15.0, 21.0, 31.0, 25.0, 34.0, 37.0, 51.0, 44.0, 44.0, 43.0, 51.0, 40.0, 31.0, 42.0, 39.0, 38.0, 44.0, 40.0, 33.0, 21.0, 25.0, 28.0, 25.0, 18.0, 17.0, 12.0, 12.0, 7.0, 13.0, 8.0, 10.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.026453018188477, -28.11346435546875, -27.20047378540039, -26.287485122680664, -25.374496459960938, -24.461505889892578, -23.54851722717285, -22.635528564453125, -21.722537994384766, -20.80954933166504, -19.89655876159668, -18.983570098876953, -18.070579528808594, -17.157590866088867, -16.24460220336914, -15.331612586975098, -14.418622970581055, -13.505633354187012, -12.592643737792969, -11.679655075073242, -10.7666654586792, -9.853675842285156, -8.94068717956543, -8.027697563171387, -7.114707946777344, -6.201718330383301, -5.288729190826416, -4.375740051269531, -3.4627504348754883, -2.5497608184814453, -1.6367716789245605, -0.7237825393676758, 0.1892070770263672, 1.102196455001831, 2.015185832977295, 2.928175210952759, 3.8411645889282227, 4.754154205322266, 5.66714334487915, 6.580132484436035, 7.493122100830078, 8.406111717224121, 9.319101333618164, 10.23208999633789, 11.145079612731934, 12.058069229125977, 12.971057891845703, 13.884047508239746, 14.797037124633789, 15.710026741027832, 16.623016357421875, 17.5360050201416, 18.448993682861328, 19.361984252929688, 20.274972915649414, 21.18796157836914, 22.1009521484375, 23.013940811157227, 23.926931381225586, 24.839920043945312, 25.752910614013672, 26.6658992767334, 27.578887939453125, 28.491878509521484, 29.40486717224121]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 5.0, 14.0, 10.0, 33.0, 36.0, 64.0, 91.0, 157.0, 291.0, 392.0, 738.0, 1354.0, 2366.0, 4535.0, 8809.0, 18383.0, 38822.0, 85523.0, 200660.0, 330987.0, 196268.0, 84095.0, 38018.0, 17851.0, 8999.0, 4539.0, 2365.0, 1318.0, 713.0, 429.0, 258.0, 149.0, 109.0, 56.0, 41.0, 24.0, 13.0, 12.0, 8.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.92578125, -5.7177734375, -5.509765625, -5.3017578125, -5.09375, -4.8857421875, -4.677734375, -4.4697265625, -4.26171875, -4.0537109375, -3.845703125, -3.6376953125, -3.4296875, -3.2216796875, -3.013671875, -2.8056640625, -2.59765625, -2.3896484375, -2.181640625, -1.9736328125, -1.765625, -1.5576171875, -1.349609375, -1.1416015625, -0.93359375, -0.7255859375, -0.517578125, -0.3095703125, -0.1015625, 0.1064453125, 0.314453125, 0.5224609375, 0.73046875, 0.9384765625, 1.146484375, 1.3544921875, 1.5625, 1.7705078125, 1.978515625, 2.1865234375, 2.39453125, 2.6025390625, 2.810546875, 3.0185546875, 3.2265625, 3.4345703125, 3.642578125, 3.8505859375, 4.05859375, 4.2666015625, 4.474609375, 4.6826171875, 4.890625, 5.0986328125, 5.306640625, 5.5146484375, 5.72265625, 5.9306640625, 6.138671875, 6.3466796875, 6.5546875, 6.7626953125, 6.970703125, 7.1787109375, 7.38671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 4.0, 11.0, 9.0, 13.0, 21.0, 20.0, 15.0, 25.0, 29.0, 39.0, 41.0, 32.0, 51.0, 45.0, 43.0, 47.0, 49.0, 56.0, 40.0, 40.0, 39.0, 40.0, 38.0, 39.0, 25.0, 32.0, 20.0, 25.0, 16.0, 18.0, 15.0, 10.0, 4.0, 11.0, 7.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.65625, -27.66015625, -26.6640625, -25.66796875, -24.671875, -23.67578125, -22.6796875, -21.68359375, -20.6875, -19.69140625, -18.6953125, -17.69921875, -16.703125, -15.70703125, -14.7109375, -13.71484375, -12.71875, -11.72265625, -10.7265625, -9.73046875, -8.734375, -7.73828125, -6.7421875, -5.74609375, -4.75, -3.75390625, -2.7578125, -1.76171875, -0.765625, 0.23046875, 1.2265625, 2.22265625, 3.21875, 4.21484375, 5.2109375, 6.20703125, 7.203125, 8.19921875, 9.1953125, 10.19140625, 11.1875, 12.18359375, 13.1796875, 14.17578125, 15.171875, 16.16796875, 17.1640625, 18.16015625, 19.15625, 20.15234375, 21.1484375, 22.14453125, 23.140625, 24.13671875, 25.1328125, 26.12890625, 27.125, 28.12109375, 29.1171875, 30.11328125, 31.109375, 32.10546875, 33.1015625, 34.09765625, 35.09375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 14.0, 6.0, 11.0, 18.0, 30.0, 35.0, 41.0, 76.0, 90.0, 128.0, 212.0, 297.0, 404.0, 655.0, 1067.0, 1953.0, 4041.0, 10747.0, 34159.0, 908940.0, 57737.0, 15903.0, 5827.0, 2534.0, 1252.0, 811.0, 501.0, 297.0, 243.0, 163.0, 109.0, 61.0, 45.0, 41.0, 24.0, 29.0, 14.0, 14.0, 8.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.953125, -16.400634765625, -15.84814453125, -15.295654296875, -14.7431640625, -14.190673828125, -13.63818359375, -13.085693359375, -12.533203125, -11.980712890625, -11.42822265625, -10.875732421875, -10.3232421875, -9.770751953125, -9.21826171875, -8.665771484375, -8.11328125, -7.560791015625, -7.00830078125, -6.455810546875, -5.9033203125, -5.350830078125, -4.79833984375, -4.245849609375, -3.693359375, -3.140869140625, -2.58837890625, -2.035888671875, -1.4833984375, -0.930908203125, -0.37841796875, 0.174072265625, 0.7265625, 1.279052734375, 1.83154296875, 2.384033203125, 2.9365234375, 3.489013671875, 4.04150390625, 4.593994140625, 5.146484375, 5.698974609375, 6.25146484375, 6.803955078125, 7.3564453125, 7.908935546875, 8.46142578125, 9.013916015625, 9.56640625, 10.118896484375, 10.67138671875, 11.223876953125, 11.7763671875, 12.328857421875, 12.88134765625, 13.433837890625, 13.986328125, 14.538818359375, 15.09130859375, 15.643798828125, 16.1962890625, 16.748779296875, 17.30126953125, 17.853759765625, 18.40625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 5.0, 12.0, 7.0, 21.0, 14.0, 16.0, 15.0, 21.0, 26.0, 23.0, 25.0, 34.0, 50.0, 35.0, 35.0, 34.0, 37.0, 40.0, 46.0, 41.0, 43.0, 44.0, 38.0, 45.0, 33.0, 31.0, 24.0, 31.0, 25.0, 20.0, 20.0, 16.0, 14.0, 11.0, 12.0, 3.0, 8.0, 7.0, 3.0, 2.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.109375, -18.535888671875, -17.96240234375, -17.388916015625, -16.8154296875, -16.241943359375, -15.66845703125, -15.094970703125, -14.521484375, -13.947998046875, -13.37451171875, -12.801025390625, -12.2275390625, -11.654052734375, -11.08056640625, -10.507080078125, -9.93359375, -9.360107421875, -8.78662109375, -8.213134765625, -7.6396484375, -7.066162109375, -6.49267578125, -5.919189453125, -5.345703125, -4.772216796875, -4.19873046875, -3.625244140625, -3.0517578125, -2.478271484375, -1.90478515625, -1.331298828125, -0.7578125, -0.184326171875, 0.38916015625, 0.962646484375, 1.5361328125, 2.109619140625, 2.68310546875, 3.256591796875, 3.830078125, 4.403564453125, 4.97705078125, 5.550537109375, 6.1240234375, 6.697509765625, 7.27099609375, 7.844482421875, 8.41796875, 8.991455078125, 9.56494140625, 10.138427734375, 10.7119140625, 11.285400390625, 11.85888671875, 12.432373046875, 13.005859375, 13.579345703125, 14.15283203125, 14.726318359375, 15.2998046875, 15.873291015625, 16.44677734375, 17.020263671875, 17.59375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 6.0, 17.0, 23.0, 38.0, 49.0, 78.0, 108.0, 164.0, 251.0, 408.0, 671.0, 1302.0, 2693.0, 7365.0, 30813.0, 958760.0, 32412.0, 7542.0, 2739.0, 1290.0, 646.0, 439.0, 241.0, 154.0, 109.0, 68.0, 47.0, 36.0, 20.0, 16.0, 13.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8692779541015625, -1.805938720703125, -1.7425994873046875, -1.67926025390625, -1.6159210205078125, -1.552581787109375, -1.4892425537109375, -1.4259033203125, -1.3625640869140625, -1.299224853515625, -1.2358856201171875, -1.17254638671875, -1.1092071533203125, -1.045867919921875, -0.9825286865234375, -0.919189453125, -0.8558502197265625, -0.792510986328125, -0.7291717529296875, -0.66583251953125, -0.6024932861328125, -0.539154052734375, -0.4758148193359375, -0.4124755859375, -0.3491363525390625, -0.285797119140625, -0.2224578857421875, -0.15911865234375, -0.0957794189453125, -0.032440185546875, 0.0308990478515625, 0.09423828125, 0.1575775146484375, 0.220916748046875, 0.2842559814453125, 0.34759521484375, 0.4109344482421875, 0.474273681640625, 0.5376129150390625, 0.6009521484375, 0.6642913818359375, 0.727630615234375, 0.7909698486328125, 0.85430908203125, 0.9176483154296875, 0.980987548828125, 1.0443267822265625, 1.107666015625, 1.1710052490234375, 1.234344482421875, 1.2976837158203125, 1.36102294921875, 1.4243621826171875, 1.487701416015625, 1.5510406494140625, 1.6143798828125, 1.6777191162109375, 1.741058349609375, 1.8043975830078125, 1.86773681640625, 1.9310760498046875, 1.994415283203125, 2.0577545166015625, 2.12109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 1.0, 7.0, 4.0, 9.0, 11.0, 12.0, 13.0, 21.0, 21.0, 26.0, 23.0, 18.0, 34.0, 35.0, 41.0, 38.0, 30.0, 39.0, 55.0, 46.0, 42.0, 49.0, 42.0, 52.0, 27.0, 37.0, 50.0, 26.0, 25.0, 35.0, 15.0, 24.0, 20.0, 16.0, 13.0, 9.0, 3.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0907649993896484e-05, -1.0503455996513367e-05, -1.0099261999130249e-05, -9.695068001747131e-06, -9.290874004364014e-06, -8.886680006980896e-06, -8.482486009597778e-06, -8.07829201221466e-06, -7.674098014831543e-06, -7.269904017448425e-06, -6.865710020065308e-06, -6.46151602268219e-06, -6.057322025299072e-06, -5.653128027915955e-06, -5.248934030532837e-06, -4.844740033149719e-06, -4.4405460357666016e-06, -4.036352038383484e-06, -3.632158041000366e-06, -3.2279640436172485e-06, -2.823770046234131e-06, -2.419576048851013e-06, -2.0153820514678955e-06, -1.6111880540847778e-06, -1.2069940567016602e-06, -8.028000593185425e-07, -3.986060619354248e-07, 5.587935447692871e-09, 4.0978193283081055e-07, 8.139759302139282e-07, 1.218169927597046e-06, 1.6223639249801636e-06, 2.0265579223632812e-06, 2.430751919746399e-06, 2.8349459171295166e-06, 3.2391399145126343e-06, 3.643333911895752e-06, 4.04752790927887e-06, 4.451721906661987e-06, 4.855915904045105e-06, 5.260109901428223e-06, 5.66430389881134e-06, 6.068497896194458e-06, 6.472691893577576e-06, 6.876885890960693e-06, 7.281079888343811e-06, 7.685273885726929e-06, 8.089467883110046e-06, 8.493661880493164e-06, 8.897855877876282e-06, 9.3020498752594e-06, 9.706243872642517e-06, 1.0110437870025635e-05, 1.0514631867408752e-05, 1.091882586479187e-05, 1.1323019862174988e-05, 1.1727213859558105e-05, 1.2131407856941223e-05, 1.253560185432434e-05, 1.2939795851707458e-05, 1.3343989849090576e-05, 1.3748183846473694e-05, 1.4152377843856812e-05, 1.455657184123993e-05, 1.4960765838623047e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 12.0, 14.0, 12.0, 18.0, 34.0, 62.0, 76.0, 124.0, 169.0, 258.0, 408.0, 671.0, 1028.0, 1660.0, 2609.0, 4364.0, 7133.0, 12060.0, 20257.0, 35169.0, 62056.0, 121143.0, 296710.0, 246361.0, 104182.0, 55029.0, 31197.0, 17981.0, 10832.0, 6400.0, 3961.0, 2474.0, 1488.0, 922.0, 606.0, 379.0, 226.0, 159.0, 97.0, 69.0, 52.0, 38.0, 19.0, 11.0, 9.0, 7.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.7084884643554688, -0.6830902099609375, -0.6576919555664062, -0.632293701171875, -0.6068954467773438, -0.5814971923828125, -0.5560989379882812, -0.53070068359375, -0.5053024291992188, -0.4799041748046875, -0.45450592041015625, -0.429107666015625, -0.40370941162109375, -0.3783111572265625, -0.35291290283203125, -0.3275146484375, -0.30211639404296875, -0.2767181396484375, -0.25131988525390625, -0.225921630859375, -0.20052337646484375, -0.1751251220703125, -0.14972686767578125, -0.12432861328125, -0.09893035888671875, -0.0735321044921875, -0.04813385009765625, -0.022735595703125, 0.00266265869140625, 0.0280609130859375, 0.05345916748046875, 0.078857421875, 0.10425567626953125, 0.1296539306640625, 0.15505218505859375, 0.180450439453125, 0.20584869384765625, 0.2312469482421875, 0.25664520263671875, 0.28204345703125, 0.30744171142578125, 0.3328399658203125, 0.35823822021484375, 0.383636474609375, 0.40903472900390625, 0.4344329833984375, 0.45983123779296875, 0.4852294921875, 0.5106277465820312, 0.5360260009765625, 0.5614242553710938, 0.586822509765625, 0.6122207641601562, 0.6376190185546875, 0.6630172729492188, 0.68841552734375, 0.7138137817382812, 0.7392120361328125, 0.7646102905273438, 0.790008544921875, 0.8154067993164062, 0.8408050537109375, 0.8662033081054688, 0.8916015625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 7.0, 11.0, 11.0, 10.0, 3.0, 17.0, 14.0, 22.0, 28.0, 21.0, 33.0, 31.0, 47.0, 62.0, 73.0, 93.0, 108.0, 67.0, 49.0, 47.0, 38.0, 35.0, 28.0, 36.0, 20.0, 10.0, 15.0, 11.0, 15.0, 10.0, 5.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5563545227050781, -0.5399551391601562, -0.5235557556152344, -0.5071563720703125, -0.4907569885253906, -0.47435760498046875, -0.4579582214355469, -0.441558837890625, -0.4251594543457031, -0.40876007080078125, -0.3923606872558594, -0.3759613037109375, -0.3595619201660156, -0.34316253662109375, -0.3267631530761719, -0.31036376953125, -0.2939643859863281, -0.27756500244140625, -0.2611656188964844, -0.2447662353515625, -0.22836685180664062, -0.21196746826171875, -0.19556808471679688, -0.179168701171875, -0.16276931762695312, -0.14636993408203125, -0.12997055053710938, -0.1135711669921875, -0.09717178344726562, -0.08077239990234375, -0.06437301635742188, -0.0479736328125, -0.031574249267578125, -0.01517486572265625, 0.001224517822265625, 0.0176239013671875, 0.034023284912109375, 0.05042266845703125, 0.06682205200195312, 0.083221435546875, 0.09962081909179688, 0.11602020263671875, 0.13241958618164062, 0.1488189697265625, 0.16521835327148438, 0.18161773681640625, 0.19801712036132812, 0.21441650390625, 0.23081588745117188, 0.24721527099609375, 0.2636146545410156, 0.2800140380859375, 0.2964134216308594, 0.31281280517578125, 0.3292121887207031, 0.345611572265625, 0.3620109558105469, 0.37841033935546875, 0.3948097229003906, 0.4112091064453125, 0.4276084899902344, 0.44400787353515625, 0.4604072570800781, 0.476806640625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 7.0, 10.0, 10.0, 14.0, 12.0, 23.0, 23.0, 36.0, 42.0, 55.0, 40.0, 40.0, 55.0, 69.0, 59.0, 73.0, 68.0, 53.0, 61.0, 46.0, 25.0, 36.0, 36.0, 25.0, 20.0, 19.0, 13.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.61943817138672, -21.743730545043945, -20.868022918701172, -19.9923152923584, -19.116607666015625, -18.24090003967285, -17.365192413330078, -16.489482879638672, -15.613776206970215, -14.738068580627441, -13.862360954284668, -12.986652374267578, -12.110944747924805, -11.235237121582031, -10.359529495239258, -9.483821868896484, -8.608114242553711, -7.7324066162109375, -6.856698989868164, -5.980990886688232, -5.105283260345459, -4.2295756340026855, -3.353867530822754, -2.4781599044799805, -1.602452278137207, -0.726744532585144, 0.14896321296691895, 1.0246710777282715, 1.900378704071045, 2.7760863304138184, 3.65179443359375, 4.527502059936523, 5.403209686279297, 6.27891731262207, 7.154624938964844, 8.030332565307617, 8.90604019165039, 9.781747817993164, 10.657456398010254, 11.533164024353027, 12.4088716506958, 13.284579277038574, 14.160286903381348, 15.035995483398438, 15.911703109741211, 16.787410736083984, 17.663118362426758, 18.53882598876953, 19.414533615112305, 20.290241241455078, 21.16594886779785, 22.041656494140625, 22.9173641204834, 23.793071746826172, 24.668781280517578, 25.54448699951172, 26.420196533203125, 27.2959041595459, 28.171611785888672, 29.047319412231445, 29.92302703857422, 30.798734664916992, 31.674442291259766, 32.55015182495117, 33.42585754394531]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 13.0, 15.0, 23.0, 17.0, 22.0, 32.0, 22.0, 36.0, 41.0, 52.0, 41.0, 47.0, 40.0, 51.0, 42.0, 29.0, 42.0, 40.0, 37.0, 44.0, 39.0, 32.0, 23.0, 22.0, 31.0, 24.0, 15.0, 20.0, 11.0, 12.0, 5.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.958463668823242, -28.042707443237305, -27.126949310302734, -26.211193084716797, -25.29543685913086, -24.379680633544922, -23.463924407958984, -22.548166275024414, -21.632410049438477, -20.71665382385254, -19.80089569091797, -18.88513946533203, -17.969383239746094, -17.053627014160156, -16.13787078857422, -15.222112655639648, -14.306356430053711, -13.390600204467773, -12.47484302520752, -11.559085845947266, -10.643329620361328, -9.72757339477539, -8.811816215515137, -7.896059513092041, -6.980302810668945, -6.06454610824585, -5.148789405822754, -4.233032703399658, -3.3172760009765625, -2.401519298553467, -1.485762596130371, -0.5700058937072754, 0.3457508087158203, 1.261507511138916, 2.1772642135620117, 3.0930209159851074, 4.008777618408203, 4.924534320831299, 5.8402910232543945, 6.75604772567749, 7.671804428100586, 8.587560653686523, 9.503317832946777, 10.419075012207031, 11.334831237792969, 12.250587463378906, 13.16634464263916, 14.082101821899414, 14.997858047485352, 15.913614273071289, 16.82937240600586, 17.745128631591797, 18.660884857177734, 19.576641082763672, 20.49239730834961, 21.40815544128418, 22.323911666870117, 23.239667892456055, 24.155426025390625, 25.071182250976562, 25.9869384765625, 26.902694702148438, 27.818450927734375, 28.734209060668945, 29.649965286254883]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 12.0, 23.0, 38.0, 57.0, 75.0, 126.0, 185.0, 290.0, 468.0, 769.0, 1252.0, 1994.0, 3403.0, 5371.0, 8938.0, 14558.0, 23449.0, 36726.0, 55191.0, 77583.0, 101754.0, 120099.0, 127628.0, 121902.0, 103575.0, 81029.0, 57551.0, 39197.0, 25162.0, 15713.0, 9449.0, 5744.0, 3543.0, 2182.0, 1316.0, 826.0, 487.0, 318.0, 192.0, 121.0, 92.0, 65.0, 34.0, 16.0, 17.0, 15.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.513916015625, -11.13720703125, -10.760498046875, -10.3837890625, -10.007080078125, -9.63037109375, -9.253662109375, -8.876953125, -8.500244140625, -8.12353515625, -7.746826171875, -7.3701171875, -6.993408203125, -6.61669921875, -6.239990234375, -5.86328125, -5.486572265625, -5.10986328125, -4.733154296875, -4.3564453125, -3.979736328125, -3.60302734375, -3.226318359375, -2.849609375, -2.472900390625, -2.09619140625, -1.719482421875, -1.3427734375, -0.966064453125, -0.58935546875, -0.212646484375, 0.1640625, 0.540771484375, 0.91748046875, 1.294189453125, 1.6708984375, 2.047607421875, 2.42431640625, 2.801025390625, 3.177734375, 3.554443359375, 3.93115234375, 4.307861328125, 4.6845703125, 5.061279296875, 5.43798828125, 5.814697265625, 6.19140625, 6.568115234375, 6.94482421875, 7.321533203125, 7.6982421875, 8.074951171875, 8.45166015625, 8.828369140625, 9.205078125, 9.581787109375, 9.95849609375, 10.335205078125, 10.7119140625, 11.088623046875, 11.46533203125, 11.842041015625, 12.21875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 7.0, 7.0, 11.0, 15.0, 18.0, 23.0, 21.0, 27.0, 32.0, 44.0, 39.0, 54.0, 43.0, 46.0, 50.0, 42.0, 40.0, 39.0, 40.0, 57.0, 35.0, 38.0, 36.0, 37.0, 28.0, 22.0, 28.0, 15.0, 18.0, 15.0, 9.0, 12.0, 8.0, 5.0, 7.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.875, -28.921142578125, -27.96728515625, -27.013427734375, -26.0595703125, -25.105712890625, -24.15185546875, -23.197998046875, -22.244140625, -21.290283203125, -20.33642578125, -19.382568359375, -18.4287109375, -17.474853515625, -16.52099609375, -15.567138671875, -14.61328125, -13.659423828125, -12.70556640625, -11.751708984375, -10.7978515625, -9.843994140625, -8.89013671875, -7.936279296875, -6.982421875, -6.028564453125, -5.07470703125, -4.120849609375, -3.1669921875, -2.213134765625, -1.25927734375, -0.305419921875, 0.6484375, 1.602294921875, 2.55615234375, 3.510009765625, 4.4638671875, 5.417724609375, 6.37158203125, 7.325439453125, 8.279296875, 9.233154296875, 10.18701171875, 11.140869140625, 12.0947265625, 13.048583984375, 14.00244140625, 14.956298828125, 15.91015625, 16.864013671875, 17.81787109375, 18.771728515625, 19.7255859375, 20.679443359375, 21.63330078125, 22.587158203125, 23.541015625, 24.494873046875, 25.44873046875, 26.402587890625, 27.3564453125, 28.310302734375, 29.26416015625, 30.218017578125, 31.171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 20.0, 16.0, 32.0, 32.0, 68.0, 100.0, 150.0, 227.0, 350.0, 515.0, 775.0, 1099.0, 1745.0, 2529.0, 3859.0, 5864.0, 9208.0, 13995.0, 21002.0, 30977.0, 45548.0, 64608.0, 85422.0, 104756.0, 117460.0, 119092.0, 108603.0, 89720.0, 68546.0, 50230.0, 34533.0, 23008.0, 15452.0, 10003.0, 6536.0, 4235.0, 2737.0, 1853.0, 1228.0, 823.0, 521.0, 373.0, 251.0, 141.0, 117.0, 75.0, 38.0, 26.0, 15.0, 11.0, 13.0, 11.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-12.75, -12.3402099609375, -11.930419921875, -11.5206298828125, -11.11083984375, -10.7010498046875, -10.291259765625, -9.8814697265625, -9.4716796875, -9.0618896484375, -8.652099609375, -8.2423095703125, -7.83251953125, -7.4227294921875, -7.012939453125, -6.6031494140625, -6.193359375, -5.7835693359375, -5.373779296875, -4.9639892578125, -4.55419921875, -4.1444091796875, -3.734619140625, -3.3248291015625, -2.9150390625, -2.5052490234375, -2.095458984375, -1.6856689453125, -1.27587890625, -0.8660888671875, -0.456298828125, -0.0465087890625, 0.36328125, 0.7730712890625, 1.182861328125, 1.5926513671875, 2.00244140625, 2.4122314453125, 2.822021484375, 3.2318115234375, 3.6416015625, 4.0513916015625, 4.461181640625, 4.8709716796875, 5.28076171875, 5.6905517578125, 6.100341796875, 6.5101318359375, 6.919921875, 7.3297119140625, 7.739501953125, 8.1492919921875, 8.55908203125, 8.9688720703125, 9.378662109375, 9.7884521484375, 10.1982421875, 10.6080322265625, 11.017822265625, 11.4276123046875, 11.83740234375, 12.2471923828125, 12.656982421875, 13.0667724609375, 13.4765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 8.0, 10.0, 1.0, 13.0, 19.0, 11.0, 15.0, 22.0, 31.0, 22.0, 27.0, 30.0, 38.0, 30.0, 43.0, 37.0, 39.0, 51.0, 44.0, 36.0, 45.0, 39.0, 38.0, 48.0, 36.0, 34.0, 37.0, 23.0, 24.0, 16.0, 18.0, 24.0, 18.0, 11.0, 15.0, 6.0, 14.0, 8.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -18.008544921875, -17.42333984375, -16.838134765625, -16.2529296875, -15.667724609375, -15.08251953125, -14.497314453125, -13.912109375, -13.326904296875, -12.74169921875, -12.156494140625, -11.5712890625, -10.986083984375, -10.40087890625, -9.815673828125, -9.23046875, -8.645263671875, -8.06005859375, -7.474853515625, -6.8896484375, -6.304443359375, -5.71923828125, -5.134033203125, -4.548828125, -3.963623046875, -3.37841796875, -2.793212890625, -2.2080078125, -1.622802734375, -1.03759765625, -0.452392578125, 0.1328125, 0.718017578125, 1.30322265625, 1.888427734375, 2.4736328125, 3.058837890625, 3.64404296875, 4.229248046875, 4.814453125, 5.399658203125, 5.98486328125, 6.570068359375, 7.1552734375, 7.740478515625, 8.32568359375, 8.910888671875, 9.49609375, 10.081298828125, 10.66650390625, 11.251708984375, 11.8369140625, 12.422119140625, 13.00732421875, 13.592529296875, 14.177734375, 14.762939453125, 15.34814453125, 15.933349609375, 16.5185546875, 17.103759765625, 17.68896484375, 18.274169921875, 18.859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 7.0, 10.0, 24.0, 28.0, 57.0, 87.0, 171.0, 243.0, 387.0, 658.0, 1088.0, 1809.0, 3060.0, 4879.0, 8076.0, 12996.0, 19714.0, 29790.0, 42437.0, 57646.0, 73399.0, 89286.0, 101010.0, 105598.0, 104258.0, 95522.0, 81142.0, 65170.0, 48725.0, 35212.0, 24171.0, 15620.0, 10136.0, 6401.0, 3974.0, 2321.0, 1376.0, 828.0, 507.0, 290.0, 166.0, 103.0, 67.0, 39.0, 21.0, 20.0, 8.0, 9.0, 7.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0625, -3.9302978515625, -3.798095703125, -3.6658935546875, -3.53369140625, -3.4014892578125, -3.269287109375, -3.1370849609375, -3.0048828125, -2.8726806640625, -2.740478515625, -2.6082763671875, -2.47607421875, -2.3438720703125, -2.211669921875, -2.0794677734375, -1.947265625, -1.8150634765625, -1.682861328125, -1.5506591796875, -1.41845703125, -1.2862548828125, -1.154052734375, -1.0218505859375, -0.8896484375, -0.7574462890625, -0.625244140625, -0.4930419921875, -0.36083984375, -0.2286376953125, -0.096435546875, 0.0357666015625, 0.16796875, 0.3001708984375, 0.432373046875, 0.5645751953125, 0.69677734375, 0.8289794921875, 0.961181640625, 1.0933837890625, 1.2255859375, 1.3577880859375, 1.489990234375, 1.6221923828125, 1.75439453125, 1.8865966796875, 2.018798828125, 2.1510009765625, 2.283203125, 2.4154052734375, 2.547607421875, 2.6798095703125, 2.81201171875, 2.9442138671875, 3.076416015625, 3.2086181640625, 3.3408203125, 3.4730224609375, 3.605224609375, 3.7374267578125, 3.86962890625, 4.0018310546875, 4.134033203125, 4.2662353515625, 4.3984375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 10.0, 13.0, 11.0, 18.0, 24.0, 20.0, 24.0, 37.0, 42.0, 45.0, 49.0, 44.0, 40.0, 37.0, 53.0, 61.0, 66.0, 62.0, 53.0, 41.0, 46.0, 25.0, 25.0, 22.0, 18.0, 12.0, 14.0, 18.0, 13.0, 9.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005030632019042969, -0.0004849284887313843, -0.0004667937755584717, -0.0004486590623855591, -0.0004305243492126465, -0.0004123896360397339, -0.0003942549228668213, -0.0003761202096939087, -0.0003579854965209961, -0.0003398507833480835, -0.0003217160701751709, -0.0003035813570022583, -0.0002854466438293457, -0.0002673119306564331, -0.0002491772174835205, -0.0002310425043106079, -0.0002129077911376953, -0.00019477307796478271, -0.00017663836479187012, -0.00015850365161895752, -0.00014036893844604492, -0.00012223422527313232, -0.00010409951210021973, -8.596479892730713e-05, -6.783008575439453e-05, -4.9695372581481934e-05, -3.1560659408569336e-05, -1.3425946235656738e-05, 4.708766937255859e-06, 2.2843480110168457e-05, 4.0978193283081055e-05, 5.911290645599365e-05, 7.724761962890625e-05, 9.538233280181885e-05, 0.00011351704597473145, 0.00013165175914764404, 0.00014978647232055664, 0.00016792118549346924, 0.00018605589866638184, 0.00020419061183929443, 0.00022232532501220703, 0.00024046003818511963, 0.0002585947513580322, 0.0002767294645309448, 0.0002948641777038574, 0.00031299889087677, 0.0003311336040496826, 0.0003492683172225952, 0.0003674030303955078, 0.0003855377435684204, 0.000403672456741333, 0.0004218071699142456, 0.0004399418830871582, 0.0004580765962600708, 0.0004762113094329834, 0.000494346022605896, 0.0005124807357788086, 0.0005306154489517212, 0.0005487501621246338, 0.0005668848752975464, 0.000585019588470459, 0.0006031543016433716, 0.0006212890148162842, 0.0006394237279891968, 0.0006575584411621094]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 15.0, 20.0, 36.0, 65.0, 77.0, 114.0, 174.0, 311.0, 479.0, 735.0, 1181.0, 1956.0, 3057.0, 4900.0, 7490.0, 11433.0, 16922.0, 24651.0, 34409.0, 46641.0, 59946.0, 74521.0, 86198.0, 95057.0, 98565.0, 95917.0, 87707.0, 75506.0, 61692.0, 47844.0, 35144.0, 25224.0, 17331.0, 11823.0, 7728.0, 4997.0, 3154.0, 2009.0, 1238.0, 855.0, 504.0, 323.0, 222.0, 148.0, 64.0, 60.0, 41.0, 22.0, 19.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.015625, -3.8883056640625, -3.760986328125, -3.6336669921875, -3.50634765625, -3.3790283203125, -3.251708984375, -3.1243896484375, -2.9970703125, -2.8697509765625, -2.742431640625, -2.6151123046875, -2.48779296875, -2.3604736328125, -2.233154296875, -2.1058349609375, -1.978515625, -1.8511962890625, -1.723876953125, -1.5965576171875, -1.46923828125, -1.3419189453125, -1.214599609375, -1.0872802734375, -0.9599609375, -0.8326416015625, -0.705322265625, -0.5780029296875, -0.45068359375, -0.3233642578125, -0.196044921875, -0.0687255859375, 0.05859375, 0.1859130859375, 0.313232421875, 0.4405517578125, 0.56787109375, 0.6951904296875, 0.822509765625, 0.9498291015625, 1.0771484375, 1.2044677734375, 1.331787109375, 1.4591064453125, 1.58642578125, 1.7137451171875, 1.841064453125, 1.9683837890625, 2.095703125, 2.2230224609375, 2.350341796875, 2.4776611328125, 2.60498046875, 2.7322998046875, 2.859619140625, 2.9869384765625, 3.1142578125, 3.2415771484375, 3.368896484375, 3.4962158203125, 3.62353515625, 3.7508544921875, 3.878173828125, 4.0054931640625, 4.1328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 10.0, 8.0, 7.0, 10.0, 10.0, 11.0, 20.0, 22.0, 26.0, 24.0, 28.0, 32.0, 35.0, 30.0, 28.0, 24.0, 32.0, 37.0, 30.0, 52.0, 33.0, 45.0, 33.0, 36.0, 43.0, 41.0, 36.0, 31.0, 28.0, 37.0, 16.0, 22.0, 20.0, 18.0, 8.0, 16.0, 10.0, 8.0, 5.0, 8.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-1.888671875, -1.8318023681640625, -1.774932861328125, -1.7180633544921875, -1.66119384765625, -1.6043243408203125, -1.547454833984375, -1.4905853271484375, -1.4337158203125, -1.3768463134765625, -1.319976806640625, -1.2631072998046875, -1.20623779296875, -1.1493682861328125, -1.092498779296875, -1.0356292724609375, -0.978759765625, -0.9218902587890625, -0.865020751953125, -0.8081512451171875, -0.75128173828125, -0.6944122314453125, -0.637542724609375, -0.5806732177734375, -0.5238037109375, -0.4669342041015625, -0.410064697265625, -0.3531951904296875, -0.29632568359375, -0.2394561767578125, -0.182586669921875, -0.1257171630859375, -0.06884765625, -0.0119781494140625, 0.044891357421875, 0.1017608642578125, 0.15863037109375, 0.2154998779296875, 0.272369384765625, 0.3292388916015625, 0.3861083984375, 0.4429779052734375, 0.499847412109375, 0.5567169189453125, 0.61358642578125, 0.6704559326171875, 0.727325439453125, 0.7841949462890625, 0.841064453125, 0.8979339599609375, 0.954803466796875, 1.0116729736328125, 1.06854248046875, 1.1254119873046875, 1.182281494140625, 1.2391510009765625, 1.2960205078125, 1.3528900146484375, 1.409759521484375, 1.4666290283203125, 1.52349853515625, 1.5803680419921875, 1.637237548828125, 1.6941070556640625, 1.7509765625]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 10.0, 6.0, 16.0, 24.0, 11.0, 30.0, 38.0, 39.0, 37.0, 46.0, 48.0, 58.0, 61.0, 65.0, 66.0, 52.0, 52.0, 55.0, 47.0, 45.0, 31.0, 28.0, 27.0, 18.0, 20.0, 17.0, 9.0, 9.0, 8.0, 3.0, 1.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.35736846923828, -21.492076873779297, -20.62678337097168, -19.761491775512695, -18.896198272705078, -18.030906677246094, -17.16561508178711, -16.300321578979492, -15.435029983520508, -14.569737434387207, -13.704444885253906, -12.839153289794922, -11.973860740661621, -11.10856819152832, -10.24327564239502, -9.377983093261719, -8.512690544128418, -7.647397994995117, -6.782105922698975, -5.916813373565674, -5.051521301269531, -4.1862287521362305, -3.3209362030029297, -2.455644130706787, -1.5903515815734863, -0.7250592112541199, 0.14023315906524658, 1.0055255889892578, 1.8708178997039795, 2.736110210418701, 3.601402759552002, 4.4666948318481445, 5.331987380981445, 6.197279930114746, 7.062572002410889, 7.9278645515441895, 8.793156623840332, 9.658449172973633, 10.523741722106934, 11.389034271240234, 12.254325866699219, 13.11961841583252, 13.98491096496582, 14.850202560424805, 15.715495109558105, 16.580787658691406, 17.44607925415039, 18.311372756958008, 19.176666259765625, 20.04195785522461, 20.907251358032227, 21.77254295349121, 22.637836456298828, 23.503128051757812, 24.368419647216797, 25.233713150024414, 26.0990047454834, 26.964296340942383, 27.82958984375, 28.694881439208984, 29.5601749420166, 30.425466537475586, 31.290760040283203, 32.15605163574219, 33.02134323120117]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 3.0, 4.0, 7.0, 6.0, 12.0, 17.0, 16.0, 19.0, 34.0, 21.0, 30.0, 34.0, 49.0, 54.0, 44.0, 46.0, 61.0, 49.0, 47.0, 52.0, 45.0, 34.0, 49.0, 43.0, 37.0, 25.0, 31.0, 25.0, 18.0, 13.0, 18.0, 16.0, 10.0, 6.0, 9.0, 3.0, 8.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.68611526489258, -38.43584442138672, -37.18557357788086, -35.935302734375, -34.685035705566406, -33.43476486206055, -32.18449401855469, -30.934223175048828, -29.68395233154297, -28.43368148803711, -27.183412551879883, -25.933141708374023, -24.682870864868164, -23.432601928710938, -22.182331085205078, -20.93206024169922, -19.681791305541992, -18.431520462036133, -17.181251525878906, -15.930980682373047, -14.680709838867188, -13.430439949035645, -12.180170059204102, -10.929899215698242, -9.6796293258667, -8.429359436035156, -7.179088592529297, -5.928818702697754, -4.678548336029053, -3.4282779693603516, -2.1780080795288086, -0.9277372360229492, 0.32253265380859375, 1.5728029012680054, 2.823073148727417, 4.073343276977539, 5.32361364364624, 6.573884010314941, 7.824153900146484, 9.074424743652344, 10.324694633483887, 11.57496452331543, 12.825235366821289, 14.075505256652832, 15.325775146484375, 16.576045989990234, 17.826316833496094, 19.076587677001953, 20.32685661315918, 21.57712745666504, 22.827396392822266, 24.077667236328125, 25.327938079833984, 26.578208923339844, 27.82847785949707, 29.07874870300293, 30.329017639160156, 31.579288482666016, 32.829559326171875, 34.07982635498047, 35.33009719848633, 36.58036804199219, 37.83063888549805, 39.080909729003906, 40.331180572509766]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 5.0, 18.0, 17.0, 30.0, 38.0, 47.0, 69.0, 94.0, 180.0, 224.0, 265.0, 416.0, 570.0, 868.0, 1159.0, 1561.0, 2147.0, 3001.0, 4032.0, 5262.0, 6458.0, 1002410.0, 5546.0, 4334.0, 3263.0, 2428.0, 1754.0, 1291.0, 885.0, 640.0, 487.0, 301.0, 241.0, 156.0, 123.0, 97.0, 51.0, 35.0, 28.0, 22.0, 12.0, 11.0, 10.0, 3.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.37640380859375, -201.4647216796875, -194.5530242919922, -187.64134216308594, -180.72964477539062, -173.81796264648438, -166.90626525878906, -159.9945831298828, -153.0828857421875, -146.17120361328125, -139.25950622558594, -132.3478240966797, -125.43612670898438, -118.52444458007812, -111.61274719238281, -104.70106506347656, -97.78937530517578, -90.877685546875, -83.96599578857422, -77.05430603027344, -70.14261627197266, -63.23093032836914, -56.31924057006836, -49.40755081176758, -42.4958610534668, -35.584171295166016, -28.672481536865234, -21.760793685913086, -14.849103927612305, -7.937416076660156, -1.025726318359375, 5.885963439941406, 12.797653198242188, 19.70934295654297, 26.62103271484375, 33.53272247314453, 40.44441223144531, 47.35609817504883, 54.26778793334961, 61.17947769165039, 68.09117126464844, 75.00286102294922, 81.91455078125, 88.82624053955078, 95.73793029785156, 102.64961242675781, 109.56130981445312, 116.47299194335938, 123.38468170166016, 130.29637145996094, 137.2080535888672, 144.1197509765625, 151.03143310546875, 157.94313049316406, 164.8548126220703, 171.76651000976562, 178.67819213867188, 185.58987426757812, 192.50157165527344, 199.4132537841797, 206.324951171875, 213.23663330078125, 220.14833068847656, 227.0600128173828, 233.97171020507812]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 7.0, 8.0, 12.0, 12.0, 9.0, 15.0, 29.0, 29.0, 39.0, 41.0, 49.0, 66.0, 97.0, 134.0, 254.0, 381.0, 641.0, 1167.0, 2140.0, 3954.0, 7951.0, 15781.0, 28511.0, 55647.0, 51243444.0, 51654.0, 27158.0, 15412.0, 7700.0, 3953.0, 2090.0, 1099.0, 650.0, 401.0, 236.0, 135.0, 116.0, 70.0, 39.0, 39.0, 28.0, 24.0, 24.0, 16.0, 17.0, 13.0, 7.0, 12.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-402.75, -389.953125, -377.15625, -364.359375, -351.5625, -338.765625, -325.96875, -313.171875, -300.375, -287.578125, -274.78125, -261.984375, -249.1875, -236.390625, -223.59375, -210.796875, -198.0, -185.203125, -172.40625, -159.609375, -146.8125, -134.015625, -121.21875, -108.421875, -95.625, -82.828125, -70.03125, -57.234375, -44.4375, -31.640625, -18.84375, -6.046875, 6.75, 19.546875, 32.34375, 45.140625, 57.9375, 70.734375, 83.53125, 96.328125, 109.125, 121.921875, 134.71875, 147.515625, 160.3125, 173.109375, 185.90625, 198.703125, 211.5, 224.296875, 237.09375, 249.890625, 262.6875, 275.484375, 288.28125, 301.078125, 313.875, 326.671875, 339.46875, 352.265625, 365.0625, 377.859375, 390.65625, 403.453125, 416.25]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 14.0, 19.0, 33.0, 93.0, 267.0, 364.0, 138.0, 47.0, 15.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.69442749023438, -77.61419677734375, -74.5339584350586, -71.45372772216797, -68.37348937988281, -65.29325866699219, -62.2130241394043, -59.132789611816406, -56.052555084228516, -52.972320556640625, -49.892086029052734, -46.811851501464844, -43.73162078857422, -40.65138244628906, -37.57115173339844, -34.49091720581055, -31.410682678222656, -28.330448150634766, -25.250213623046875, -22.169981002807617, -19.089746475219727, -16.009511947631836, -12.929279327392578, -9.849044799804688, -6.768810272216797, -3.6885762214660645, -0.608342170715332, 2.471891403198242, 5.552125930786133, 8.632360458374023, 11.712593078613281, 14.792827606201172, 17.87305450439453, 20.953289031982422, 24.033523559570312, 27.11375617980957, 30.19399070739746, 33.27422332763672, 36.35445785522461, 39.4346923828125, 42.51492691040039, 45.59516143798828, 48.67539596557617, 51.75563049316406, 54.83586120605469, 57.916099548339844, 60.99633026123047, 64.07656860351562, 67.15679931640625, 70.23703002929688, 73.31726837158203, 76.39749908447266, 79.47773742675781, 82.55796813964844, 85.63819885253906, 88.71843719482422, 91.79867553710938, 94.87890625, 97.95914459228516, 101.03937530517578, 104.11961364746094, 107.19984436035156, 110.28007507324219, 113.36031341552734, 116.44054412841797]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 18.0, 16.0, 25.0, 38.0, 69.0, 124.0, 165.0, 199.0, 145.0, 79.0, 45.0, 20.0, 16.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.71533203125, -162.93698120117188, -158.15863037109375, -153.3802947998047, -148.60194396972656, -143.82359313964844, -139.04525756835938, -134.26690673828125, -129.48855590820312, -124.710205078125, -119.9318618774414, -115.15351867675781, -110.37516784667969, -105.59681701660156, -100.81847381591797, -96.04013061523438, -91.26177978515625, -86.48342895507812, -81.70508575439453, -76.92674255371094, -72.14839172363281, -67.37004089355469, -62.591697692871094, -57.813350677490234, -53.035003662109375, -48.256656646728516, -43.478309631347656, -38.6999626159668, -33.92161560058594, -29.143268585205078, -24.36492156982422, -19.58657455444336, -14.808242797851562, -10.029895782470703, -5.251548767089844, -0.4732017517089844, 4.305145263671875, 9.083492279052734, 13.861839294433594, 18.640186309814453, 23.418533325195312, 28.196880340576172, 32.97522735595703, 37.75357437133789, 42.53192138671875, 47.31026840209961, 52.08861541748047, 56.86696243286133, 61.64530944824219, 66.42366027832031, 71.2020034790039, 75.9803466796875, 80.75869750976562, 85.53704833984375, 90.31539154052734, 95.09373474121094, 99.87208557128906, 104.65043640136719, 109.42877960205078, 114.20712280273438, 118.9854736328125, 123.76382446289062, 128.54217529296875, 133.3205108642578, 138.09886169433594]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 12.0, 14.0, 24.0, 26.0, 48.0, 69.0, 71.0, 121.0, 208.0, 353.0, 485.0, 760.0, 1129.0, 1923.0, 3418.0, 6248.0, 13193.0, 35914.0, 249335.0, 3793840.0, 52943.0, 16856.0, 7580.0, 3862.0, 2168.0, 1311.0, 793.0, 502.0, 334.0, 217.0, 157.0, 96.0, 79.0, 63.0, 39.0, 18.0, 18.0, 12.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.220703125, -1.1757659912109375, -1.130828857421875, -1.0858917236328125, -1.04095458984375, -0.9960174560546875, -0.951080322265625, -0.9061431884765625, -0.8612060546875, -0.8162689208984375, -0.771331787109375, -0.7263946533203125, -0.68145751953125, -0.6365203857421875, -0.591583251953125, -0.5466461181640625, -0.501708984375, -0.4567718505859375, -0.411834716796875, -0.3668975830078125, -0.32196044921875, -0.2770233154296875, -0.232086181640625, -0.1871490478515625, -0.1422119140625, -0.0972747802734375, -0.052337646484375, -0.0074005126953125, 0.03753662109375, 0.0824737548828125, 0.127410888671875, 0.1723480224609375, 0.21728515625, 0.2622222900390625, 0.307159423828125, 0.3520965576171875, 0.39703369140625, 0.4419708251953125, 0.486907958984375, 0.5318450927734375, 0.5767822265625, 0.6217193603515625, 0.666656494140625, 0.7115936279296875, 0.75653076171875, 0.8014678955078125, 0.846405029296875, 0.8913421630859375, 0.936279296875, 0.9812164306640625, 1.026153564453125, 1.0710906982421875, 1.11602783203125, 1.1609649658203125, 1.205902099609375, 1.2508392333984375, 1.2957763671875, 1.3407135009765625, 1.385650634765625, 1.4305877685546875, 1.47552490234375, 1.5204620361328125, 1.565399169921875, 1.6103363037109375, 1.6552734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 8.0, 8.0, 6.0, 10.0, 10.0, 14.0, 16.0, 62.0, 627.0, 113.0, 22.0, 18.0, 10.0, 8.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.194580078125, -0.18776702880859375, -0.1809539794921875, -0.17414093017578125, -0.167327880859375, -0.16051483154296875, -0.1537017822265625, -0.14688873291015625, -0.14007568359375, -0.13326263427734375, -0.1264495849609375, -0.11963653564453125, -0.112823486328125, -0.10601043701171875, -0.0991973876953125, -0.09238433837890625, -0.0855712890625, -0.07875823974609375, -0.0719451904296875, -0.06513214111328125, -0.058319091796875, -0.05150604248046875, -0.0446929931640625, -0.03787994384765625, -0.03106689453125, -0.02425384521484375, -0.0174407958984375, -0.01062774658203125, -0.003814697265625, 0.00299835205078125, 0.0098114013671875, 0.01662445068359375, 0.0234375, 0.03025054931640625, 0.0370635986328125, 0.04387664794921875, 0.050689697265625, 0.05750274658203125, 0.0643157958984375, 0.07112884521484375, 0.07794189453125, 0.08475494384765625, 0.0915679931640625, 0.09838104248046875, 0.105194091796875, 0.11200714111328125, 0.1188201904296875, 0.12563323974609375, 0.1324462890625, 0.13925933837890625, 0.1460723876953125, 0.15288543701171875, 0.159698486328125, 0.16651153564453125, 0.1733245849609375, 0.18013763427734375, 0.18695068359375, 0.19376373291015625, 0.2005767822265625, 0.20738983154296875, 0.214202880859375, 0.22101593017578125, 0.2278289794921875, 0.23464202880859375, 0.241455078125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 7.0, 11.0, 10.0, 14.0, 29.0, 49.0, 59.0, 105.0, 116.0, 203.0, 269.0, 408.0, 751.0, 1450.0, 3264.0, 7462.0, 21123.0, 84449.0, 1086983.0, 2843341.0, 105050.0, 23915.0, 8186.0, 3241.0, 1555.0, 802.0, 479.0, 304.0, 192.0, 128.0, 85.0, 75.0, 36.0, 33.0, 23.0, 21.0, 15.0, 17.0, 8.0, 1.0, 5.0, 6.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.474609375, -1.4325714111328125, -1.390533447265625, -1.3484954833984375, -1.30645751953125, -1.2644195556640625, -1.222381591796875, -1.1803436279296875, -1.1383056640625, -1.0962677001953125, -1.054229736328125, -1.0121917724609375, -0.97015380859375, -0.9281158447265625, -0.886077880859375, -0.8440399169921875, -0.802001953125, -0.7599639892578125, -0.717926025390625, -0.6758880615234375, -0.63385009765625, -0.5918121337890625, -0.549774169921875, -0.5077362060546875, -0.4656982421875, -0.4236602783203125, -0.381622314453125, -0.3395843505859375, -0.29754638671875, -0.2555084228515625, -0.213470458984375, -0.1714324951171875, -0.12939453125, -0.0873565673828125, -0.045318603515625, -0.0032806396484375, 0.03875732421875, 0.0807952880859375, 0.122833251953125, 0.1648712158203125, 0.2069091796875, 0.2489471435546875, 0.290985107421875, 0.3330230712890625, 0.37506103515625, 0.4170989990234375, 0.459136962890625, 0.5011749267578125, 0.543212890625, 0.5852508544921875, 0.627288818359375, 0.6693267822265625, 0.71136474609375, 0.7534027099609375, 0.795440673828125, 0.8374786376953125, 0.8795166015625, 0.9215545654296875, 0.963592529296875, 1.0056304931640625, 1.04766845703125, 1.0897064208984375, 1.131744384765625, 1.1737823486328125, 1.2158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 2.0, 3.0, 7.0, 7.0, 8.0, 10.0, 14.0, 12.0, 22.0, 19.0, 24.0, 32.0, 36.0, 66.0, 68.0, 95.0, 142.0, 156.0, 296.0, 521.0, 1089.0, 525.0, 254.0, 173.0, 134.0, 90.0, 66.0, 49.0, 35.0, 32.0, 21.0, 15.0, 13.0, 8.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31982421875, -0.3086204528808594, -0.29741668701171875, -0.2862129211425781, -0.2750091552734375, -0.2638053894042969, -0.25260162353515625, -0.24139785766601562, -0.230194091796875, -0.21899032592773438, -0.20778656005859375, -0.19658279418945312, -0.1853790283203125, -0.17417526245117188, -0.16297149658203125, -0.15176773071289062, -0.14056396484375, -0.12936019897460938, -0.11815643310546875, -0.10695266723632812, -0.0957489013671875, -0.08454513549804688, -0.07334136962890625, -0.062137603759765625, -0.050933837890625, -0.039730072021484375, -0.02852630615234375, -0.017322540283203125, -0.0061187744140625, 0.005084991455078125, 0.01628875732421875, 0.027492523193359375, 0.0386962890625, 0.049900054931640625, 0.06110382080078125, 0.07230758666992188, 0.0835113525390625, 0.09471511840820312, 0.10591888427734375, 0.11712265014648438, 0.128326416015625, 0.13953018188476562, 0.15073394775390625, 0.16193771362304688, 0.1731414794921875, 0.18434524536132812, 0.19554901123046875, 0.20675277709960938, 0.21795654296875, 0.22916030883789062, 0.24036407470703125, 0.2515678405761719, 0.2627716064453125, 0.2739753723144531, 0.28517913818359375, 0.2963829040527344, 0.307586669921875, 0.3187904357910156, 0.32999420166015625, 0.3411979675292969, 0.3524017333984375, 0.3636054992675781, 0.37480926513671875, 0.3860130310058594, 0.397216796875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 6.0, 16.0, 20.0, 66.0, 177.0, 430.0, 182.0, 56.0, 21.0, 12.0, 7.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.421138763427734, -7.251067161560059, -7.080995559692383, -6.910923480987549, -6.740851879119873, -6.570780277252197, -6.4007086753845215, -6.2306365966796875, -6.060564994812012, -5.890493392944336, -5.72042179107666, -5.550349712371826, -5.38027811050415, -5.210206508636475, -5.040134906768799, -4.870062828063965, -4.699991226196289, -4.529919624328613, -4.3598480224609375, -4.1897759437561035, -4.019704341888428, -3.849632740020752, -3.679561138153076, -3.5094892978668213, -3.3394179344177246, -3.169346332550049, -2.999274492263794, -2.829202890396118, -2.6591310501098633, -2.4890594482421875, -2.3189878463745117, -2.148916006088257, -1.9788439273834229, -1.8087722063064575, -1.6387004852294922, -1.4686288833618164, -1.2985570430755615, -1.1284854412078857, -0.9584137201309204, -0.7883419990539551, -0.6182702779769897, -0.4481985569000244, -0.27812686562538147, -0.10805517435073853, 0.06201654672622681, 0.23208826780319214, 0.4021599292755127, 0.572231650352478, 0.7423033714294434, 0.9123750925064087, 1.082446813583374, 1.2525184154510498, 1.4225902557373047, 1.5926618576049805, 1.7627335786819458, 1.9328052997589111, 2.102877140045166, 2.272948741912842, 2.4430205821990967, 2.6130921840667725, 2.7831640243530273, 2.953235626220703, 3.123307228088379, 3.293379068374634, 3.4634506702423096]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 15.0, 17.0, 30.0, 26.0, 29.0, 42.0, 49.0, 52.0, 42.0, 81.0, 70.0, 69.0, 62.0, 59.0, 56.0, 52.0, 47.0, 35.0, 31.0, 24.0, 22.0, 22.0, 18.0, 6.0, 10.0, 10.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.0999159812927246, -3.023454189300537, -2.9469923973083496, -2.870530366897583, -2.7940685749053955, -2.717606782913208, -2.6411447525024414, -2.564682960510254, -2.4882211685180664, -2.411759376525879, -2.3352975845336914, -2.258835554122925, -2.1823737621307373, -2.10591197013855, -2.029449939727783, -1.9529881477355957, -1.8765263557434082, -1.8000645637512207, -1.7236026525497437, -1.6471407413482666, -1.570678949356079, -1.4942171573638916, -1.4177552461624146, -1.3412933349609375, -1.26483154296875, -1.1883697509765625, -1.1119078397750854, -1.0354459285736084, -0.9589841365814209, -0.8825222849845886, -0.8060604333877563, -0.7295985817909241, -0.6531369686126709, -0.5766751170158386, -0.5002132654190063, -0.4237514138221741, -0.3472895622253418, -0.2708277106285095, -0.19436585903167725, -0.11790400743484497, -0.041442155838012695, 0.03501969575881958, 0.11148154735565186, 0.18794339895248413, 0.2644052505493164, 0.3408671021461487, 0.41732895374298096, 0.49379080533981323, 0.5702526569366455, 0.6467145085334778, 0.7231763601303101, 0.7996382117271423, 0.8761000633239746, 0.9525619149208069, 1.0290237665176392, 1.1054856777191162, 1.1819474697113037, 1.2584092617034912, 1.3348711729049683, 1.4113330841064453, 1.4877948760986328, 1.5642566680908203, 1.6407185792922974, 1.7171804904937744, 1.793642282485962]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 11.0, 11.0, 11.0, 17.0, 34.0, 41.0, 59.0, 76.0, 105.0, 130.0, 215.0, 275.0, 366.0, 533.0, 805.0, 1100.0, 1615.0, 2439.0, 3724.0, 5904.0, 10337.0, 22719.0, 121817.0, 765094.0, 68662.0, 18050.0, 8668.0, 5210.0, 3366.0, 2250.0, 1443.0, 986.0, 698.0, 498.0, 381.0, 238.0, 197.0, 122.0, 85.0, 74.0, 57.0, 42.0, 29.0, 15.0, 14.0, 7.0, 10.0, 4.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.99932861328125, -0.9664306640625, -0.93353271484375, -0.900634765625, -0.86773681640625, -0.8348388671875, -0.80194091796875, -0.76904296875, -0.73614501953125, -0.7032470703125, -0.67034912109375, -0.637451171875, -0.60455322265625, -0.5716552734375, -0.53875732421875, -0.505859375, -0.47296142578125, -0.4400634765625, -0.40716552734375, -0.374267578125, -0.34136962890625, -0.3084716796875, -0.27557373046875, -0.24267578125, -0.20977783203125, -0.1768798828125, -0.14398193359375, -0.111083984375, -0.07818603515625, -0.0452880859375, -0.01239013671875, 0.0205078125, 0.05340576171875, 0.0863037109375, 0.11920166015625, 0.152099609375, 0.18499755859375, 0.2178955078125, 0.25079345703125, 0.28369140625, 0.31658935546875, 0.3494873046875, 0.38238525390625, 0.415283203125, 0.44818115234375, 0.4810791015625, 0.51397705078125, 0.546875, 0.57977294921875, 0.6126708984375, 0.64556884765625, 0.678466796875, 0.71136474609375, 0.7442626953125, 0.77716064453125, 0.81005859375, 0.84295654296875, 0.8758544921875, 0.90875244140625, 0.941650390625, 0.97454833984375, 1.0074462890625, 1.04034423828125, 1.0732421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 6.0, 4.0, 8.0, 3.0, 7.0, 7.0, 11.0, 9.0, 30.0, 94.0, 219.0, 275.0, 157.0, 62.0, 24.0, 12.0, 13.0, 7.0, 7.0, 5.0, 3.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.242919921875, -0.2358226776123047, -0.22872543334960938, -0.22162818908691406, -0.21453094482421875, -0.20743370056152344, -0.20033645629882812, -0.1932392120361328, -0.1861419677734375, -0.1790447235107422, -0.17194747924804688, -0.16485023498535156, -0.15775299072265625, -0.15065574645996094, -0.14355850219726562, -0.1364612579345703, -0.129364013671875, -0.12226676940917969, -0.11516952514648438, -0.10807228088378906, -0.10097503662109375, -0.09387779235839844, -0.08678054809570312, -0.07968330383300781, -0.0725860595703125, -0.06548881530761719, -0.058391571044921875, -0.05129432678222656, -0.04419708251953125, -0.03709983825683594, -0.030002593994140625, -0.022905349731445312, -0.01580810546875, -0.008710861206054688, -0.001613616943359375, 0.0054836273193359375, 0.01258087158203125, 0.019678115844726562, 0.026775360107421875, 0.03387260437011719, 0.0409698486328125, 0.04806709289550781, 0.055164337158203125, 0.06226158142089844, 0.06935882568359375, 0.07645606994628906, 0.08355331420898438, 0.09065055847167969, 0.097747802734375, 0.10484504699707031, 0.11194229125976562, 0.11903953552246094, 0.12613677978515625, 0.13323402404785156, 0.14033126831054688, 0.1474285125732422, 0.1545257568359375, 0.1616230010986328, 0.16872024536132812, 0.17581748962402344, 0.18291473388671875, 0.19001197814941406, 0.19710922241210938, 0.2042064666748047, 0.2113037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 3.0, 5.0, 10.0, 10.0, 17.0, 15.0, 24.0, 32.0, 56.0, 113.0, 248.0, 601.0, 2245.0, 11658.0, 255918.0, 752275.0, 20559.0, 3262.0, 812.0, 326.0, 134.0, 74.0, 51.0, 23.0, 23.0, 11.0, 8.0, 6.0, 9.0, 7.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.271484375, -3.1663818359375, -3.061279296875, -2.9561767578125, -2.85107421875, -2.7459716796875, -2.640869140625, -2.5357666015625, -2.4306640625, -2.3255615234375, -2.220458984375, -2.1153564453125, -2.01025390625, -1.9051513671875, -1.800048828125, -1.6949462890625, -1.58984375, -1.4847412109375, -1.379638671875, -1.2745361328125, -1.16943359375, -1.0643310546875, -0.959228515625, -0.8541259765625, -0.7490234375, -0.6439208984375, -0.538818359375, -0.4337158203125, -0.32861328125, -0.2235107421875, -0.118408203125, -0.0133056640625, 0.091796875, 0.1968994140625, 0.302001953125, 0.4071044921875, 0.51220703125, 0.6173095703125, 0.722412109375, 0.8275146484375, 0.9326171875, 1.0377197265625, 1.142822265625, 1.2479248046875, 1.35302734375, 1.4581298828125, 1.563232421875, 1.6683349609375, 1.7734375, 1.8785400390625, 1.983642578125, 2.0887451171875, 2.19384765625, 2.2989501953125, 2.404052734375, 2.5091552734375, 2.6142578125, 2.7193603515625, 2.824462890625, 2.9295654296875, 3.03466796875, 3.1397705078125, 3.244873046875, 3.3499755859375, 3.455078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 7.0, 9.0, 16.0, 14.0, 15.0, 13.0, 20.0, 19.0, 19.0, 26.0, 30.0, 21.0, 44.0, 29.0, 29.0, 50.0, 56.0, 42.0, 45.0, 39.0, 44.0, 38.0, 37.0, 42.0, 40.0, 29.0, 23.0, 34.0, 24.0, 20.0, 16.0, 12.0, 19.0, 17.0, 13.0, 10.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.93603515625, -0.9067459106445312, -0.8774566650390625, -0.8481674194335938, -0.818878173828125, -0.7895889282226562, -0.7602996826171875, -0.7310104370117188, -0.70172119140625, -0.6724319458007812, -0.6431427001953125, -0.6138534545898438, -0.584564208984375, -0.5552749633789062, -0.5259857177734375, -0.49669647216796875, -0.4674072265625, -0.43811798095703125, -0.4088287353515625, -0.37953948974609375, -0.350250244140625, -0.32096099853515625, -0.2916717529296875, -0.26238250732421875, -0.23309326171875, -0.20380401611328125, -0.1745147705078125, -0.14522552490234375, -0.115936279296875, -0.08664703369140625, -0.0573577880859375, -0.02806854248046875, 0.001220703125, 0.03050994873046875, 0.0597991943359375, 0.08908843994140625, 0.118377685546875, 0.14766693115234375, 0.1769561767578125, 0.20624542236328125, 0.23553466796875, 0.26482391357421875, 0.2941131591796875, 0.32340240478515625, 0.352691650390625, 0.38198089599609375, 0.4112701416015625, 0.44055938720703125, 0.4698486328125, 0.49913787841796875, 0.5284271240234375, 0.5577163696289062, 0.587005615234375, 0.6162948608398438, 0.6455841064453125, 0.6748733520507812, 0.70416259765625, 0.7334518432617188, 0.7627410888671875, 0.7920303344726562, 0.821319580078125, 0.8506088256835938, 0.8798980712890625, 0.9091873168945312, 0.9384765625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 6.0, 4.0, 7.0, 5.0, 10.0, 14.0, 15.0, 25.0, 38.0, 61.0, 110.0, 177.0, 345.0, 705.0, 1837.0, 8692.0, 969201.0, 60614.0, 4250.0, 1272.0, 534.0, 254.0, 128.0, 80.0, 60.0, 31.0, 31.0, 18.0, 11.0, 6.0, 6.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.875, -7.64874267578125, -7.4224853515625, -7.19622802734375, -6.969970703125, -6.74371337890625, -6.5174560546875, -6.29119873046875, -6.06494140625, -5.83868408203125, -5.6124267578125, -5.38616943359375, -5.159912109375, -4.93365478515625, -4.7073974609375, -4.48114013671875, -4.2548828125, -4.02862548828125, -3.8023681640625, -3.57611083984375, -3.349853515625, -3.12359619140625, -2.8973388671875, -2.67108154296875, -2.44482421875, -2.21856689453125, -1.9923095703125, -1.76605224609375, -1.539794921875, -1.31353759765625, -1.0872802734375, -0.86102294921875, -0.634765625, -0.40850830078125, -0.1822509765625, 0.04400634765625, 0.270263671875, 0.49652099609375, 0.7227783203125, 0.94903564453125, 1.17529296875, 1.40155029296875, 1.6278076171875, 1.85406494140625, 2.080322265625, 2.30657958984375, 2.5328369140625, 2.75909423828125, 2.9853515625, 3.21160888671875, 3.4378662109375, 3.66412353515625, 3.890380859375, 4.11663818359375, 4.3428955078125, 4.56915283203125, 4.79541015625, 5.02166748046875, 5.2479248046875, 5.47418212890625, 5.700439453125, 5.92669677734375, 6.1529541015625, 6.37921142578125, 6.60546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 4.0, 15.0, 7.0, 5.0, 13.0, 11.0, 15.0, 21.0, 27.0, 27.0, 33.0, 37.0, 66.0, 112.0, 193.0, 115.0, 45.0, 57.0, 39.0, 28.0, 22.0, 18.0, 10.0, 14.0, 14.0, 14.0, 9.0, 7.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011320114135742188, -0.0010936558246612549, -0.001055300235748291, -0.0010169446468353271, -0.0009785890579223633, -0.0009402334690093994, -0.0009018778800964355, -0.0008635222911834717, -0.0008251667022705078, -0.0007868111133575439, -0.0007484555244445801, -0.0007100999355316162, -0.0006717443466186523, -0.0006333887577056885, -0.0005950331687927246, -0.0005566775798797607, -0.0005183219909667969, -0.000479966402053833, -0.00044161081314086914, -0.0004032552242279053, -0.0003648996353149414, -0.00032654404640197754, -0.00028818845748901367, -0.0002498328685760498, -0.00021147727966308594, -0.00017312169075012207, -0.0001347661018371582, -9.641051292419434e-05, -5.805492401123047e-05, -1.96993350982666e-05, 1.8656253814697266e-05, 5.701184272766113e-05, 9.5367431640625e-05, 0.00013372302055358887, 0.00017207860946655273, 0.0002104341983795166, 0.00024878978729248047, 0.00028714537620544434, 0.0003255009651184082, 0.00036385655403137207, 0.00040221214294433594, 0.0004405677318572998, 0.00047892332077026367, 0.0005172789096832275, 0.0005556344985961914, 0.0005939900875091553, 0.0006323456764221191, 0.000670701265335083, 0.0007090568542480469, 0.0007474124431610107, 0.0007857680320739746, 0.0008241236209869385, 0.0008624792098999023, 0.0009008347988128662, 0.0009391903877258301, 0.000977545976638794, 0.0010159015655517578, 0.0010542571544647217, 0.0010926127433776855, 0.0011309683322906494, 0.0011693239212036133, 0.0012076795101165771, 0.001246035099029541, 0.0012843906879425049, 0.0013227462768554688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 4.0, 11.0, 20.0, 22.0, 43.0, 72.0, 137.0, 252.0, 488.0, 1195.0, 3684.0, 16019.0, 905062.0, 107853.0, 9350.0, 2431.0, 982.0, 409.0, 194.0, 121.0, 62.0, 44.0, 35.0, 16.0, 12.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.27056884765625, -4.1114501953125, -3.95233154296875, -3.793212890625, -3.63409423828125, -3.4749755859375, -3.31585693359375, -3.15673828125, -2.99761962890625, -2.8385009765625, -2.67938232421875, -2.520263671875, -2.36114501953125, -2.2020263671875, -2.04290771484375, -1.8837890625, -1.72467041015625, -1.5655517578125, -1.40643310546875, -1.247314453125, -1.08819580078125, -0.9290771484375, -0.76995849609375, -0.61083984375, -0.45172119140625, -0.2926025390625, -0.13348388671875, 0.025634765625, 0.18475341796875, 0.3438720703125, 0.50299072265625, 0.662109375, 0.82122802734375, 0.9803466796875, 1.13946533203125, 1.298583984375, 1.45770263671875, 1.6168212890625, 1.77593994140625, 1.93505859375, 2.09417724609375, 2.2532958984375, 2.41241455078125, 2.571533203125, 2.73065185546875, 2.8897705078125, 3.04888916015625, 3.2080078125, 3.36712646484375, 3.5262451171875, 3.68536376953125, 3.844482421875, 4.00360107421875, 4.1627197265625, 4.32183837890625, 4.48095703125, 4.64007568359375, 4.7991943359375, 4.95831298828125, 5.117431640625, 5.27655029296875, 5.4356689453125, 5.59478759765625, 5.75390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 5.0, 6.0, 14.0, 10.0, 19.0, 15.0, 33.0, 52.0, 102.0, 357.0, 198.0, 73.0, 41.0, 17.0, 11.0, 6.0, 5.0, 7.0, 5.0, 7.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.957611083984375, -3.85272216796875, -3.747833251953125, -3.6429443359375, -3.538055419921875, -3.43316650390625, -3.328277587890625, -3.223388671875, -3.118499755859375, -3.01361083984375, -2.908721923828125, -2.8038330078125, -2.698944091796875, -2.59405517578125, -2.489166259765625, -2.38427734375, -2.279388427734375, -2.17449951171875, -2.069610595703125, -1.9647216796875, -1.859832763671875, -1.75494384765625, -1.650054931640625, -1.545166015625, -1.440277099609375, -1.33538818359375, -1.230499267578125, -1.1256103515625, -1.020721435546875, -0.91583251953125, -0.810943603515625, -0.7060546875, -0.601165771484375, -0.49627685546875, -0.391387939453125, -0.2864990234375, -0.181610107421875, -0.07672119140625, 0.028167724609375, 0.133056640625, 0.237945556640625, 0.34283447265625, 0.447723388671875, 0.5526123046875, 0.657501220703125, 0.76239013671875, 0.867279052734375, 0.97216796875, 1.077056884765625, 1.18194580078125, 1.286834716796875, 1.3917236328125, 1.496612548828125, 1.60150146484375, 1.706390380859375, 1.811279296875, 1.916168212890625, 2.02105712890625, 2.125946044921875, 2.2308349609375, 2.335723876953125, 2.44061279296875, 2.545501708984375, 2.650390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 22.0, 38.0, 226.0, 567.0, 121.0, 16.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-60.37192916870117, -58.97962188720703, -57.58731460571289, -56.19500732421875, -54.80270004272461, -53.41039276123047, -52.01808547973633, -50.62577819824219, -49.23347091674805, -47.841163635253906, -46.448856353759766, -45.056549072265625, -43.664241790771484, -42.271934509277344, -40.8796272277832, -39.48731994628906, -38.09501647949219, -36.70270919799805, -35.310401916503906, -33.918094635009766, -32.525787353515625, -31.133480072021484, -29.741172790527344, -28.348865509033203, -26.956558227539062, -25.564250946044922, -24.17194366455078, -22.77963638305664, -21.3873291015625, -19.99502182006836, -18.60271453857422, -17.210407257080078, -15.818098068237305, -14.425790786743164, -13.033483505249023, -11.641176223754883, -10.248868942260742, -8.856561660766602, -7.464255332946777, -6.071948051452637, -4.679640769958496, -3.2873334884643555, -1.895026445388794, -0.5027194023132324, 0.8895878791809082, 2.281895160675049, 3.6742019653320312, 5.066509246826172, 6.4588165283203125, 7.851123809814453, 9.243431091308594, 10.635738372802734, 12.028045654296875, 13.420352935791016, 14.81265926361084, 16.204967498779297, 17.597274780273438, 18.989582061767578, 20.38188934326172, 21.77419662475586, 23.16650390625, 24.55881118774414, 25.95111846923828, 27.343425750732422, 28.73573112487793]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 4.0, 7.0, 4.0, 2.0, 9.0, 15.0, 16.0, 18.0, 45.0, 48.0, 68.0, 94.0, 112.0, 121.0, 110.0, 98.0, 61.0, 40.0, 30.0, 32.0, 20.0, 11.0, 12.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.658111572265625, -17.033716201782227, -16.409318923950195, -15.784923553466797, -15.160527229309082, -14.536130905151367, -13.911735534667969, -13.287339210510254, -12.662942886352539, -12.038546562194824, -11.41415023803711, -10.789754867553711, -10.165358543395996, -9.540962219238281, -8.916566848754883, -8.292170524597168, -7.667774200439453, -7.043377876281738, -6.418982028961182, -5.794586181640625, -5.17018985748291, -4.545793533325195, -3.9213976860046387, -3.297001838684082, -2.672605514526367, -2.0482094287872314, -1.4238133430480957, -0.79941725730896, -0.17502117156982422, 0.4493749141693115, 1.0737709999084473, 1.698166847229004, 2.3225631713867188, 2.9469592571258545, 3.5713553428649902, 4.195751190185547, 4.820147514343262, 5.444543838500977, 6.068939685821533, 6.69333553314209, 7.317731857299805, 7.9421281814575195, 8.566524505615234, 9.190919876098633, 9.815316200256348, 10.439712524414062, 11.064107894897461, 11.688504219055176, 12.31290054321289, 12.937296867370605, 13.56169319152832, 14.186088562011719, 14.810484886169434, 15.434881210327148, 16.059276580810547, 16.683673858642578, 17.308069229125977, 17.932464599609375, 18.556861877441406, 19.181257247924805, 19.805652618408203, 20.430049896240234, 21.054445266723633, 21.67884063720703, 22.303237915039062]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 11.0, 15.0, 19.0, 22.0, 48.0, 50.0, 110.0, 205.0, 537.0, 1685.0, 6434.0, 68602.0, 4086791.0, 23956.0, 3802.0, 1160.0, 432.0, 198.0, 95.0, 39.0, 18.0, 19.0, 4.0, 8.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.7215576171875, -6.466552734375, -6.2115478515625, -5.95654296875, -5.7015380859375, -5.446533203125, -5.1915283203125, -4.9365234375, -4.6815185546875, -4.426513671875, -4.1715087890625, -3.91650390625, -3.6614990234375, -3.406494140625, -3.1514892578125, -2.896484375, -2.6414794921875, -2.386474609375, -2.1314697265625, -1.87646484375, -1.6214599609375, -1.366455078125, -1.1114501953125, -0.8564453125, -0.6014404296875, -0.346435546875, -0.0914306640625, 0.16357421875, 0.4185791015625, 0.673583984375, 0.9285888671875, 1.18359375, 1.4385986328125, 1.693603515625, 1.9486083984375, 2.20361328125, 2.4586181640625, 2.713623046875, 2.9686279296875, 3.2236328125, 3.4786376953125, 3.733642578125, 3.9886474609375, 4.24365234375, 4.4986572265625, 4.753662109375, 5.0086669921875, 5.263671875, 5.5186767578125, 5.773681640625, 6.0286865234375, 6.28369140625, 6.5386962890625, 6.793701171875, 7.0487060546875, 7.3037109375, 7.5587158203125, 7.813720703125, 8.0687255859375, 8.32373046875, 8.5787353515625, 8.833740234375, 9.0887451171875, 9.34375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 10.0, 4.0, 11.0, 11.0, 15.0, 24.0, 61.0, 118.0, 165.0, 178.0, 147.0, 92.0, 52.0, 24.0, 12.0, 10.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.277587890625, -0.2701282501220703, -0.2626686096191406, -0.25520896911621094, -0.24774932861328125, -0.24028968811035156, -0.23283004760742188, -0.2253704071044922, -0.2179107666015625, -0.2104511260986328, -0.20299148559570312, -0.19553184509277344, -0.18807220458984375, -0.18061256408691406, -0.17315292358398438, -0.1656932830810547, -0.158233642578125, -0.1507740020751953, -0.14331436157226562, -0.13585472106933594, -0.12839508056640625, -0.12093544006347656, -0.11347579956054688, -0.10601615905761719, -0.0985565185546875, -0.09109687805175781, -0.08363723754882812, -0.07617759704589844, -0.06871795654296875, -0.06125831604003906, -0.053798675537109375, -0.04633903503417969, -0.03887939453125, -0.03141975402832031, -0.023960113525390625, -0.016500473022460938, -0.00904083251953125, -0.0015811920166015625, 0.005878448486328125, 0.013338088989257812, 0.0207977294921875, 0.028257369995117188, 0.035717010498046875, 0.04317665100097656, 0.05063629150390625, 0.05809593200683594, 0.06555557250976562, 0.07301521301269531, 0.080474853515625, 0.08793449401855469, 0.09539413452148438, 0.10285377502441406, 0.11031341552734375, 0.11777305603027344, 0.12523269653320312, 0.1326923370361328, 0.1401519775390625, 0.1476116180419922, 0.15507125854492188, 0.16253089904785156, 0.16999053955078125, 0.17745018005371094, 0.18490982055664062, 0.1923694610595703, 0.1998291015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 8.0, 15.0, 17.0, 9.0, 22.0, 23.0, 38.0, 58.0, 84.0, 142.0, 221.0, 366.0, 641.0, 1173.0, 2197.0, 5161.0, 13077.0, 47225.0, 1407824.0, 2643486.0, 48629.0, 13508.0, 5250.0, 2316.0, 1138.0, 641.0, 360.0, 215.0, 127.0, 90.0, 59.0, 57.0, 26.0, 17.0, 10.0, 10.0, 12.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.560546875, -2.477996826171875, -2.39544677734375, -2.312896728515625, -2.2303466796875, -2.147796630859375, -2.06524658203125, -1.982696533203125, -1.900146484375, -1.817596435546875, -1.73504638671875, -1.652496337890625, -1.5699462890625, -1.487396240234375, -1.40484619140625, -1.322296142578125, -1.23974609375, -1.157196044921875, -1.07464599609375, -0.992095947265625, -0.9095458984375, -0.826995849609375, -0.74444580078125, -0.661895751953125, -0.579345703125, -0.496795654296875, -0.41424560546875, -0.331695556640625, -0.2491455078125, -0.166595458984375, -0.08404541015625, -0.001495361328125, 0.0810546875, 0.163604736328125, 0.24615478515625, 0.328704833984375, 0.4112548828125, 0.493804931640625, 0.57635498046875, 0.658905029296875, 0.741455078125, 0.824005126953125, 0.90655517578125, 0.989105224609375, 1.0716552734375, 1.154205322265625, 1.23675537109375, 1.319305419921875, 1.40185546875, 1.484405517578125, 1.56695556640625, 1.649505615234375, 1.7320556640625, 1.814605712890625, 1.89715576171875, 1.979705810546875, 2.062255859375, 2.144805908203125, 2.22735595703125, 2.309906005859375, 2.3924560546875, 2.475006103515625, 2.55755615234375, 2.640106201171875, 2.72265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 6.0, 12.0, 4.0, 13.0, 11.0, 23.0, 21.0, 25.0, 41.0, 55.0, 79.0, 131.0, 453.0, 2276.0, 495.0, 179.0, 79.0, 42.0, 26.0, 24.0, 14.0, 11.0, 3.0, 11.0, 9.0, 6.0, 4.0, 3.0, 5.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.454345703125, -0.4415168762207031, -0.42868804931640625, -0.4158592224121094, -0.4030303955078125, -0.3902015686035156, -0.37737274169921875, -0.3645439147949219, -0.351715087890625, -0.3388862609863281, -0.32605743408203125, -0.3132286071777344, -0.3003997802734375, -0.2875709533691406, -0.27474212646484375, -0.2619132995605469, -0.24908447265625, -0.23625564575195312, -0.22342681884765625, -0.21059799194335938, -0.1977691650390625, -0.18494033813476562, -0.17211151123046875, -0.15928268432617188, -0.146453857421875, -0.13362503051757812, -0.12079620361328125, -0.10796737670898438, -0.0951385498046875, -0.08230972290039062, -0.06948089599609375, -0.056652069091796875, -0.0438232421875, -0.030994415283203125, -0.01816558837890625, -0.005336761474609375, 0.0074920654296875, 0.020320892333984375, 0.03314971923828125, 0.045978546142578125, 0.058807373046875, 0.07163619995117188, 0.08446502685546875, 0.09729385375976562, 0.1101226806640625, 0.12295150756835938, 0.13578033447265625, 0.14860916137695312, 0.16143798828125, 0.17426681518554688, 0.18709564208984375, 0.19992446899414062, 0.2127532958984375, 0.22558212280273438, 0.23841094970703125, 0.2512397766113281, 0.264068603515625, 0.2768974304199219, 0.28972625732421875, 0.3025550842285156, 0.3153839111328125, 0.3282127380371094, 0.34104156494140625, 0.3538703918457031, 0.36669921875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 16.0, 42.0, 130.0, 541.0, 195.0, 51.0, 16.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.680316925048828, -8.489845275878906, -8.299373626708984, -8.108901023864746, -7.918429374694824, -7.727957725524902, -7.5374860763549805, -7.3470139503479, -7.15654182434082, -6.966070175170898, -6.775598049163818, -6.5851263999938965, -6.394654273986816, -6.2041826248168945, -6.013710975646973, -5.823238849639893, -5.632767200469971, -5.442295551300049, -5.251823425292969, -5.061351776123047, -4.870879650115967, -4.680408000946045, -4.489935874938965, -4.299464225769043, -4.108992576599121, -3.91852068901062, -3.728048801422119, -3.5375771522521973, -3.347105026245117, -3.1566333770751953, -2.9661614894866943, -2.7756896018981934, -2.585216999053955, -2.394745111465454, -2.204273223876953, -2.0138015747070312, -1.8233295679092407, -1.6328576803207397, -1.4423859119415283, -1.2519140243530273, -1.0614421367645264, -0.8709702491760254, -0.6804984211921692, -0.490026593208313, -0.299554705619812, -0.10908281803131104, 0.08138895034790039, 0.27186083793640137, 0.46233272552490234, 0.6528046131134033, 0.8432764410972595, 1.0337482690811157, 1.2242201566696167, 1.4146920442581177, 1.605163812637329, 1.79563570022583, 1.986107587814331, 2.176579475402832, 2.367051362991333, 2.557523250579834, 2.747994899749756, 2.938467025756836, 3.128938674926758, 3.319410562515259, 3.5098824501037598]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 9.0, 14.0, 19.0, 27.0, 32.0, 48.0, 52.0, 68.0, 75.0, 92.0, 68.0, 90.0, 68.0, 82.0, 44.0, 44.0, 41.0, 31.0, 27.0, 16.0, 7.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1098408699035645, -2.0354013442993164, -1.960961937904358, -1.8865225315093994, -1.8120830059051514, -1.7376435995101929, -1.6632041931152344, -1.5887646675109863, -1.5143252611160278, -1.4398858547210693, -1.3654463291168213, -1.2910069227218628, -1.2165675163269043, -1.1421279907226562, -1.0676885843276978, -0.9932491183280945, -0.9188096523284912, -0.8443701863288879, -0.7699307203292847, -0.6954913139343262, -0.6210518479347229, -0.5466123819351196, -0.47217294573783875, -0.39773350954055786, -0.3232940435409546, -0.2488545924425125, -0.17441514134407043, -0.09997569024562836, -0.02553623914718628, 0.04890322685241699, 0.12334266304969788, 0.19778209924697876, 0.27222156524658203, 0.3466610312461853, 0.4211004674434662, 0.49553990364074707, 0.5699793696403503, 0.6444188356399536, 0.7188582420349121, 0.7932977080345154, 0.8677371740341187, 0.9421766400337219, 1.0166161060333252, 1.0910555124282837, 1.1654949188232422, 1.2399344444274902, 1.3143738508224487, 1.3888132572174072, 1.4632527828216553, 1.5376921892166138, 1.6121317148208618, 1.6865711212158203, 1.7610106468200684, 1.8354500532150269, 1.9098894596099854, 1.9843289852142334, 2.0587682723999023, 2.1332077980041504, 2.2076470851898193, 2.2820866107940674, 2.3565261363983154, 2.4309654235839844, 2.5054049491882324, 2.5798444747924805, 2.6542840003967285]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 7.0, 5.0, 15.0, 17.0, 24.0, 28.0, 39.0, 50.0, 70.0, 148.0, 204.0, 289.0, 473.0, 779.0, 1434.0, 2435.0, 4983.0, 11314.0, 32660.0, 161974.0, 690323.0, 98944.0, 24133.0, 8991.0, 3970.0, 2107.0, 1145.0, 718.0, 451.0, 269.0, 167.0, 117.0, 78.0, 55.0, 42.0, 25.0, 19.0, 15.0, 11.0, 8.0, 5.0, 8.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.82421875, -1.76416015625, -1.7041015625, -1.64404296875, -1.583984375, -1.52392578125, -1.4638671875, -1.40380859375, -1.34375, -1.28369140625, -1.2236328125, -1.16357421875, -1.103515625, -1.04345703125, -0.9833984375, -0.92333984375, -0.86328125, -0.80322265625, -0.7431640625, -0.68310546875, -0.623046875, -0.56298828125, -0.5029296875, -0.44287109375, -0.3828125, -0.32275390625, -0.2626953125, -0.20263671875, -0.142578125, -0.08251953125, -0.0224609375, 0.03759765625, 0.09765625, 0.15771484375, 0.2177734375, 0.27783203125, 0.337890625, 0.39794921875, 0.4580078125, 0.51806640625, 0.578125, 0.63818359375, 0.6982421875, 0.75830078125, 0.818359375, 0.87841796875, 0.9384765625, 0.99853515625, 1.05859375, 1.11865234375, 1.1787109375, 1.23876953125, 1.298828125, 1.35888671875, 1.4189453125, 1.47900390625, 1.5390625, 1.59912109375, 1.6591796875, 1.71923828125, 1.779296875, 1.83935546875, 1.8994140625, 1.95947265625, 2.01953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 6.0, 2.0, 0.0, 4.0, 4.0, 3.0, 10.0, 10.0, 6.0, 10.0, 15.0, 20.0, 29.0, 43.0, 52.0, 68.0, 87.0, 70.0, 93.0, 73.0, 78.0, 70.0, 57.0, 39.0, 32.0, 25.0, 17.0, 12.0, 14.0, 11.0, 6.0, 7.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.159423828125, -0.15482330322265625, -0.1502227783203125, -0.14562225341796875, -0.141021728515625, -0.13642120361328125, -0.1318206787109375, -0.12722015380859375, -0.12261962890625, -0.11801910400390625, -0.1134185791015625, -0.10881805419921875, -0.104217529296875, -0.09961700439453125, -0.0950164794921875, -0.09041595458984375, -0.0858154296875, -0.08121490478515625, -0.0766143798828125, -0.07201385498046875, -0.067413330078125, -0.06281280517578125, -0.0582122802734375, -0.05361175537109375, -0.04901123046875, -0.04441070556640625, -0.0398101806640625, -0.03520965576171875, -0.030609130859375, -0.02600860595703125, -0.0214080810546875, -0.01680755615234375, -0.01220703125, -0.00760650634765625, -0.0030059814453125, 0.00159454345703125, 0.006195068359375, 0.01079559326171875, 0.0153961181640625, 0.01999664306640625, 0.02459716796875, 0.02919769287109375, 0.0337982177734375, 0.03839874267578125, 0.042999267578125, 0.04759979248046875, 0.0522003173828125, 0.05680084228515625, 0.0614013671875, 0.06600189208984375, 0.0706024169921875, 0.07520294189453125, 0.079803466796875, 0.08440399169921875, 0.0890045166015625, 0.09360504150390625, 0.09820556640625, 0.10280609130859375, 0.1074066162109375, 0.11200714111328125, 0.116607666015625, 0.12120819091796875, 0.1258087158203125, 0.13040924072265625, 0.135009765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 10.0, 12.0, 13.0, 23.0, 29.0, 133.0, 945.0, 24692.0, 1007809.0, 13958.0, 691.0, 117.0, 35.0, 22.0, 11.0, 12.0, 4.0, 2.0, 7.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.9453125, -5.75, -5.5546875, -5.359375, -5.1640625, -4.96875, -4.7734375, -4.578125, -4.3828125, -4.1875, -3.9921875, -3.796875, -3.6015625, -3.40625, -3.2109375, -3.015625, -2.8203125, -2.625, -2.4296875, -2.234375, -2.0390625, -1.84375, -1.6484375, -1.453125, -1.2578125, -1.0625, -0.8671875, -0.671875, -0.4765625, -0.28125, -0.0859375, 0.109375, 0.3046875, 0.5, 0.6953125, 0.890625, 1.0859375, 1.28125, 1.4765625, 1.671875, 1.8671875, 2.0625, 2.2578125, 2.453125, 2.6484375, 2.84375, 3.0390625, 3.234375, 3.4296875, 3.625, 3.8203125, 4.015625, 4.2109375, 4.40625, 4.6015625, 4.796875, 4.9921875, 5.1875, 5.3828125, 5.578125, 5.7734375, 5.96875, 6.1640625, 6.359375, 6.5546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 12.0, 13.0, 7.0, 25.0, 15.0, 37.0, 28.0, 33.0, 43.0, 33.0, 41.0, 47.0, 46.0, 36.0, 50.0, 51.0, 67.0, 42.0, 48.0, 50.0, 33.0, 35.0, 24.0, 24.0, 22.0, 23.0, 22.0, 11.0, 15.0, 11.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0], "bins": [-0.9033203125, -0.88031005859375, -0.8572998046875, -0.83428955078125, -0.811279296875, -0.78826904296875, -0.7652587890625, -0.74224853515625, -0.71923828125, -0.69622802734375, -0.6732177734375, -0.65020751953125, -0.627197265625, -0.60418701171875, -0.5811767578125, -0.55816650390625, -0.53515625, -0.51214599609375, -0.4891357421875, -0.46612548828125, -0.443115234375, -0.42010498046875, -0.3970947265625, -0.37408447265625, -0.35107421875, -0.32806396484375, -0.3050537109375, -0.28204345703125, -0.259033203125, -0.23602294921875, -0.2130126953125, -0.19000244140625, -0.1669921875, -0.14398193359375, -0.1209716796875, -0.09796142578125, -0.074951171875, -0.05194091796875, -0.0289306640625, -0.00592041015625, 0.01708984375, 0.04010009765625, 0.0631103515625, 0.08612060546875, 0.109130859375, 0.13214111328125, 0.1551513671875, 0.17816162109375, 0.201171875, 0.22418212890625, 0.2471923828125, 0.27020263671875, 0.293212890625, 0.31622314453125, 0.3392333984375, 0.36224365234375, 0.38525390625, 0.40826416015625, 0.4312744140625, 0.45428466796875, 0.477294921875, 0.50030517578125, 0.5233154296875, 0.54632568359375, 0.5693359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 5.0, 10.0, 13.0, 16.0, 25.0, 31.0, 43.0, 65.0, 133.0, 236.0, 533.0, 1653.0, 8190.0, 807493.0, 222122.0, 5743.0, 1304.0, 435.0, 190.0, 97.0, 55.0, 37.0, 31.0, 20.0, 8.0, 9.0, 18.0, 4.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20794677734375, -5.0447998046875, -4.88165283203125, -4.718505859375, -4.55535888671875, -4.3922119140625, -4.22906494140625, -4.06591796875, -3.90277099609375, -3.7396240234375, -3.57647705078125, -3.413330078125, -3.25018310546875, -3.0870361328125, -2.92388916015625, -2.7607421875, -2.59759521484375, -2.4344482421875, -2.27130126953125, -2.108154296875, -1.94500732421875, -1.7818603515625, -1.61871337890625, -1.45556640625, -1.29241943359375, -1.1292724609375, -0.96612548828125, -0.802978515625, -0.63983154296875, -0.4766845703125, -0.31353759765625, -0.150390625, 0.01275634765625, 0.1759033203125, 0.33905029296875, 0.502197265625, 0.66534423828125, 0.8284912109375, 0.99163818359375, 1.15478515625, 1.31793212890625, 1.4810791015625, 1.64422607421875, 1.807373046875, 1.97052001953125, 2.1336669921875, 2.29681396484375, 2.4599609375, 2.62310791015625, 2.7862548828125, 2.94940185546875, 3.112548828125, 3.27569580078125, 3.4388427734375, 3.60198974609375, 3.76513671875, 3.92828369140625, 4.0914306640625, 4.25457763671875, 4.417724609375, 4.58087158203125, 4.7440185546875, 4.90716552734375, 5.0703125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 3.0, 2.0, 8.0, 6.0, 11.0, 12.0, 23.0, 37.0, 57.0, 133.0, 290.0, 184.0, 84.0, 35.0, 20.0, 21.0, 9.0, 9.0, 18.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018548965454101562, -0.0017855316400527954, -0.0017161667346954346, -0.0016468018293380737, -0.0015774369239807129, -0.001508072018623352, -0.0014387071132659912, -0.0013693422079086304, -0.0012999773025512695, -0.0012306123971939087, -0.0011612474918365479, -0.001091882586479187, -0.0010225176811218262, -0.0009531527757644653, -0.0008837878704071045, -0.0008144229650497437, -0.0007450580596923828, -0.000675693154335022, -0.0006063282489776611, -0.0005369633436203003, -0.00046759843826293945, -0.0003982335329055786, -0.0003288686275482178, -0.00025950372219085693, -0.0001901388168334961, -0.00012077391147613525, -5.1409006118774414e-05, 1.7955899238586426e-05, 8.732080459594727e-05, 0.0001566857099533081, 0.00022605061531066895, 0.0002954155206680298, 0.0003647804260253906, 0.00043414533138275146, 0.0005035102367401123, 0.0005728751420974731, 0.000642240047454834, 0.0007116049528121948, 0.0007809698581695557, 0.0008503347635269165, 0.0009196996688842773, 0.0009890645742416382, 0.001058429479598999, 0.0011277943849563599, 0.0011971592903137207, 0.0012665241956710815, 0.0013358891010284424, 0.0014052540063858032, 0.001474618911743164, 0.001543983817100525, 0.0016133487224578857, 0.0016827136278152466, 0.0017520785331726074, 0.0018214434385299683, 0.001890808343887329, 0.00196017324924469, 0.0020295381546020508, 0.0020989030599594116, 0.0021682679653167725, 0.0022376328706741333, 0.002306997776031494, 0.002376362681388855, 0.002445727586746216, 0.0025150924921035767, 0.0025844573974609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 8.0, 11.0, 21.0, 16.0, 41.0, 59.0, 78.0, 143.0, 219.0, 372.0, 634.0, 1233.0, 2322.0, 5133.0, 15355.0, 111460.0, 843151.0, 49504.0, 10599.0, 3977.0, 1899.0, 1001.0, 539.0, 288.0, 172.0, 103.0, 69.0, 39.0, 32.0, 23.0, 13.0, 14.0, 9.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.5921630859375, -2.500732421875, -2.4093017578125, -2.31787109375, -2.2264404296875, -2.135009765625, -2.0435791015625, -1.9521484375, -1.8607177734375, -1.769287109375, -1.6778564453125, -1.58642578125, -1.4949951171875, -1.403564453125, -1.3121337890625, -1.220703125, -1.1292724609375, -1.037841796875, -0.9464111328125, -0.85498046875, -0.7635498046875, -0.672119140625, -0.5806884765625, -0.4892578125, -0.3978271484375, -0.306396484375, -0.2149658203125, -0.12353515625, -0.0321044921875, 0.059326171875, 0.1507568359375, 0.2421875, 0.3336181640625, 0.425048828125, 0.5164794921875, 0.60791015625, 0.6993408203125, 0.790771484375, 0.8822021484375, 0.9736328125, 1.0650634765625, 1.156494140625, 1.2479248046875, 1.33935546875, 1.4307861328125, 1.522216796875, 1.6136474609375, 1.705078125, 1.7965087890625, 1.887939453125, 1.9793701171875, 2.07080078125, 2.1622314453125, 2.253662109375, 2.3450927734375, 2.4365234375, 2.5279541015625, 2.619384765625, 2.7108154296875, 2.80224609375, 2.8936767578125, 2.985107421875, 3.0765380859375, 3.16796875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 10.0, 1.0, 8.0, 16.0, 19.0, 32.0, 53.0, 80.0, 135.0, 170.0, 142.0, 132.0, 64.0, 52.0, 26.0, 17.0, 8.0, 8.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.1249237060546875, -2.064300537109375, -2.0036773681640625, -1.94305419921875, -1.8824310302734375, -1.821807861328125, -1.7611846923828125, -1.7005615234375, -1.6399383544921875, -1.579315185546875, -1.5186920166015625, -1.45806884765625, -1.3974456787109375, -1.336822509765625, -1.2761993408203125, -1.215576171875, -1.1549530029296875, -1.094329833984375, -1.0337066650390625, -0.97308349609375, -0.9124603271484375, -0.851837158203125, -0.7912139892578125, -0.7305908203125, -0.6699676513671875, -0.609344482421875, -0.5487213134765625, -0.48809814453125, -0.4274749755859375, -0.366851806640625, -0.3062286376953125, -0.24560546875, -0.1849822998046875, -0.124359130859375, -0.0637359619140625, -0.00311279296875, 0.0575103759765625, 0.118133544921875, 0.1787567138671875, 0.2393798828125, 0.3000030517578125, 0.360626220703125, 0.4212493896484375, 0.48187255859375, 0.5424957275390625, 0.603118896484375, 0.6637420654296875, 0.724365234375, 0.7849884033203125, 0.845611572265625, 0.9062347412109375, 0.96685791015625, 1.0274810791015625, 1.088104248046875, 1.1487274169921875, 1.2093505859375, 1.2699737548828125, 1.330596923828125, 1.3912200927734375, 1.45184326171875, 1.5124664306640625, 1.573089599609375, 1.6337127685546875, 1.6943359375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 8.0, 13.0, 22.0, 49.0, 175.0, 372.0, 213.0, 86.0, 32.0, 16.0, 7.0, 8.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.590793132781982, -7.1330366134643555, -6.67527961730957, -6.217523097991943, -5.759766101837158, -5.302009582519531, -4.844252586364746, -4.386496067047119, -3.928739309310913, -3.470982551574707, -3.013225793838501, -2.555469036102295, -2.097712516784668, -1.639955759048462, -1.1821990013122559, -0.7244422435760498, -0.26668548583984375, 0.19107124209403992, 0.6488279700279236, 1.1065846681594849, 1.564341425895691, 2.0220980644226074, 2.4798548221588135, 2.9376115798950195, 3.3953683376312256, 3.8531250953674316, 4.310881614685059, 4.768638610839844, 5.226395130157471, 5.684151649475098, 6.141908645629883, 6.599665641784668, 7.057421684265137, 7.515178203582764, 7.972935199737549, 8.430691719055176, 8.888448715209961, 9.34620475769043, 9.803961753845215, 10.26171875, 10.719475746154785, 11.17723274230957, 11.634988784790039, 12.092745780944824, 12.55050277709961, 13.008258819580078, 13.466015815734863, 13.923772811889648, 14.381528854370117, 14.839285850524902, 15.297041893005371, 15.754798889160156, 16.212554931640625, 16.670312881469727, 17.128068923950195, 17.585826873779297, 18.043582916259766, 18.501338958740234, 18.959096908569336, 19.416852951049805, 19.874608993530273, 20.332366943359375, 20.790122985839844, 21.247879028320312, 21.705636978149414]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 11.0, 13.0, 15.0, 21.0, 27.0, 35.0, 46.0, 59.0, 58.0, 84.0, 92.0, 109.0, 74.0, 76.0, 64.0, 46.0, 48.0, 31.0, 21.0, 12.0, 10.0, 13.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.553495407104492, -8.272271156311035, -7.9910478591918945, -7.7098236083984375, -7.428599834442139, -7.14737606048584, -6.866152286529541, -6.584928512573242, -6.303704261779785, -6.022480487823486, -5.7412567138671875, -5.4600324630737305, -5.178808689117432, -4.897584915161133, -4.616361141204834, -4.335137367248535, -4.053913593292236, -3.7726898193359375, -3.4914658069610596, -3.2102420330047607, -2.929018020629883, -2.647794246673584, -2.366570472717285, -2.0853466987609863, -1.8041226863861084, -1.52289879322052, -1.2416749000549316, -0.9604511260986328, -0.6792272329330444, -0.39800333976745605, -0.11677956581115723, 0.16444432735443115, 0.44566822052001953, 0.7268921136856079, 1.0081160068511963, 1.2893397808074951, 1.5705636739730835, 1.8517875671386719, 2.1330113410949707, 2.4142351150512695, 2.6954591274261475, 2.9766829013824463, 3.257906913757324, 3.539130687713623, 3.820354461669922, 4.101578712463379, 4.3828020095825195, 4.664026260375977, 4.945250034332275, 5.226473808288574, 5.507697582244873, 5.788921356201172, 6.070145606994629, 6.351369380950928, 6.632593154907227, 6.913816928863525, 7.195040702819824, 7.476264476776123, 7.757488250732422, 8.038712501525879, 8.31993579864502, 8.601160049438477, 8.882383346557617, 9.163607597351074, 9.444831848144531]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 6.0, 8.0, 14.0, 14.0, 21.0, 47.0, 53.0, 88.0, 144.0, 189.0, 348.0, 547.0, 1100.0, 2085.0, 4326.0, 12173.0, 50679.0, 3825315.0, 258959.0, 23728.0, 7656.0, 3055.0, 1653.0, 887.0, 462.0, 274.0, 151.0, 94.0, 64.0, 49.0, 25.0, 18.0, 19.0, 11.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.15234375, -5.02899169921875, -4.9056396484375, -4.78228759765625, -4.658935546875, -4.53558349609375, -4.4122314453125, -4.28887939453125, -4.16552734375, -4.04217529296875, -3.9188232421875, -3.79547119140625, -3.672119140625, -3.54876708984375, -3.4254150390625, -3.30206298828125, -3.1787109375, -3.05535888671875, -2.9320068359375, -2.80865478515625, -2.685302734375, -2.56195068359375, -2.4385986328125, -2.31524658203125, -2.19189453125, -2.06854248046875, -1.9451904296875, -1.82183837890625, -1.698486328125, -1.57513427734375, -1.4517822265625, -1.32843017578125, -1.205078125, -1.08172607421875, -0.9583740234375, -0.83502197265625, -0.711669921875, -0.58831787109375, -0.4649658203125, -0.34161376953125, -0.21826171875, -0.09490966796875, 0.0284423828125, 0.15179443359375, 0.275146484375, 0.39849853515625, 0.5218505859375, 0.64520263671875, 0.7685546875, 0.89190673828125, 1.0152587890625, 1.13861083984375, 1.261962890625, 1.38531494140625, 1.5086669921875, 1.63201904296875, 1.75537109375, 1.87872314453125, 2.0020751953125, 2.12542724609375, 2.248779296875, 2.37213134765625, 2.4954833984375, 2.61883544921875, 2.7421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 5.0, 10.0, 8.0, 11.0, 10.0, 17.0, 28.0, 29.0, 56.0, 55.0, 61.0, 74.0, 88.0, 78.0, 77.0, 81.0, 66.0, 45.0, 39.0, 49.0, 24.0, 14.0, 15.0, 9.0, 6.0, 15.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1754150390625, -0.1701812744140625, -0.164947509765625, -0.1597137451171875, -0.15447998046875, -0.1492462158203125, -0.144012451171875, -0.1387786865234375, -0.133544921875, -0.1283111572265625, -0.123077392578125, -0.1178436279296875, -0.11260986328125, -0.1073760986328125, -0.102142333984375, -0.0969085693359375, -0.0916748046875, -0.0864410400390625, -0.081207275390625, -0.0759735107421875, -0.07073974609375, -0.0655059814453125, -0.060272216796875, -0.0550384521484375, -0.0498046875, -0.0445709228515625, -0.039337158203125, -0.0341033935546875, -0.02886962890625, -0.0236358642578125, -0.018402099609375, -0.0131683349609375, -0.0079345703125, -0.0027008056640625, 0.002532958984375, 0.0077667236328125, 0.01300048828125, 0.0182342529296875, 0.023468017578125, 0.0287017822265625, 0.033935546875, 0.0391693115234375, 0.044403076171875, 0.0496368408203125, 0.05487060546875, 0.0601043701171875, 0.065338134765625, 0.0705718994140625, 0.0758056640625, 0.0810394287109375, 0.086273193359375, 0.0915069580078125, 0.09674072265625, 0.1019744873046875, 0.107208251953125, 0.1124420166015625, 0.11767578125, 0.1229095458984375, 0.128143310546875, 0.1333770751953125, 0.13861083984375, 0.1438446044921875, 0.149078369140625, 0.1543121337890625, 0.1595458984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 0.0, 4.0, 8.0, 15.0, 34.0, 62.0, 403.0, 3488.0, 300876.0, 3882912.0, 5669.0, 584.0, 120.0, 38.0, 33.0, 13.0, 13.0, 7.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.67578125, -6.40972900390625, -6.1436767578125, -5.87762451171875, -5.611572265625, -5.34552001953125, -5.0794677734375, -4.81341552734375, -4.54736328125, -4.28131103515625, -4.0152587890625, -3.74920654296875, -3.483154296875, -3.21710205078125, -2.9510498046875, -2.68499755859375, -2.4189453125, -2.15289306640625, -1.8868408203125, -1.62078857421875, -1.354736328125, -1.08868408203125, -0.8226318359375, -0.55657958984375, -0.29052734375, -0.02447509765625, 0.2415771484375, 0.50762939453125, 0.773681640625, 1.03973388671875, 1.3057861328125, 1.57183837890625, 1.837890625, 2.10394287109375, 2.3699951171875, 2.63604736328125, 2.902099609375, 3.16815185546875, 3.4342041015625, 3.70025634765625, 3.96630859375, 4.23236083984375, 4.4984130859375, 4.76446533203125, 5.030517578125, 5.29656982421875, 5.5626220703125, 5.82867431640625, 6.0947265625, 6.36077880859375, 6.6268310546875, 6.89288330078125, 7.158935546875, 7.42498779296875, 7.6910400390625, 7.95709228515625, 8.22314453125, 8.48919677734375, 8.7552490234375, 9.02130126953125, 9.287353515625, 9.55340576171875, 9.8194580078125, 10.08551025390625, 10.3515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 8.0, 12.0, 6.0, 12.0, 18.0, 21.0, 20.0, 35.0, 49.0, 113.0, 146.0, 362.0, 1411.0, 1106.0, 327.0, 152.0, 88.0, 51.0, 33.0, 31.0, 20.0, 10.0, 9.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.33568572998046875, -0.3227386474609375, -0.30979156494140625, -0.296844482421875, -0.28389739990234375, -0.2709503173828125, -0.25800323486328125, -0.24505615234375, -0.23210906982421875, -0.2191619873046875, -0.20621490478515625, -0.193267822265625, -0.18032073974609375, -0.1673736572265625, -0.15442657470703125, -0.1414794921875, -0.12853240966796875, -0.1155853271484375, -0.10263824462890625, -0.089691162109375, -0.07674407958984375, -0.0637969970703125, -0.05084991455078125, -0.03790283203125, -0.02495574951171875, -0.0120086669921875, 0.00093841552734375, 0.013885498046875, 0.02683258056640625, 0.0397796630859375, 0.05272674560546875, 0.065673828125, 0.07862091064453125, 0.0915679931640625, 0.10451507568359375, 0.117462158203125, 0.13040924072265625, 0.1433563232421875, 0.15630340576171875, 0.16925048828125, 0.18219757080078125, 0.1951446533203125, 0.20809173583984375, 0.221038818359375, 0.23398590087890625, 0.2469329833984375, 0.25988006591796875, 0.2728271484375, 0.28577423095703125, 0.2987213134765625, 0.31166839599609375, 0.324615478515625, 0.33756256103515625, 0.3505096435546875, 0.36345672607421875, 0.37640380859375, 0.38935089111328125, 0.4022979736328125, 0.41524505615234375, 0.428192138671875, 0.44113922119140625, 0.4540863037109375, 0.46703338623046875, 0.47998046875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 10.0, 66.0, 692.0, 220.0, 20.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.827644109725952, -2.412982940673828, -1.9983220100402832, -1.5836609601974487, -1.1689999103546143, -0.7543389797210693, -0.3396778106689453, 0.07498335838317871, 0.48964428901672363, 0.9043053388595581, 1.3189663887023926, 1.733627438545227, 2.1482884883880615, 2.5629494190216064, 2.9776105880737305, 3.3922717571258545, 3.8069326877593994, 4.221593856811523, 4.636254787445068, 5.050915718078613, 5.465577125549316, 5.880237579345703, 6.294898986816406, 6.709560394287109, 7.124220848083496, 7.538881778717041, 7.953542709350586, 8.368204116821289, 8.782865524291992, 9.197525978088379, 9.612187385559082, 10.026847839355469, 10.441509246826172, 10.856170654296875, 11.270831108093262, 11.685492515563965, 12.100152969360352, 12.514814376831055, 12.929475784301758, 13.344137191772461, 13.758797645568848, 14.17345905303955, 14.588119506835938, 15.00278091430664, 15.417442321777344, 15.83210277557373, 16.246763229370117, 16.66142463684082, 17.076086044311523, 17.490747451782227, 17.90540885925293, 18.320068359375, 18.734729766845703, 19.149391174316406, 19.56405258178711, 19.978713989257812, 20.393375396728516, 20.80803680419922, 21.222698211669922, 21.637357711791992, 22.052019119262695, 22.4666805267334, 22.8813419342041, 23.296003341674805, 23.710662841796875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 11.0, 25.0, 48.0, 62.0, 82.0, 140.0, 181.0, 148.0, 131.0, 81.0, 48.0, 21.0, 19.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7780542373657227, -1.6003694534301758, -1.4226845502853394, -1.244999647140503, -1.067314863204956, -0.8896300196647644, -0.7119451761245728, -0.5342602729797363, -0.35657548904418945, -0.1788906455039978, -0.0012058019638061523, 0.1764790415763855, 0.35416388511657715, 0.5318487286567688, 0.7095335721969604, 0.8872184753417969, 1.0649032592773438, 1.2425880432128906, 1.420272946357727, 1.5979578495025635, 1.7756426334381104, 1.9533274173736572, 2.131012439727783, 2.30869722366333, 2.486382007598877, 2.664066791534424, 2.8417515754699707, 3.0194365978240967, 3.1971213817596436, 3.3748061656951904, 3.5524911880493164, 3.7301759719848633, 3.90786075592041, 4.085545539855957, 4.263230323791504, 4.440915107727051, 4.618599891662598, 4.796285152435303, 4.97396993637085, 5.1516547203063965, 5.329339504241943, 5.50702428817749, 5.684709072113037, 5.862393856048584, 6.040079116821289, 6.217763900756836, 6.395448684692383, 6.57313346862793, 6.750818252563477, 6.928503036499023, 7.10618782043457, 7.283872604370117, 7.461557388305664, 7.639242649078369, 7.816927433013916, 7.994612216949463, 8.172296524047852, 8.349981307983398, 8.527666091918945, 8.705350875854492, 8.883035659790039, 9.060720443725586, 9.238405227661133, 9.41609001159668, 9.593775749206543]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 7.0, 10.0, 10.0, 12.0, 18.0, 21.0, 32.0, 40.0, 50.0, 48.0, 57.0, 81.0, 186.0, 293550.0, 753848.0, 234.0, 69.0, 55.0, 32.0, 34.0, 26.0, 23.0, 21.0, 16.0, 18.0, 14.0, 5.0, 7.0, 10.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9375, -11.47900390625, -11.0205078125, -10.56201171875, -10.103515625, -9.64501953125, -9.1865234375, -8.72802734375, -8.26953125, -7.81103515625, -7.3525390625, -6.89404296875, -6.435546875, -5.97705078125, -5.5185546875, -5.06005859375, -4.6015625, -4.14306640625, -3.6845703125, -3.22607421875, -2.767578125, -2.30908203125, -1.8505859375, -1.39208984375, -0.93359375, -0.47509765625, -0.0166015625, 0.44189453125, 0.900390625, 1.35888671875, 1.8173828125, 2.27587890625, 2.734375, 3.19287109375, 3.6513671875, 4.10986328125, 4.568359375, 5.02685546875, 5.4853515625, 5.94384765625, 6.40234375, 6.86083984375, 7.3193359375, 7.77783203125, 8.236328125, 8.69482421875, 9.1533203125, 9.61181640625, 10.0703125, 10.52880859375, 10.9873046875, 11.44580078125, 11.904296875, 12.36279296875, 12.8212890625, 13.27978515625, 13.73828125, 14.19677734375, 14.6552734375, 15.11376953125, 15.572265625, 16.03076171875, 16.4892578125, 16.94775390625, 17.40625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 45.0, 226.0, 435.0, 249.0, 56.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.1382617950439453, -0.09988784790039062, -0.06151390075683594, -0.02313995361328125, 0.015233993530273438, 0.053607940673828125, 0.09198188781738281, 0.1303558349609375, 0.1687297821044922, 0.20710372924804688, 0.24547767639160156, 0.28385162353515625, 0.32222557067871094, 0.3605995178222656, 0.3989734649658203, 0.437347412109375, 0.4757213592529297, 0.5140953063964844, 0.5524692535400391, 0.5908432006835938, 0.6292171478271484, 0.6675910949707031, 0.7059650421142578, 0.7443389892578125, 0.7827129364013672, 0.8210868835449219, 0.8594608306884766, 0.8978347778320312, 0.9362087249755859, 0.9745826721191406, 1.0129566192626953, 1.05133056640625, 1.0897045135498047, 1.1280784606933594, 1.166452407836914, 1.2048263549804688, 1.2432003021240234, 1.2815742492675781, 1.3199481964111328, 1.3583221435546875, 1.3966960906982422, 1.4350700378417969, 1.4734439849853516, 1.5118179321289062, 1.550191879272461, 1.5885658264160156, 1.6269397735595703, 1.665313720703125, 1.7036876678466797, 1.7420616149902344, 1.780435562133789, 1.8188095092773438, 1.8571834564208984, 1.8955574035644531, 1.9339313507080078, 1.9723052978515625, 2.010679244995117, 2.049053192138672, 2.0874271392822266, 2.1258010864257812, 2.164175033569336, 2.2025489807128906, 2.2409229278564453, 2.279296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 7.0, 7.0, 6.0, 9.0, 15.0, 19.0, 19.0, 31.0, 36.0, 63.0, 99.0, 110.0, 168.0, 283.0, 438.0, 704.0, 1265.0, 2243.0, 4437.0, 10097.0, 25799.0, 86444.0, 373431.0, 404032.0, 91283.0, 26961.0, 10205.0, 4542.0, 2432.0, 1231.0, 716.0, 441.0, 309.0, 197.0, 127.0, 91.0, 67.0, 49.0, 29.0, 29.0, 19.0, 14.0, 7.0, 11.0, 13.0, 3.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0234375, -1.96026611328125, -1.8970947265625, -1.83392333984375, -1.770751953125, -1.70758056640625, -1.6444091796875, -1.58123779296875, -1.51806640625, -1.45489501953125, -1.3917236328125, -1.32855224609375, -1.265380859375, -1.20220947265625, -1.1390380859375, -1.07586669921875, -1.0126953125, -0.94952392578125, -0.8863525390625, -0.82318115234375, -0.760009765625, -0.69683837890625, -0.6336669921875, -0.57049560546875, -0.50732421875, -0.44415283203125, -0.3809814453125, -0.31781005859375, -0.254638671875, -0.19146728515625, -0.1282958984375, -0.06512451171875, -0.001953125, 0.06121826171875, 0.1243896484375, 0.18756103515625, 0.250732421875, 0.31390380859375, 0.3770751953125, 0.44024658203125, 0.50341796875, 0.56658935546875, 0.6297607421875, 0.69293212890625, 0.756103515625, 0.81927490234375, 0.8824462890625, 0.94561767578125, 1.0087890625, 1.07196044921875, 1.1351318359375, 1.19830322265625, 1.261474609375, 1.32464599609375, 1.3878173828125, 1.45098876953125, 1.51416015625, 1.57733154296875, 1.6405029296875, 1.70367431640625, 1.766845703125, 1.83001708984375, 1.8931884765625, 1.95635986328125, 2.01953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 12.0, 13.0, 11.0, 11.0, 24.0, 31.0, 39.0, 37.0, 41.0, 49.0, 46.0, 56.0, 59.0, 73.0, 60.0, 66.0, 62.0, 49.0, 55.0, 42.0, 29.0, 25.0, 15.0, 21.0, 11.0, 7.0, 11.0, 9.0, 7.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.01171875, -1.9522857666015625, -1.892852783203125, -1.8334197998046875, -1.77398681640625, -1.7145538330078125, -1.655120849609375, -1.5956878662109375, -1.5362548828125, -1.4768218994140625, -1.417388916015625, -1.3579559326171875, -1.29852294921875, -1.2390899658203125, -1.179656982421875, -1.1202239990234375, -1.060791015625, -1.0013580322265625, -0.941925048828125, -0.8824920654296875, -0.82305908203125, -0.7636260986328125, -0.704193115234375, -0.6447601318359375, -0.5853271484375, -0.5258941650390625, -0.466461181640625, -0.4070281982421875, -0.34759521484375, -0.2881622314453125, -0.228729248046875, -0.1692962646484375, -0.10986328125, -0.0504302978515625, 0.009002685546875, 0.0684356689453125, 0.12786865234375, 0.1873016357421875, 0.246734619140625, 0.3061676025390625, 0.3656005859375, 0.4250335693359375, 0.484466552734375, 0.5438995361328125, 0.60333251953125, 0.6627655029296875, 0.722198486328125, 0.7816314697265625, 0.841064453125, 0.9004974365234375, 0.959930419921875, 1.0193634033203125, 1.07879638671875, 1.1382293701171875, 1.197662353515625, 1.2570953369140625, 1.3165283203125, 1.3759613037109375, 1.435394287109375, 1.4948272705078125, 1.55426025390625, 1.6136932373046875, 1.673126220703125, 1.7325592041015625, 1.7919921875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 10.0, 4.0, 8.0, 23.0, 34.0, 50.0, 49.0, 92.0, 163.0, 233.0, 423.0, 760.0, 1554.0, 3917.0, 12136.0, 65555.0, 627940.0, 292005.0, 30765.0, 7526.0, 2658.0, 1158.0, 604.0, 327.0, 216.0, 108.0, 70.0, 44.0, 38.0, 27.0, 19.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-2.87109375, -2.7971038818359375, -2.723114013671875, -2.6491241455078125, -2.57513427734375, -2.5011444091796875, -2.427154541015625, -2.3531646728515625, -2.2791748046875, -2.2051849365234375, -2.131195068359375, -2.0572052001953125, -1.98321533203125, -1.9092254638671875, -1.835235595703125, -1.7612457275390625, -1.687255859375, -1.6132659912109375, -1.539276123046875, -1.4652862548828125, -1.39129638671875, -1.3173065185546875, -1.243316650390625, -1.1693267822265625, -1.0953369140625, -1.0213470458984375, -0.947357177734375, -0.8733673095703125, -0.79937744140625, -0.7253875732421875, -0.651397705078125, -0.5774078369140625, -0.50341796875, -0.4294281005859375, -0.355438232421875, -0.2814483642578125, -0.20745849609375, -0.1334686279296875, -0.059478759765625, 0.0145111083984375, 0.0885009765625, 0.1624908447265625, 0.236480712890625, 0.3104705810546875, 0.38446044921875, 0.4584503173828125, 0.532440185546875, 0.6064300537109375, 0.680419921875, 0.7544097900390625, 0.828399658203125, 0.9023895263671875, 0.97637939453125, 1.0503692626953125, 1.124359130859375, 1.1983489990234375, 1.2723388671875, 1.3463287353515625, 1.420318603515625, 1.4943084716796875, 1.56829833984375, 1.6422882080078125, 1.716278076171875, 1.7902679443359375, 1.8642578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 5.0, 10.0, 20.0, 24.0, 38.0, 42.0, 86.0, 138.0, 142.0, 150.0, 112.0, 70.0, 38.0, 33.0, 24.0, 14.0, 9.0, 9.0, 3.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005331039428710938, -0.0005200505256652832, -0.0005069971084594727, -0.0004939436912536621, -0.00048089027404785156, -0.000467836856842041, -0.00045478343963623047, -0.0004417300224304199, -0.0004286766052246094, -0.00041562318801879883, -0.0004025697708129883, -0.00038951635360717773, -0.0003764629364013672, -0.00036340951919555664, -0.0003503561019897461, -0.00033730268478393555, -0.000324249267578125, -0.00031119585037231445, -0.0002981424331665039, -0.00028508901596069336, -0.0002720355987548828, -0.00025898218154907227, -0.0002459287643432617, -0.00023287534713745117, -0.00021982192993164062, -0.00020676851272583008, -0.00019371509552001953, -0.00018066167831420898, -0.00016760826110839844, -0.0001545548439025879, -0.00014150142669677734, -0.0001284480094909668, -0.00011539459228515625, -0.0001023411750793457, -8.928775787353516e-05, -7.623434066772461e-05, -6.318092346191406e-05, -5.0127506256103516e-05, -3.707408905029297e-05, -2.4020671844482422e-05, -1.0967254638671875e-05, 2.086162567138672e-06, 1.5139579772949219e-05, 2.8192996978759766e-05, 4.124641418457031e-05, 5.429983139038086e-05, 6.73532485961914e-05, 8.040666580200195e-05, 9.34600830078125e-05, 0.00010651350021362305, 0.0001195669174194336, 0.00013262033462524414, 0.0001456737518310547, 0.00015872716903686523, 0.00017178058624267578, 0.00018483400344848633, 0.00019788742065429688, 0.00021094083786010742, 0.00022399425506591797, 0.00023704767227172852, 0.00025010108947753906, 0.0002631545066833496, 0.00027620792388916016, 0.0002892613410949707, 0.00030231475830078125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 12.0, 24.0, 24.0, 35.0, 54.0, 73.0, 84.0, 127.0, 234.0, 400.0, 759.0, 1407.0, 3312.0, 9562.0, 74985.0, 861277.0, 80284.0, 9807.0, 3052.0, 1365.0, 658.0, 380.0, 227.0, 127.0, 90.0, 61.0, 33.0, 23.0, 23.0, 12.0, 6.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.203125, -4.081329345703125, -3.95953369140625, -3.837738037109375, -3.7159423828125, -3.594146728515625, -3.47235107421875, -3.350555419921875, -3.228759765625, -3.106964111328125, -2.98516845703125, -2.863372802734375, -2.7415771484375, -2.619781494140625, -2.49798583984375, -2.376190185546875, -2.25439453125, -2.132598876953125, -2.01080322265625, -1.889007568359375, -1.7672119140625, -1.645416259765625, -1.52362060546875, -1.401824951171875, -1.280029296875, -1.158233642578125, -1.03643798828125, -0.914642333984375, -0.7928466796875, -0.671051025390625, -0.54925537109375, -0.427459716796875, -0.3056640625, -0.183868408203125, -0.06207275390625, 0.059722900390625, 0.1815185546875, 0.303314208984375, 0.42510986328125, 0.546905517578125, 0.668701171875, 0.790496826171875, 0.91229248046875, 1.034088134765625, 1.1558837890625, 1.277679443359375, 1.39947509765625, 1.521270751953125, 1.64306640625, 1.764862060546875, 1.88665771484375, 2.008453369140625, 2.1302490234375, 2.252044677734375, 2.37384033203125, 2.495635986328125, 2.617431640625, 2.739227294921875, 2.86102294921875, 2.982818603515625, 3.1046142578125, 3.226409912109375, 3.34820556640625, 3.470001220703125, 3.591796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 8.0, 4.0, 3.0, 10.0, 21.0, 45.0, 119.0, 227.0, 249.0, 148.0, 83.0, 36.0, 11.0, 17.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.7265625, -3.633880615234375, -3.54119873046875, -3.448516845703125, -3.3558349609375, -3.263153076171875, -3.17047119140625, -3.077789306640625, -2.985107421875, -2.892425537109375, -2.79974365234375, -2.707061767578125, -2.6143798828125, -2.521697998046875, -2.42901611328125, -2.336334228515625, -2.24365234375, -2.150970458984375, -2.05828857421875, -1.965606689453125, -1.8729248046875, -1.780242919921875, -1.68756103515625, -1.594879150390625, -1.502197265625, -1.409515380859375, -1.31683349609375, -1.224151611328125, -1.1314697265625, -1.038787841796875, -0.94610595703125, -0.853424072265625, -0.7607421875, -0.668060302734375, -0.57537841796875, -0.482696533203125, -0.3900146484375, -0.297332763671875, -0.20465087890625, -0.111968994140625, -0.019287109375, 0.073394775390625, 0.16607666015625, 0.258758544921875, 0.3514404296875, 0.444122314453125, 0.53680419921875, 0.629486083984375, 0.72216796875, 0.814849853515625, 0.90753173828125, 1.000213623046875, 1.0928955078125, 1.185577392578125, 1.27825927734375, 1.370941162109375, 1.463623046875, 1.556304931640625, 1.64898681640625, 1.741668701171875, 1.8343505859375, 1.927032470703125, 2.01971435546875, 2.112396240234375, 2.205078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 14.0, 35.0, 108.0, 329.0, 315.0, 125.0, 40.0, 16.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.856868743896484, -19.95081901550293, -19.044771194458008, -18.138721466064453, -17.2326717376709, -16.326622009277344, -15.420574188232422, -14.514524459838867, -13.608474731445312, -12.702425956726074, -11.79637622833252, -10.890327453613281, -9.984277725219727, -9.078228950500488, -8.17218017578125, -7.266130447387695, -6.360081672668457, -5.4540324211120605, -4.547983169555664, -3.6419341564178467, -2.73588490486145, -1.8298358917236328, -0.9237866401672363, -0.017737388610839844, 0.8883118629455566, 1.7943611145019531, 2.7004103660583496, 3.606459379196167, 4.512508392333984, 5.418557643890381, 6.324606895446777, 7.230656147003174, 8.13670539855957, 9.042754173278809, 9.948803901672363, 10.854852676391602, 11.760902404785156, 12.666951179504395, 13.572999954223633, 14.479049682617188, 15.385099411010742, 16.291149139404297, 17.19719696044922, 18.103246688842773, 19.009296417236328, 19.91534423828125, 20.821393966674805, 21.72744369506836, 22.63349151611328, 23.539541244506836, 24.445589065551758, 25.351638793945312, 26.257688522338867, 27.163738250732422, 28.069786071777344, 28.9758358001709, 29.881885528564453, 30.787935256958008, 31.69398307800293, 32.600032806396484, 33.506080627441406, 34.412132263183594, 35.318180084228516, 36.22422790527344, 37.130279541015625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 12.0, 5.0, 9.0, 19.0, 17.0, 27.0, 33.0, 45.0, 44.0, 51.0, 64.0, 68.0, 77.0, 75.0, 52.0, 70.0, 54.0, 53.0, 51.0, 37.0, 36.0, 27.0, 18.0, 12.0, 14.0, 14.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.95705509185791, -12.511048316955566, -12.065042495727539, -11.619035720825195, -11.173028945922852, -10.727022171020508, -10.28101634979248, -9.835009574890137, -9.38900375366211, -8.942996978759766, -8.496991157531738, -8.050984382629395, -7.604977607727051, -7.158971309661865, -6.71296501159668, -6.266958236694336, -5.820951461791992, -5.374945163726807, -4.928938388824463, -4.482932090759277, -4.036925315856934, -3.590919017791748, -3.1449127197265625, -2.698906183242798, -2.252899646759033, -1.8068931102752686, -1.3608866930007935, -0.9148802757263184, -0.4688737392425537, -0.022867202758789062, 0.4231390953063965, 0.8691456317901611, 1.3151531219482422, 1.7611596584320068, 2.2071661949157715, 2.653172492980957, 3.0991790294647217, 3.5451855659484863, 3.991191864013672, 4.437198638916016, 4.883204936981201, 5.329211235046387, 5.7752180099487305, 6.221224308013916, 6.667230606079102, 7.113237380981445, 7.559243679046631, 8.005249977111816, 8.45125675201416, 8.897263526916504, 9.343269348144531, 9.789276123046875, 10.235282897949219, 10.681289672851562, 11.12729549407959, 11.573302268981934, 12.019308090209961, 12.465314865112305, 12.911320686340332, 13.357327461242676, 13.80333423614502, 14.249340057373047, 14.69534683227539, 15.141353607177734, 15.587360382080078]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 29.0, 247.0, 137867.0, 4054900.0, 725.0, 249.0, 116.0, 56.0, 44.0, 22.0, 10.0, 6.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -6.07220458984375, -4.5780029296875, -3.08380126953125, -1.589599609375, -0.09539794921875, 1.3988037109375, 2.89300537109375, 4.38720703125, 5.88140869140625, 7.3756103515625, 8.86981201171875, 10.364013671875, 11.85821533203125, 13.3524169921875, 14.84661865234375, 16.3408203125, 17.83502197265625, 19.3292236328125, 20.82342529296875, 22.317626953125, 23.81182861328125, 25.3060302734375, 26.80023193359375, 28.29443359375, 29.78863525390625, 31.2828369140625, 32.77703857421875, 34.271240234375, 35.76544189453125, 37.2596435546875, 38.75384521484375, 40.248046875, 41.74224853515625, 43.2364501953125, 44.73065185546875, 46.224853515625, 47.71905517578125, 49.2132568359375, 50.70745849609375, 52.20166015625, 53.69586181640625, 55.1900634765625, 56.68426513671875, 58.178466796875, 59.67266845703125, 61.1668701171875, 62.66107177734375, 64.1552734375, 65.64947509765625, 67.1436767578125, 68.63787841796875, 70.132080078125, 71.62628173828125, 73.1204833984375, 74.61468505859375, 76.10888671875, 77.60308837890625, 79.0972900390625, 80.59149169921875, 82.085693359375, 83.57989501953125, 85.0740966796875, 86.56829833984375, 88.0625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 18.0, 66.0, 170.0, 267.0, 288.0, 131.0, 58.0, 12.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.253173828125, -0.21085739135742188, -0.16854095458984375, -0.12622451782226562, -0.0839080810546875, -0.041591644287109375, 0.00072479248046875, 0.043041229248046875, 0.085357666015625, 0.12767410278320312, 0.16999053955078125, 0.21230697631835938, 0.2546234130859375, 0.2969398498535156, 0.33925628662109375, 0.3815727233886719, 0.42388916015625, 0.4662055969238281, 0.5085220336914062, 0.5508384704589844, 0.5931549072265625, 0.6354713439941406, 0.6777877807617188, 0.7201042175292969, 0.762420654296875, 0.8047370910644531, 0.8470535278320312, 0.8893699645996094, 0.9316864013671875, 0.9740028381347656, 1.0163192749023438, 1.0586357116699219, 1.1009521484375, 1.1432685852050781, 1.1855850219726562, 1.2279014587402344, 1.2702178955078125, 1.3125343322753906, 1.3548507690429688, 1.3971672058105469, 1.439483642578125, 1.4818000793457031, 1.5241165161132812, 1.5664329528808594, 1.6087493896484375, 1.6510658264160156, 1.6933822631835938, 1.7356986999511719, 1.77801513671875, 1.8203315734863281, 1.8626480102539062, 1.9049644470214844, 1.9472808837890625, 1.9895973205566406, 2.0319137573242188, 2.074230194091797, 2.116546630859375, 2.158863067626953, 2.2011795043945312, 2.2434959411621094, 2.2858123779296875, 2.3281288146972656, 2.3704452514648438, 2.412761688232422, 2.455078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 10.0, 5.0, 8.0, 13.0, 17.0, 26.0, 45.0, 41.0, 129.0, 334.0, 2618.0, 163393.0, 4022786.0, 3953.0, 479.0, 165.0, 69.0, 66.0, 45.0, 27.0, 20.0, 18.0, 9.0, 3.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -10.8955078125, -10.259765625, -9.6240234375, -8.98828125, -8.3525390625, -7.716796875, -7.0810546875, -6.4453125, -5.8095703125, -5.173828125, -4.5380859375, -3.90234375, -3.2666015625, -2.630859375, -1.9951171875, -1.359375, -0.7236328125, -0.087890625, 0.5478515625, 1.18359375, 1.8193359375, 2.455078125, 3.0908203125, 3.7265625, 4.3623046875, 4.998046875, 5.6337890625, 6.26953125, 6.9052734375, 7.541015625, 8.1767578125, 8.8125, 9.4482421875, 10.083984375, 10.7197265625, 11.35546875, 11.9912109375, 12.626953125, 13.2626953125, 13.8984375, 14.5341796875, 15.169921875, 15.8056640625, 16.44140625, 17.0771484375, 17.712890625, 18.3486328125, 18.984375, 19.6201171875, 20.255859375, 20.8916015625, 21.52734375, 22.1630859375, 22.798828125, 23.4345703125, 24.0703125, 24.7060546875, 25.341796875, 25.9775390625, 26.61328125, 27.2490234375, 27.884765625, 28.5205078125, 29.15625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 2.0, 17.0, 14.0, 32.0, 48.0, 107.0, 435.0, 2862.0, 406.0, 91.0, 31.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1318359375, -1.0587310791015625, -0.985626220703125, -0.9125213623046875, -0.83941650390625, -0.7663116455078125, -0.693206787109375, -0.6201019287109375, -0.5469970703125, -0.4738922119140625, -0.400787353515625, -0.3276824951171875, -0.25457763671875, -0.1814727783203125, -0.108367919921875, -0.0352630615234375, 0.037841796875, 0.1109466552734375, 0.184051513671875, 0.2571563720703125, 0.33026123046875, 0.4033660888671875, 0.476470947265625, 0.5495758056640625, 0.6226806640625, 0.6957855224609375, 0.768890380859375, 0.8419952392578125, 0.91510009765625, 0.9882049560546875, 1.061309814453125, 1.1344146728515625, 1.20751953125, 1.2806243896484375, 1.353729248046875, 1.4268341064453125, 1.49993896484375, 1.5730438232421875, 1.646148681640625, 1.7192535400390625, 1.7923583984375, 1.8654632568359375, 1.938568115234375, 2.0116729736328125, 2.08477783203125, 2.1578826904296875, 2.230987548828125, 2.3040924072265625, 2.377197265625, 2.4503021240234375, 2.523406982421875, 2.5965118408203125, 2.66961669921875, 2.7427215576171875, 2.815826416015625, 2.8889312744140625, 2.9620361328125, 3.0351409912109375, 3.108245849609375, 3.1813507080078125, 3.25445556640625, 3.3275604248046875, 3.400665283203125, 3.4737701416015625, 3.546875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 26.0, 240.0, 678.0, 58.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.13337326049805, -34.898948669433594, -33.66452407836914, -32.43009948730469, -31.195676803588867, -29.961252212524414, -28.726829528808594, -27.49240493774414, -26.257980346679688, -25.023555755615234, -23.78913116455078, -22.55470848083496, -21.320283889770508, -20.085859298706055, -18.851436614990234, -17.61701202392578, -16.382587432861328, -15.148162841796875, -13.913739204406738, -12.679315567016602, -11.444890975952148, -10.210466384887695, -8.976042747497559, -7.741619110107422, -6.507194519042969, -5.272770404815674, -4.038346290588379, -2.803922176361084, -1.569498062133789, -0.33507394790649414, 0.8993501663208008, 2.1337738037109375, 3.3681983947753906, 4.6026225090026855, 5.8370466232299805, 7.071470737457275, 8.30589485168457, 9.540319442749023, 10.77474308013916, 12.009166717529297, 13.24359130859375, 14.478015899658203, 15.71243953704834, 16.946863174438477, 18.18128776550293, 19.415712356567383, 20.650135040283203, 21.884559631347656, 23.11898422241211, 24.353408813476562, 25.587833404541016, 26.822256088256836, 28.05668067932129, 29.291105270385742, 30.525527954101562, 31.759952545166016, 32.99437713623047, 34.22880172729492, 35.463226318359375, 36.69765090942383, 37.93207550048828, 39.16649627685547, 40.40092086791992, 41.635345458984375, 42.86977005004883]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 28.0, 29.0, 45.0, 63.0, 92.0, 118.0, 111.0, 110.0, 94.0, 80.0, 78.0, 53.0, 33.0, 25.0, 15.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.169807434082031, -13.781947135925293, -13.394086837768555, -13.0062255859375, -12.618365287780762, -12.230504989624023, -11.842644691467285, -11.454784393310547, -11.066923141479492, -10.679062843322754, -10.291202545166016, -9.903341293334961, -9.515480995178223, -9.127620697021484, -8.739760398864746, -8.351900100708008, -7.9640398025512695, -7.576179504394531, -7.188318729400635, -6.8004584312438965, -6.41259765625, -6.024737358093262, -5.636877059936523, -5.249016761779785, -4.861155986785889, -4.47329568862915, -4.085434913635254, -3.6975746154785156, -3.3097140789031982, -2.921853542327881, -2.5339932441711426, -2.146132707595825, -1.7582731246948242, -1.3704125881195068, -0.982552170753479, -0.5946917533874512, -0.2068312168121338, 0.1810293197631836, 0.5688896179199219, 0.9567501544952393, 1.3446106910705566, 1.732471227645874, 2.1203317642211914, 2.5081920623779297, 2.896052598953247, 3.2839131355285645, 3.6717734336853027, 4.059634208679199, 4.4474945068359375, 4.835354804992676, 5.223215579986572, 5.6110758781433105, 5.998936653137207, 6.386796951293945, 6.774657249450684, 7.162517547607422, 7.550378322601318, 7.938238620758057, 8.326099395751953, 8.713959693908691, 9.10181999206543, 9.489681243896484, 9.877540588378906, 10.265401840209961, 10.6532621383667]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 12.0, 12.0, 19.0, 35.0, 43.0, 73.0, 96.0, 212.0, 1008.0, 15516.0, 1003554.0, 26210.0, 1198.0, 254.0, 101.0, 65.0, 33.0, 29.0, 29.0, 19.0, 11.0, 7.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7890625, -13.35205078125, -12.9150390625, -12.47802734375, -12.041015625, -11.60400390625, -11.1669921875, -10.72998046875, -10.29296875, -9.85595703125, -9.4189453125, -8.98193359375, -8.544921875, -8.10791015625, -7.6708984375, -7.23388671875, -6.796875, -6.35986328125, -5.9228515625, -5.48583984375, -5.048828125, -4.61181640625, -4.1748046875, -3.73779296875, -3.30078125, -2.86376953125, -2.4267578125, -1.98974609375, -1.552734375, -1.11572265625, -0.6787109375, -0.24169921875, 0.1953125, 0.63232421875, 1.0693359375, 1.50634765625, 1.943359375, 2.38037109375, 2.8173828125, 3.25439453125, 3.69140625, 4.12841796875, 4.5654296875, 5.00244140625, 5.439453125, 5.87646484375, 6.3134765625, 6.75048828125, 7.1875, 7.62451171875, 8.0615234375, 8.49853515625, 8.935546875, 9.37255859375, 9.8095703125, 10.24658203125, 10.68359375, 11.12060546875, 11.5576171875, 11.99462890625, 12.431640625, 12.86865234375, 13.3056640625, 13.74267578125, 14.1796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 14.0, 42.0, 87.0, 182.0, 230.0, 220.0, 127.0, 65.0, 28.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54345703125, -0.49337005615234375, -0.4432830810546875, -0.39319610595703125, -0.343109130859375, -0.29302215576171875, -0.2429351806640625, -0.19284820556640625, -0.14276123046875, -0.09267425537109375, -0.0425872802734375, 0.00749969482421875, 0.057586669921875, 0.10767364501953125, 0.1577606201171875, 0.20784759521484375, 0.2579345703125, 0.30802154541015625, 0.3581085205078125, 0.40819549560546875, 0.458282470703125, 0.5083694458007812, 0.5584564208984375, 0.6085433959960938, 0.65863037109375, 0.7087173461914062, 0.7588043212890625, 0.8088912963867188, 0.858978271484375, 0.9090652465820312, 0.9591522216796875, 1.0092391967773438, 1.059326171875, 1.1094131469726562, 1.1595001220703125, 1.2095870971679688, 1.259674072265625, 1.3097610473632812, 1.3598480224609375, 1.4099349975585938, 1.46002197265625, 1.5101089477539062, 1.5601959228515625, 1.6102828979492188, 1.660369873046875, 1.7104568481445312, 1.7605438232421875, 1.8106307983398438, 1.8607177734375, 1.9108047485351562, 1.9608917236328125, 2.0109786987304688, 2.061065673828125, 2.1111526489257812, 2.1612396240234375, 2.2113265991210938, 2.26141357421875, 2.3115005493164062, 2.3615875244140625, 2.4116744995117188, 2.461761474609375, 2.5118484497070312, 2.5619354248046875, 2.6120223999023438, 2.662109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 3.0, 11.0, 9.0, 17.0, 24.0, 41.0, 56.0, 116.0, 183.0, 386.0, 965.0, 2885.0, 14662.0, 142984.0, 758246.0, 111268.0, 12388.0, 2614.0, 845.0, 367.0, 212.0, 107.0, 60.0, 24.0, 24.0, 18.0, 8.0, 10.0, 6.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.20233154296875, -4.0687255859375, -3.93511962890625, -3.801513671875, -3.66790771484375, -3.5343017578125, -3.40069580078125, -3.26708984375, -3.13348388671875, -2.9998779296875, -2.86627197265625, -2.732666015625, -2.59906005859375, -2.4654541015625, -2.33184814453125, -2.1982421875, -2.06463623046875, -1.9310302734375, -1.79742431640625, -1.663818359375, -1.53021240234375, -1.3966064453125, -1.26300048828125, -1.12939453125, -0.99578857421875, -0.8621826171875, -0.72857666015625, -0.594970703125, -0.46136474609375, -0.3277587890625, -0.19415283203125, -0.060546875, 0.07305908203125, 0.2066650390625, 0.34027099609375, 0.473876953125, 0.60748291015625, 0.7410888671875, 0.87469482421875, 1.00830078125, 1.14190673828125, 1.2755126953125, 1.40911865234375, 1.542724609375, 1.67633056640625, 1.8099365234375, 1.94354248046875, 2.0771484375, 2.21075439453125, 2.3443603515625, 2.47796630859375, 2.611572265625, 2.74517822265625, 2.8787841796875, 3.01239013671875, 3.14599609375, 3.27960205078125, 3.4132080078125, 3.54681396484375, 3.680419921875, 3.81402587890625, 3.9476318359375, 4.08123779296875, 4.21484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 2.0, 8.0, 4.0, 10.0, 6.0, 13.0, 22.0, 25.0, 22.0, 35.0, 49.0, 46.0, 49.0, 64.0, 64.0, 61.0, 66.0, 67.0, 55.0, 60.0, 48.0, 40.0, 42.0, 30.0, 21.0, 21.0, 24.0, 9.0, 9.0, 12.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.232421875, -2.156463623046875, -2.08050537109375, -2.004547119140625, -1.9285888671875, -1.852630615234375, -1.77667236328125, -1.700714111328125, -1.624755859375, -1.548797607421875, -1.47283935546875, -1.396881103515625, -1.3209228515625, -1.244964599609375, -1.16900634765625, -1.093048095703125, -1.01708984375, -0.941131591796875, -0.86517333984375, -0.789215087890625, -0.7132568359375, -0.637298583984375, -0.56134033203125, -0.485382080078125, -0.409423828125, -0.333465576171875, -0.25750732421875, -0.181549072265625, -0.1055908203125, -0.029632568359375, 0.04632568359375, 0.122283935546875, 0.1982421875, 0.274200439453125, 0.35015869140625, 0.426116943359375, 0.5020751953125, 0.578033447265625, 0.65399169921875, 0.729949951171875, 0.805908203125, 0.881866455078125, 0.95782470703125, 1.033782958984375, 1.1097412109375, 1.185699462890625, 1.26165771484375, 1.337615966796875, 1.41357421875, 1.489532470703125, 1.56549072265625, 1.641448974609375, 1.7174072265625, 1.793365478515625, 1.86932373046875, 1.945281982421875, 2.021240234375, 2.097198486328125, 2.17315673828125, 2.249114990234375, 2.3250732421875, 2.401031494140625, 2.47698974609375, 2.552947998046875, 2.62890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 9.0, 7.0, 7.0, 14.0, 22.0, 35.0, 59.0, 70.0, 189.0, 355.0, 781.0, 2268.0, 10929.0, 123343.0, 809243.0, 89020.0, 8789.0, 2010.0, 666.0, 356.0, 156.0, 76.0, 46.0, 34.0, 24.0, 19.0, 8.0, 4.0, 7.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.813507080078125, -2.71099853515625, -2.608489990234375, -2.5059814453125, -2.403472900390625, -2.30096435546875, -2.198455810546875, -2.095947265625, -1.993438720703125, -1.89093017578125, -1.788421630859375, -1.6859130859375, -1.583404541015625, -1.48089599609375, -1.378387451171875, -1.27587890625, -1.173370361328125, -1.07086181640625, -0.968353271484375, -0.8658447265625, -0.763336181640625, -0.66082763671875, -0.558319091796875, -0.455810546875, -0.353302001953125, -0.25079345703125, -0.148284912109375, -0.0457763671875, 0.056732177734375, 0.15924072265625, 0.261749267578125, 0.3642578125, 0.466766357421875, 0.56927490234375, 0.671783447265625, 0.7742919921875, 0.876800537109375, 0.97930908203125, 1.081817626953125, 1.184326171875, 1.286834716796875, 1.38934326171875, 1.491851806640625, 1.5943603515625, 1.696868896484375, 1.79937744140625, 1.901885986328125, 2.00439453125, 2.106903076171875, 2.20941162109375, 2.311920166015625, 2.4144287109375, 2.516937255859375, 2.61944580078125, 2.721954345703125, 2.824462890625, 2.926971435546875, 3.02947998046875, 3.131988525390625, 3.2344970703125, 3.337005615234375, 3.43951416015625, 3.542022705078125, 3.64453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 5.0, 5.0, 10.0, 5.0, 14.0, 16.0, 20.0, 29.0, 27.0, 29.0, 46.0, 71.0, 80.0, 72.0, 103.0, 88.0, 77.0, 77.0, 33.0, 40.0, 40.0, 27.0, 19.0, 11.0, 9.0, 10.0, 7.0, 4.0, 6.0, 8.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.000247955322265625, -0.0002405904233455658, -0.0002332255244255066, -0.0002258606255054474, -0.00021849572658538818, -0.00021113082766532898, -0.00020376592874526978, -0.00019640102982521057, -0.00018903613090515137, -0.00018167123198509216, -0.00017430633306503296, -0.00016694143414497375, -0.00015957653522491455, -0.00015221163630485535, -0.00014484673738479614, -0.00013748183846473694, -0.00013011693954467773, -0.00012275204062461853, -0.00011538714170455933, -0.00010802224278450012, -0.00010065734386444092, -9.329244494438171e-05, -8.592754602432251e-05, -7.85626471042633e-05, -7.11977481842041e-05, -6.38328492641449e-05, -5.646795034408569e-05, -4.910305142402649e-05, -4.1738152503967285e-05, -3.437325358390808e-05, -2.7008354663848877e-05, -1.9643455743789673e-05, -1.2278556823730469e-05, -4.913657903671265e-06, 2.4512410163879395e-06, 9.816139936447144e-06, 1.7181038856506348e-05, 2.4545937776565552e-05, 3.1910836696624756e-05, 3.927573561668396e-05, 4.6640634536743164e-05, 5.400553345680237e-05, 6.137043237686157e-05, 6.873533129692078e-05, 7.610023021697998e-05, 8.346512913703918e-05, 9.083002805709839e-05, 9.819492697715759e-05, 0.0001055598258972168, 0.000112924724817276, 0.0001202896237373352, 0.0001276545226573944, 0.0001350194215774536, 0.00014238432049751282, 0.00014974921941757202, 0.00015711411833763123, 0.00016447901725769043, 0.00017184391617774963, 0.00017920881509780884, 0.00018657371401786804, 0.00019393861293792725, 0.00020130351185798645, 0.00020866841077804565, 0.00021603330969810486, 0.00022339820861816406]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 5.0, 6.0, 5.0, 8.0, 24.0, 32.0, 37.0, 60.0, 128.0, 203.0, 337.0, 668.0, 1550.0, 4071.0, 15156.0, 110138.0, 676780.0, 206397.0, 23773.0, 5568.0, 1895.0, 831.0, 365.0, 191.0, 130.0, 57.0, 51.0, 33.0, 14.0, 11.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.060546875, -2.97216796875, -2.8837890625, -2.79541015625, -2.70703125, -2.61865234375, -2.5302734375, -2.44189453125, -2.353515625, -2.26513671875, -2.1767578125, -2.08837890625, -2.0, -1.91162109375, -1.8232421875, -1.73486328125, -1.646484375, -1.55810546875, -1.4697265625, -1.38134765625, -1.29296875, -1.20458984375, -1.1162109375, -1.02783203125, -0.939453125, -0.85107421875, -0.7626953125, -0.67431640625, -0.5859375, -0.49755859375, -0.4091796875, -0.32080078125, -0.232421875, -0.14404296875, -0.0556640625, 0.03271484375, 0.12109375, 0.20947265625, 0.2978515625, 0.38623046875, 0.474609375, 0.56298828125, 0.6513671875, 0.73974609375, 0.828125, 0.91650390625, 1.0048828125, 1.09326171875, 1.181640625, 1.27001953125, 1.3583984375, 1.44677734375, 1.53515625, 1.62353515625, 1.7119140625, 1.80029296875, 1.888671875, 1.97705078125, 2.0654296875, 2.15380859375, 2.2421875, 2.33056640625, 2.4189453125, 2.50732421875, 2.595703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 4.0, 2.0, 7.0, 13.0, 12.0, 17.0, 27.0, 47.0, 68.0, 90.0, 117.0, 126.0, 127.0, 90.0, 67.0, 58.0, 39.0, 23.0, 28.0, 11.0, 5.0, 8.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.2172088623046875, -2.155120849609375, -2.0930328369140625, -2.03094482421875, -1.9688568115234375, -1.906768798828125, -1.8446807861328125, -1.7825927734375, -1.7205047607421875, -1.658416748046875, -1.5963287353515625, -1.53424072265625, -1.4721527099609375, -1.410064697265625, -1.3479766845703125, -1.285888671875, -1.2238006591796875, -1.161712646484375, -1.0996246337890625, -1.03753662109375, -0.9754486083984375, -0.913360595703125, -0.8512725830078125, -0.7891845703125, -0.7270965576171875, -0.665008544921875, -0.6029205322265625, -0.54083251953125, -0.4787445068359375, -0.416656494140625, -0.3545684814453125, -0.29248046875, -0.2303924560546875, -0.168304443359375, -0.1062164306640625, -0.04412841796875, 0.0179595947265625, 0.080047607421875, 0.1421356201171875, 0.2042236328125, 0.2663116455078125, 0.328399658203125, 0.3904876708984375, 0.45257568359375, 0.5146636962890625, 0.576751708984375, 0.6388397216796875, 0.700927734375, 0.7630157470703125, 0.825103759765625, 0.8871917724609375, 0.94927978515625, 1.0113677978515625, 1.073455810546875, 1.1355438232421875, 1.1976318359375, 1.2597198486328125, 1.321807861328125, 1.3838958740234375, 1.44598388671875, 1.5080718994140625, 1.570159912109375, 1.6322479248046875, 1.6943359375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 13.0, 43.0, 220.0, 568.0, 143.0, 12.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.64368438720703, -38.83191680908203, -37.02014923095703, -35.20838165283203, -33.39661407470703, -31.5848445892334, -29.7730770111084, -27.961307525634766, -26.149539947509766, -24.337772369384766, -22.526004791259766, -20.714237213134766, -18.902467727661133, -17.090700149536133, -15.278932571411133, -13.467164039611816, -11.655397415161133, -9.843629837036133, -8.031861305236816, -6.220093727111816, -4.408325672149658, -2.5965576171875, -0.7847900390625, 1.0269784927368164, 2.8387460708618164, 4.650514125823975, 6.462282180786133, 8.274049758911133, 10.085817337036133, 11.89758586883545, 13.70935344696045, 15.521121978759766, 17.332889556884766, 19.144657135009766, 20.956424713134766, 22.768192291259766, 24.5799617767334, 26.3917293548584, 28.2034969329834, 30.01526641845703, 31.82703399658203, 33.63880157470703, 35.45056915283203, 37.26233673095703, 39.07410430908203, 40.88587188720703, 42.69763946533203, 44.5094108581543, 46.32117462158203, 48.13294219970703, 49.94470977783203, 51.75647735595703, 53.56824493408203, 55.38001251220703, 57.19178009033203, 59.0035514831543, 60.8153190612793, 62.6270866394043, 64.43885803222656, 66.25062561035156, 68.06239318847656, 69.87416076660156, 71.68592834472656, 73.49769592285156, 75.30946350097656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 15.0, 14.0, 9.0, 15.0, 21.0, 25.0, 35.0, 47.0, 37.0, 53.0, 59.0, 52.0, 64.0, 55.0, 71.0, 52.0, 56.0, 60.0, 46.0, 41.0, 32.0, 33.0, 17.0, 26.0, 14.0, 21.0, 5.0, 6.0, 6.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.43329620361328, -15.91877555847168, -15.404254913330078, -14.889734268188477, -14.375213623046875, -13.860692977905273, -13.346171379089355, -12.831650733947754, -12.317130088806152, -11.80260944366455, -11.28808879852295, -10.773568153381348, -10.25904655456543, -9.744525909423828, -9.230005264282227, -8.715484619140625, -8.200963973999023, -7.686443328857422, -7.17192268371582, -6.6574015617370605, -6.142880916595459, -5.628360271453857, -5.113839149475098, -4.599318504333496, -4.0847978591918945, -3.570277214050293, -3.0557563304901123, -2.5412354469299316, -2.02671480178833, -1.5121941566467285, -0.9976732730865479, -0.4831523895263672, 0.03137016296386719, 0.5458909273147583, 1.0604116916656494, 1.5749324560165405, 2.0894532203674316, 2.603973865509033, 3.118494749069214, 3.6330156326293945, 4.147536277770996, 4.662056922912598, 5.176577568054199, 5.691098690032959, 6.2056193351745605, 6.720139980316162, 7.234661102294922, 7.749181747436523, 8.263702392578125, 8.778223037719727, 9.292743682861328, 9.80726432800293, 10.321784973144531, 10.836305618286133, 11.35082721710205, 11.865347862243652, 12.379868507385254, 12.894389152526855, 13.408909797668457, 13.923430442810059, 14.437952041625977, 14.952472686767578, 15.46699333190918, 15.981513977050781, 16.496034622192383]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 11.0, 27.0, 81.0, 246.0, 999.0, 5623.0, 65910.0, 4027441.0, 84798.0, 6547.0, 1315.0, 425.0, 220.0, 175.0, 108.0, 74.0, 57.0, 37.0, 33.0, 32.0, 22.0, 21.0, 21.0, 13.0, 9.0, 4.0, 11.0, 5.0, 11.0, 4.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -3.810546875, -3.44921875, -3.087890625, -2.7265625, -2.365234375, -2.00390625, -1.642578125, -1.28125, -0.919921875, -0.55859375, -0.197265625, 0.1640625, 0.525390625, 0.88671875, 1.248046875, 1.609375, 1.970703125, 2.33203125, 2.693359375, 3.0546875, 3.416015625, 3.77734375, 4.138671875, 4.5, 4.861328125, 5.22265625, 5.583984375, 5.9453125, 6.306640625, 6.66796875, 7.029296875, 7.390625, 7.751953125, 8.11328125, 8.474609375, 8.8359375, 9.197265625, 9.55859375, 9.919921875, 10.28125, 10.642578125, 11.00390625, 11.365234375, 11.7265625, 12.087890625, 12.44921875, 12.810546875, 13.171875, 13.533203125, 13.89453125, 14.255859375, 14.6171875, 14.978515625, 15.33984375, 15.701171875, 16.0625, 16.423828125, 16.78515625, 17.146484375, 17.5078125, 17.869140625, 18.23046875, 18.591796875, 18.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 23.0, 42.0, 86.0, 126.0, 182.0, 179.0, 144.0, 97.0, 59.0, 28.0, 21.0, 6.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48974609375, -0.44632720947265625, -0.4029083251953125, -0.35948944091796875, -0.316070556640625, -0.27265167236328125, -0.2292327880859375, -0.18581390380859375, -0.14239501953125, -0.09897613525390625, -0.0555572509765625, -0.01213836669921875, 0.031280517578125, 0.07469940185546875, 0.1181182861328125, 0.16153717041015625, 0.2049560546875, 0.24837493896484375, 0.2917938232421875, 0.33521270751953125, 0.378631591796875, 0.42205047607421875, 0.4654693603515625, 0.5088882446289062, 0.55230712890625, 0.5957260131835938, 0.6391448974609375, 0.6825637817382812, 0.725982666015625, 0.7694015502929688, 0.8128204345703125, 0.8562393188476562, 0.899658203125, 0.9430770874023438, 0.9864959716796875, 1.0299148559570312, 1.073333740234375, 1.1167526245117188, 1.1601715087890625, 1.2035903930664062, 1.24700927734375, 1.2904281616210938, 1.3338470458984375, 1.3772659301757812, 1.420684814453125, 1.4641036987304688, 1.5075225830078125, 1.5509414672851562, 1.5943603515625, 1.6377792358398438, 1.6811981201171875, 1.7246170043945312, 1.768035888671875, 1.8114547729492188, 1.8548736572265625, 1.8982925415039062, 1.94171142578125, 1.9851303100585938, 2.0285491943359375, 2.0719680786132812, 2.115386962890625, 2.1588058471679688, 2.2022247314453125, 2.2456436157226562, 2.2890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 8.0, 9.0, 40.0, 55.0, 132.0, 232.0, 518.0, 1172.0, 4051.0, 42645.0, 4007092.0, 127013.0, 7339.0, 2036.0, 942.0, 437.0, 259.0, 129.0, 70.0, 45.0, 19.0, 12.0, 4.0, 1.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.85003662109375, -4.5399169921875, -4.22979736328125, -3.919677734375, -3.60955810546875, -3.2994384765625, -2.98931884765625, -2.67919921875, -2.36907958984375, -2.0589599609375, -1.74884033203125, -1.438720703125, -1.12860107421875, -0.8184814453125, -0.50836181640625, -0.1982421875, 0.11187744140625, 0.4219970703125, 0.73211669921875, 1.042236328125, 1.35235595703125, 1.6624755859375, 1.97259521484375, 2.28271484375, 2.59283447265625, 2.9029541015625, 3.21307373046875, 3.523193359375, 3.83331298828125, 4.1434326171875, 4.45355224609375, 4.763671875, 5.07379150390625, 5.3839111328125, 5.69403076171875, 6.004150390625, 6.31427001953125, 6.6243896484375, 6.93450927734375, 7.24462890625, 7.55474853515625, 7.8648681640625, 8.17498779296875, 8.485107421875, 8.79522705078125, 9.1053466796875, 9.41546630859375, 9.7255859375, 10.03570556640625, 10.3458251953125, 10.65594482421875, 10.966064453125, 11.27618408203125, 11.5863037109375, 11.89642333984375, 12.20654296875, 12.51666259765625, 12.8267822265625, 13.13690185546875, 13.447021484375, 13.75714111328125, 14.0672607421875, 14.37738037109375, 14.6875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 11.0, 12.0, 19.0, 38.0, 59.0, 101.0, 231.0, 858.0, 1950.0, 415.0, 185.0, 84.0, 34.0, 21.0, 17.0, 8.0, 7.0, 7.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0654296875, -1.017578125, -0.9697265625, -0.921875, -0.8740234375, -0.826171875, -0.7783203125, -0.73046875, -0.6826171875, -0.634765625, -0.5869140625, -0.5390625, -0.4912109375, -0.443359375, -0.3955078125, -0.34765625, -0.2998046875, -0.251953125, -0.2041015625, -0.15625, -0.1083984375, -0.060546875, -0.0126953125, 0.03515625, 0.0830078125, 0.130859375, 0.1787109375, 0.2265625, 0.2744140625, 0.322265625, 0.3701171875, 0.41796875, 0.4658203125, 0.513671875, 0.5615234375, 0.609375, 0.6572265625, 0.705078125, 0.7529296875, 0.80078125, 0.8486328125, 0.896484375, 0.9443359375, 0.9921875, 1.0400390625, 1.087890625, 1.1357421875, 1.18359375, 1.2314453125, 1.279296875, 1.3271484375, 1.375, 1.4228515625, 1.470703125, 1.5185546875, 1.56640625, 1.6142578125, 1.662109375, 1.7099609375, 1.7578125, 1.8056640625, 1.853515625, 1.9013671875, 1.94921875, 1.9970703125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 25.0, 80.0, 295.0, 394.0, 143.0, 53.0, 10.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.582685470581055, -18.004316329956055, -17.425945281982422, -16.847576141357422, -16.269207000732422, -15.690835952758789, -15.112466812133789, -14.534096717834473, -13.955726623535156, -13.37735652923584, -12.798986434936523, -12.220617294311523, -11.642247200012207, -11.06387710571289, -10.48550796508789, -9.907137870788574, -9.328767776489258, -8.750397682189941, -8.172027587890625, -7.593658447265625, -7.015288352966309, -6.436918258666992, -5.858548641204834, -5.280179023742676, -4.701808929443359, -4.123438835144043, -3.5450692176818848, -2.9666993618011475, -2.38832950592041, -1.8099596500396729, -1.2315897941589355, -0.6532201766967773, -0.07484817504882812, 0.5035216808319092, 1.0818915367126465, 1.6602613925933838, 2.238631248474121, 2.8170011043548584, 3.3953709602355957, 3.973740577697754, 4.55211067199707, 5.130480766296387, 5.708850383758545, 6.287220001220703, 6.8655900955200195, 7.443960189819336, 8.022329330444336, 8.600699424743652, 9.179069519042969, 9.757439613342285, 10.335809707641602, 10.914178848266602, 11.492548942565918, 12.070919036865234, 12.649288177490234, 13.22765827178955, 13.806028366088867, 14.384398460388184, 14.9627685546875, 15.5411376953125, 16.1195068359375, 16.697877883911133, 17.276247024536133, 17.854618072509766, 18.432987213134766]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 7.0, 13.0, 25.0, 28.0, 34.0, 53.0, 63.0, 72.0, 91.0, 107.0, 94.0, 115.0, 83.0, 72.0, 37.0, 40.0, 25.0, 19.0, 8.0, 4.0, 6.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.906780242919922, -8.629692077636719, -8.352603912353516, -8.075515747070312, -7.798427581787109, -7.521339416503906, -7.244251251220703, -6.9671630859375, -6.690074920654297, -6.412986755371094, -6.135898590087891, -5.8588104248046875, -5.581722259521484, -5.304634094238281, -5.027545928955078, -4.750457763671875, -4.473369121551514, -4.1962809562683105, -3.9191927909851074, -3.6421046257019043, -3.365016460418701, -3.087928295135498, -2.810839891433716, -2.5337517261505127, -2.2566635608673096, -1.9795753955841064, -1.7024872303009033, -1.4253989458084106, -1.1483107805252075, -0.8712226152420044, -0.5941343307495117, -0.3170461654663086, -0.03995800018310547, 0.23713019490242004, 0.5142183899879456, 0.7913066148757935, 1.0683947801589966, 1.3454829454421997, 1.6225712299346924, 1.8996593952178955, 2.1767475605010986, 2.4538357257843018, 2.730923891067505, 3.008012294769287, 3.2851004600524902, 3.5621886253356934, 3.8392767906188965, 4.1163649559021, 4.393453121185303, 4.670541286468506, 4.947629451751709, 5.224717617034912, 5.501805782318115, 5.778893947601318, 6.05598258972168, 6.333070755004883, 6.610158920288086, 6.887247085571289, 7.164335250854492, 7.441423416137695, 7.718511581420898, 7.995599746704102, 8.272687911987305, 8.549776077270508, 8.826864242553711]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 2.0, 12.0, 8.0, 13.0, 21.0, 10.0, 23.0, 18.0, 30.0, 46.0, 57.0, 76.0, 135.0, 332.0, 850.0, 3609.0, 30317.0, 565778.0, 419784.0, 22915.0, 3063.0, 780.0, 258.0, 120.0, 82.0, 44.0, 37.0, 41.0, 23.0, 18.0, 10.0, 8.0, 11.0, 7.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.55267333984375, -6.3475341796875, -6.14239501953125, -5.937255859375, -5.73211669921875, -5.5269775390625, -5.32183837890625, -5.11669921875, -4.91156005859375, -4.7064208984375, -4.50128173828125, -4.296142578125, -4.09100341796875, -3.8858642578125, -3.68072509765625, -3.4755859375, -3.27044677734375, -3.0653076171875, -2.86016845703125, -2.655029296875, -2.44989013671875, -2.2447509765625, -2.03961181640625, -1.83447265625, -1.62933349609375, -1.4241943359375, -1.21905517578125, -1.013916015625, -0.80877685546875, -0.6036376953125, -0.39849853515625, -0.193359375, 0.01177978515625, 0.2169189453125, 0.42205810546875, 0.627197265625, 0.83233642578125, 1.0374755859375, 1.24261474609375, 1.44775390625, 1.65289306640625, 1.8580322265625, 2.06317138671875, 2.268310546875, 2.47344970703125, 2.6785888671875, 2.88372802734375, 3.0888671875, 3.29400634765625, 3.4991455078125, 3.70428466796875, 3.909423828125, 4.11456298828125, 4.3197021484375, 4.52484130859375, 4.72998046875, 4.93511962890625, 5.1402587890625, 5.34539794921875, 5.550537109375, 5.75567626953125, 5.9608154296875, 6.16595458984375, 6.37109375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 24.0, 32.0, 54.0, 96.0, 122.0, 177.0, 153.0, 131.0, 89.0, 52.0, 32.0, 20.0, 10.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6312255859375, -0.582763671875, -0.5343017578125, -0.48583984375, -0.4373779296875, -0.388916015625, -0.3404541015625, -0.2919921875, -0.2435302734375, -0.195068359375, -0.1466064453125, -0.09814453125, -0.0496826171875, -0.001220703125, 0.0472412109375, 0.095703125, 0.1441650390625, 0.192626953125, 0.2410888671875, 0.28955078125, 0.3380126953125, 0.386474609375, 0.4349365234375, 0.4833984375, 0.5318603515625, 0.580322265625, 0.6287841796875, 0.67724609375, 0.7257080078125, 0.774169921875, 0.8226318359375, 0.87109375, 0.9195556640625, 0.968017578125, 1.0164794921875, 1.06494140625, 1.1134033203125, 1.161865234375, 1.2103271484375, 1.2587890625, 1.3072509765625, 1.355712890625, 1.4041748046875, 1.45263671875, 1.5010986328125, 1.549560546875, 1.5980224609375, 1.646484375, 1.6949462890625, 1.743408203125, 1.7918701171875, 1.84033203125, 1.8887939453125, 1.937255859375, 1.9857177734375, 2.0341796875, 2.0826416015625, 2.131103515625, 2.1795654296875, 2.22802734375, 2.2764892578125, 2.324951171875, 2.3734130859375, 2.421875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 6.0, 10.0, 11.0, 11.0, 24.0, 22.0, 48.0, 64.0, 99.0, 154.0, 207.0, 335.0, 582.0, 1140.0, 2543.0, 6684.0, 21855.0, 84286.0, 346984.0, 428122.0, 112703.0, 28285.0, 8377.0, 2935.0, 1345.0, 619.0, 405.0, 233.0, 136.0, 109.0, 49.0, 42.0, 31.0, 29.0, 18.0, 17.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.87890625, -2.799163818359375, -2.71942138671875, -2.639678955078125, -2.5599365234375, -2.480194091796875, -2.40045166015625, -2.320709228515625, -2.240966796875, -2.161224365234375, -2.08148193359375, -2.001739501953125, -1.9219970703125, -1.842254638671875, -1.76251220703125, -1.682769775390625, -1.60302734375, -1.523284912109375, -1.44354248046875, -1.363800048828125, -1.2840576171875, -1.204315185546875, -1.12457275390625, -1.044830322265625, -0.965087890625, -0.885345458984375, -0.80560302734375, -0.725860595703125, -0.6461181640625, -0.566375732421875, -0.48663330078125, -0.406890869140625, -0.3271484375, -0.247406005859375, -0.16766357421875, -0.087921142578125, -0.0081787109375, 0.071563720703125, 0.15130615234375, 0.231048583984375, 0.310791015625, 0.390533447265625, 0.47027587890625, 0.550018310546875, 0.6297607421875, 0.709503173828125, 0.78924560546875, 0.868988037109375, 0.94873046875, 1.028472900390625, 1.10821533203125, 1.187957763671875, 1.2677001953125, 1.347442626953125, 1.42718505859375, 1.506927490234375, 1.586669921875, 1.666412353515625, 1.74615478515625, 1.825897216796875, 1.9056396484375, 1.985382080078125, 2.06512451171875, 2.144866943359375, 2.224609375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 13.0, 7.0, 6.0, 12.0, 10.0, 22.0, 16.0, 27.0, 25.0, 26.0, 44.0, 37.0, 37.0, 32.0, 50.0, 51.0, 60.0, 45.0, 56.0, 42.0, 48.0, 37.0, 36.0, 43.0, 30.0, 30.0, 23.0, 27.0, 18.0, 23.0, 15.0, 8.0, 12.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.683685302734375, -2.60174560546875, -2.519805908203125, -2.4378662109375, -2.355926513671875, -2.27398681640625, -2.192047119140625, -2.110107421875, -2.028167724609375, -1.94622802734375, -1.864288330078125, -1.7823486328125, -1.700408935546875, -1.61846923828125, -1.536529541015625, -1.45458984375, -1.372650146484375, -1.29071044921875, -1.208770751953125, -1.1268310546875, -1.044891357421875, -0.96295166015625, -0.881011962890625, -0.799072265625, -0.717132568359375, -0.63519287109375, -0.553253173828125, -0.4713134765625, -0.389373779296875, -0.30743408203125, -0.225494384765625, -0.1435546875, -0.061614990234375, 0.02032470703125, 0.102264404296875, 0.1842041015625, 0.266143798828125, 0.34808349609375, 0.430023193359375, 0.511962890625, 0.593902587890625, 0.67584228515625, 0.757781982421875, 0.8397216796875, 0.921661376953125, 1.00360107421875, 1.085540771484375, 1.16748046875, 1.249420166015625, 1.33135986328125, 1.413299560546875, 1.4952392578125, 1.577178955078125, 1.65911865234375, 1.741058349609375, 1.822998046875, 1.904937744140625, 1.98687744140625, 2.068817138671875, 2.1507568359375, 2.232696533203125, 2.31463623046875, 2.396575927734375, 2.478515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 7.0, 10.0, 5.0, 18.0, 21.0, 40.0, 58.0, 106.0, 247.0, 519.0, 1223.0, 3609.0, 12800.0, 66383.0, 525261.0, 377265.0, 46476.0, 9764.0, 2864.0, 1042.0, 396.0, 216.0, 87.0, 62.0, 25.0, 15.0, 12.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9057464599609375, -1.839813232421875, -1.7738800048828125, -1.70794677734375, -1.6420135498046875, -1.576080322265625, -1.5101470947265625, -1.4442138671875, -1.3782806396484375, -1.312347412109375, -1.2464141845703125, -1.18048095703125, -1.1145477294921875, -1.048614501953125, -0.9826812744140625, -0.916748046875, -0.8508148193359375, -0.784881591796875, -0.7189483642578125, -0.65301513671875, -0.5870819091796875, -0.521148681640625, -0.4552154541015625, -0.3892822265625, -0.3233489990234375, -0.257415771484375, -0.1914825439453125, -0.12554931640625, -0.0596160888671875, 0.006317138671875, 0.0722503662109375, 0.13818359375, 0.2041168212890625, 0.270050048828125, 0.3359832763671875, 0.40191650390625, 0.4678497314453125, 0.533782958984375, 0.5997161865234375, 0.6656494140625, 0.7315826416015625, 0.797515869140625, 0.8634490966796875, 0.92938232421875, 0.9953155517578125, 1.061248779296875, 1.1271820068359375, 1.193115234375, 1.2590484619140625, 1.324981689453125, 1.3909149169921875, 1.45684814453125, 1.5227813720703125, 1.588714599609375, 1.6546478271484375, 1.7205810546875, 1.7865142822265625, 1.852447509765625, 1.9183807373046875, 1.98431396484375, 2.0502471923828125, 2.116180419921875, 2.1821136474609375, 2.248046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 0.0, 2.0, 5.0, 7.0, 8.0, 7.0, 4.0, 3.0, 18.0, 18.0, 33.0, 16.0, 55.0, 56.0, 56.0, 85.0, 109.0, 114.0, 110.0, 63.0, 51.0, 43.0, 32.0, 26.0, 15.0, 16.0, 9.0, 5.0, 9.0, 7.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000244140625, -0.00023512914776802063, -0.00022611767053604126, -0.0002171061933040619, -0.00020809471607208252, -0.00019908323884010315, -0.00019007176160812378, -0.0001810602843761444, -0.00017204880714416504, -0.00016303732991218567, -0.0001540258526802063, -0.00014501437544822693, -0.00013600289821624756, -0.0001269914209842682, -0.00011797994375228882, -0.00010896846652030945, -9.995698928833008e-05, -9.094551205635071e-05, -8.193403482437134e-05, -7.292255759239197e-05, -6.39110803604126e-05, -5.489960312843323e-05, -4.588812589645386e-05, -3.687664866447449e-05, -2.7865171432495117e-05, -1.8853694200515747e-05, -9.842216968536377e-06, -8.307397365570068e-07, 8.180737495422363e-06, 1.7192214727401733e-05, 2.6203691959381104e-05, 3.5215169191360474e-05, 4.4226646423339844e-05, 5.3238123655319214e-05, 6.224960088729858e-05, 7.126107811927795e-05, 8.027255535125732e-05, 8.92840325832367e-05, 9.829550981521606e-05, 0.00010730698704719543, 0.0001163184642791748, 0.00012532994151115417, 0.00013434141874313354, 0.00014335289597511292, 0.00015236437320709229, 0.00016137585043907166, 0.00017038732767105103, 0.0001793988049030304, 0.00018841028213500977, 0.00019742175936698914, 0.0002064332365989685, 0.00021544471383094788, 0.00022445619106292725, 0.00023346766829490662, 0.00024247914552688599, 0.00025149062275886536, 0.0002605020999908447, 0.0002695135772228241, 0.00027852505445480347, 0.00028753653168678284, 0.0002965480089187622, 0.0003055594861507416, 0.00031457096338272095, 0.0003235824406147003, 0.0003325939178466797]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 5.0, 10.0, 15.0, 20.0, 30.0, 35.0, 49.0, 73.0, 119.0, 186.0, 275.0, 486.0, 864.0, 1358.0, 2789.0, 5662.0, 12534.0, 32708.0, 105233.0, 360379.0, 362484.0, 105699.0, 33084.0, 12601.0, 5496.0, 2723.0, 1446.0, 825.0, 475.0, 278.0, 185.0, 132.0, 91.0, 60.0, 37.0, 26.0, 17.0, 16.0, 10.0, 7.0, 6.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.416015625, -1.37310791015625, -1.3302001953125, -1.28729248046875, -1.244384765625, -1.20147705078125, -1.1585693359375, -1.11566162109375, -1.07275390625, -1.02984619140625, -0.9869384765625, -0.94403076171875, -0.901123046875, -0.85821533203125, -0.8153076171875, -0.77239990234375, -0.7294921875, -0.68658447265625, -0.6436767578125, -0.60076904296875, -0.557861328125, -0.51495361328125, -0.4720458984375, -0.42913818359375, -0.38623046875, -0.34332275390625, -0.3004150390625, -0.25750732421875, -0.214599609375, -0.17169189453125, -0.1287841796875, -0.08587646484375, -0.04296875, -6.103515625e-05, 0.0428466796875, 0.08575439453125, 0.128662109375, 0.17156982421875, 0.2144775390625, 0.25738525390625, 0.30029296875, 0.34320068359375, 0.3861083984375, 0.42901611328125, 0.471923828125, 0.51483154296875, 0.5577392578125, 0.60064697265625, 0.6435546875, 0.68646240234375, 0.7293701171875, 0.77227783203125, 0.815185546875, 0.85809326171875, 0.9010009765625, 0.94390869140625, 0.98681640625, 1.02972412109375, 1.0726318359375, 1.11553955078125, 1.158447265625, 1.20135498046875, 1.2442626953125, 1.28717041015625, 1.330078125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 7.0, 1.0, 7.0, 6.0, 11.0, 10.0, 19.0, 20.0, 34.0, 37.0, 62.0, 71.0, 87.0, 95.0, 95.0, 86.0, 80.0, 77.0, 61.0, 38.0, 26.0, 12.0, 22.0, 14.0, 5.0, 9.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8505859375, -1.8010711669921875, -1.751556396484375, -1.7020416259765625, -1.65252685546875, -1.6030120849609375, -1.553497314453125, -1.5039825439453125, -1.4544677734375, -1.4049530029296875, -1.355438232421875, -1.3059234619140625, -1.25640869140625, -1.2068939208984375, -1.157379150390625, -1.1078643798828125, -1.058349609375, -1.0088348388671875, -0.959320068359375, -0.9098052978515625, -0.86029052734375, -0.8107757568359375, -0.761260986328125, -0.7117462158203125, -0.6622314453125, -0.6127166748046875, -0.563201904296875, -0.5136871337890625, -0.46417236328125, -0.4146575927734375, -0.365142822265625, -0.3156280517578125, -0.26611328125, -0.2165985107421875, -0.167083740234375, -0.1175689697265625, -0.06805419921875, -0.0185394287109375, 0.030975341796875, 0.0804901123046875, 0.1300048828125, 0.1795196533203125, 0.229034423828125, 0.2785491943359375, 0.32806396484375, 0.3775787353515625, 0.427093505859375, 0.4766082763671875, 0.526123046875, 0.5756378173828125, 0.625152587890625, 0.6746673583984375, 0.72418212890625, 0.7736968994140625, 0.823211669921875, 0.8727264404296875, 0.9222412109375, 0.9717559814453125, 1.021270751953125, 1.0707855224609375, 1.12030029296875, 1.1698150634765625, 1.219329833984375, 1.2688446044921875, 1.318359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 12.0, 22.0, 70.0, 134.0, 238.0, 264.0, 162.0, 60.0, 14.0, 17.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28567886352539, -12.278127670288086, -11.270576477050781, -10.263026237487793, -9.255475044250488, -8.247923851013184, -7.240373134613037, -6.232822418212891, -5.225271224975586, -4.217720031738281, -3.2101693153381348, -2.202618360519409, -1.1950674057006836, -0.1875162124633789, 0.8200345039367676, 1.827585220336914, 2.8351364135742188, 3.8426873683929443, 4.85023832321167, 5.857789039611816, 6.865340232849121, 7.872891426086426, 8.880441665649414, 9.887992858886719, 10.895544052124023, 11.903095245361328, 12.910646438598633, 13.918196678161621, 14.925747871398926, 15.93329906463623, 16.94084930419922, 17.948400497436523, 18.955955505371094, 19.9635066986084, 20.971057891845703, 21.978609085083008, 22.986160278320312, 23.993709564208984, 25.00126075744629, 26.008811950683594, 27.0163631439209, 28.023914337158203, 29.031465530395508, 30.039016723632812, 31.046566009521484, 32.05411911010742, 33.061668395996094, 34.06922149658203, 35.0767707824707, 36.084320068359375, 37.09187316894531, 38.099422454833984, 39.10697555541992, 40.114524841308594, 41.12207794189453, 42.1296272277832, 43.137176513671875, 44.14472579956055, 45.152278900146484, 46.159828186035156, 47.167381286621094, 48.174930572509766, 49.1824836730957, 50.190032958984375, 51.19758605957031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 9.0, 5.0, 6.0, 10.0, 10.0, 12.0, 8.0, 24.0, 23.0, 26.0, 36.0, 15.0, 29.0, 39.0, 42.0, 44.0, 44.0, 44.0, 47.0, 45.0, 40.0, 46.0, 56.0, 47.0, 36.0, 28.0, 41.0, 27.0, 32.0, 20.0, 26.0, 21.0, 14.0, 9.0, 7.0, 8.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.903984069824219, -15.421110153198242, -14.938237190246582, -14.455364227294922, -13.972490310668945, -13.489616394042969, -13.006743431091309, -12.523870468139648, -12.040996551513672, -11.558122634887695, -11.075249671936035, -10.592376708984375, -10.109502792358398, -9.626628875732422, -9.143755912780762, -8.660882949829102, -8.178009033203125, -7.695135593414307, -7.212262153625488, -6.72938871383667, -6.246515274047852, -5.763641834259033, -5.280768394470215, -4.7978949546813965, -4.315021514892578, -3.8321480751037598, -3.3492746353149414, -2.866401195526123, -2.3835277557373047, -1.9006543159484863, -1.417780876159668, -0.9349074363708496, -0.45203304290771484, 0.030840396881103516, 0.5137138366699219, 0.9965872764587402, 1.4794607162475586, 1.962334156036377, 2.4452075958251953, 2.9280810356140137, 3.410954475402832, 3.8938279151916504, 4.376701354980469, 4.859574794769287, 5.3424482345581055, 5.825321674346924, 6.308195114135742, 6.7910685539245605, 7.273941993713379, 7.756815433502197, 8.239688873291016, 8.722562789916992, 9.205435752868652, 9.688308715820312, 10.171182632446289, 10.654056549072266, 11.136929512023926, 11.619802474975586, 12.102676391601562, 12.585550308227539, 13.0684232711792, 13.55129623413086, 14.034170150756836, 14.517044067382812, 14.999917030334473]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 27.0, 58.0, 143.0, 315.0, 1066.0, 5346.0, 60705.0, 4056786.0, 62064.0, 5250.0, 1311.0, 496.0, 237.0, 122.0, 89.0, 73.0, 35.0, 31.0, 24.0, 21.0, 14.0, 13.0, 7.0, 8.0, 7.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.67144775390625, -3.3780517578125, -3.08465576171875, -2.791259765625, -2.49786376953125, -2.2044677734375, -1.91107177734375, -1.61767578125, -1.32427978515625, -1.0308837890625, -0.73748779296875, -0.444091796875, -0.15069580078125, 0.1427001953125, 0.43609619140625, 0.7294921875, 1.02288818359375, 1.3162841796875, 1.60968017578125, 1.903076171875, 2.19647216796875, 2.4898681640625, 2.78326416015625, 3.07666015625, 3.37005615234375, 3.6634521484375, 3.95684814453125, 4.250244140625, 4.54364013671875, 4.8370361328125, 5.13043212890625, 5.423828125, 5.71722412109375, 6.0106201171875, 6.30401611328125, 6.597412109375, 6.89080810546875, 7.1842041015625, 7.47760009765625, 7.77099609375, 8.06439208984375, 8.3577880859375, 8.65118408203125, 8.944580078125, 9.23797607421875, 9.5313720703125, 9.82476806640625, 10.1181640625, 10.41156005859375, 10.7049560546875, 10.99835205078125, 11.291748046875, 11.58514404296875, 11.8785400390625, 12.17193603515625, 12.46533203125, 12.75872802734375, 13.0521240234375, 13.34552001953125, 13.638916015625, 13.93231201171875, 14.2257080078125, 14.51910400390625, 14.8125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 21.0, 28.0, 76.0, 84.0, 117.0, 167.0, 159.0, 121.0, 93.0, 67.0, 42.0, 11.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6365432739257812, -0.5841217041015625, -0.5317001342773438, -0.479278564453125, -0.42685699462890625, -0.3744354248046875, -0.32201385498046875, -0.26959228515625, -0.21717071533203125, -0.1647491455078125, -0.11232757568359375, -0.059906005859375, -0.00748443603515625, 0.0449371337890625, 0.09735870361328125, 0.1497802734375, 0.20220184326171875, 0.2546234130859375, 0.30704498291015625, 0.359466552734375, 0.41188812255859375, 0.4643096923828125, 0.5167312622070312, 0.56915283203125, 0.6215744018554688, 0.6739959716796875, 0.7264175415039062, 0.778839111328125, 0.8312606811523438, 0.8836822509765625, 0.9361038208007812, 0.988525390625, 1.0409469604492188, 1.0933685302734375, 1.1457901000976562, 1.198211669921875, 1.2506332397460938, 1.3030548095703125, 1.3554763793945312, 1.40789794921875, 1.4603195190429688, 1.5127410888671875, 1.5651626586914062, 1.617584228515625, 1.6700057983398438, 1.7224273681640625, 1.7748489379882812, 1.8272705078125, 1.8796920776367188, 1.9321136474609375, 1.9845352172851562, 2.036956787109375, 2.0893783569335938, 2.1417999267578125, 2.1942214965820312, 2.24664306640625, 2.2990646362304688, 2.3514862060546875, 2.4039077758789062, 2.456329345703125, 2.5087509155273438, 2.5611724853515625, 2.6135940551757812, 2.666015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 10.0, 11.0, 10.0, 14.0, 43.0, 69.0, 82.0, 172.0, 343.0, 658.0, 1790.0, 6547.0, 49840.0, 3853677.0, 259527.0, 16162.0, 3211.0, 1021.0, 466.0, 234.0, 139.0, 96.0, 61.0, 28.0, 26.0, 15.0, 18.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19140625, -6.94964599609375, -6.7078857421875, -6.46612548828125, -6.224365234375, -5.98260498046875, -5.7408447265625, -5.49908447265625, -5.25732421875, -5.01556396484375, -4.7738037109375, -4.53204345703125, -4.290283203125, -4.04852294921875, -3.8067626953125, -3.56500244140625, -3.3232421875, -3.08148193359375, -2.8397216796875, -2.59796142578125, -2.356201171875, -2.11444091796875, -1.8726806640625, -1.63092041015625, -1.38916015625, -1.14739990234375, -0.9056396484375, -0.66387939453125, -0.422119140625, -0.18035888671875, 0.0614013671875, 0.30316162109375, 0.544921875, 0.78668212890625, 1.0284423828125, 1.27020263671875, 1.511962890625, 1.75372314453125, 1.9954833984375, 2.23724365234375, 2.47900390625, 2.72076416015625, 2.9625244140625, 3.20428466796875, 3.446044921875, 3.68780517578125, 3.9295654296875, 4.17132568359375, 4.4130859375, 4.65484619140625, 4.8966064453125, 5.13836669921875, 5.380126953125, 5.62188720703125, 5.8636474609375, 6.10540771484375, 6.34716796875, 6.58892822265625, 6.8306884765625, 7.07244873046875, 7.314208984375, 7.55596923828125, 7.7977294921875, 8.03948974609375, 8.28125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 10.0, 16.0, 27.0, 50.0, 77.0, 193.0, 522.0, 2266.0, 552.0, 175.0, 66.0, 26.0, 28.0, 25.0, 8.0, 5.0, 6.0, 5.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5693359375, -1.5142822265625, -1.459228515625, -1.4041748046875, -1.34912109375, -1.2940673828125, -1.239013671875, -1.1839599609375, -1.12890625, -1.0738525390625, -1.018798828125, -0.9637451171875, -0.90869140625, -0.8536376953125, -0.798583984375, -0.7435302734375, -0.6884765625, -0.6334228515625, -0.578369140625, -0.5233154296875, -0.46826171875, -0.4132080078125, -0.358154296875, -0.3031005859375, -0.248046875, -0.1929931640625, -0.137939453125, -0.0828857421875, -0.02783203125, 0.0272216796875, 0.082275390625, 0.1373291015625, 0.1923828125, 0.2474365234375, 0.302490234375, 0.3575439453125, 0.41259765625, 0.4676513671875, 0.522705078125, 0.5777587890625, 0.6328125, 0.6878662109375, 0.742919921875, 0.7979736328125, 0.85302734375, 0.9080810546875, 0.963134765625, 1.0181884765625, 1.0732421875, 1.1282958984375, 1.183349609375, 1.2384033203125, 1.29345703125, 1.3485107421875, 1.403564453125, 1.4586181640625, 1.513671875, 1.5687255859375, 1.623779296875, 1.6788330078125, 1.73388671875, 1.7889404296875, 1.843994140625, 1.8990478515625, 1.9541015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 15.0, 18.0, 49.0, 93.0, 136.0, 168.0, 200.0, 141.0, 79.0, 46.0, 23.0, 7.0, 12.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.040183067321777, -8.766946792602539, -8.4937105178833, -8.220475196838379, -7.947238922119141, -7.674002647399902, -7.400766372680664, -7.127530097961426, -6.854294300079346, -6.581058025360107, -6.307822227478027, -6.034585952758789, -5.761349678039551, -5.488113880157471, -5.214877605438232, -4.941641807556152, -4.668405532836914, -4.395169258117676, -4.121933460235596, -3.8486971855163574, -3.5754611492156982, -3.302225112915039, -3.028988838195801, -2.7557528018951416, -2.4825167655944824, -2.2092807292938232, -1.9360445737838745, -1.6628084182739258, -1.3895723819732666, -1.1163363456726074, -0.8431001901626587, -0.56986403465271, -0.2966270446777344, -0.02339094877243042, 0.24984514713287354, 0.5230812430381775, 0.7963173389434814, 1.0695533752441406, 1.3427895307540894, 1.616025686264038, 1.8892617225646973, 2.1624977588653564, 2.4357337951660156, 2.708970069885254, 2.982206106185913, 3.2554421424865723, 3.5286784172058105, 3.8019144535064697, 4.075150489807129, 4.348386764526367, 4.621622562408447, 4.8948588371276855, 5.168094635009766, 5.441330909729004, 5.714567184448242, 5.9878034591674805, 6.2610392570495605, 6.534275531768799, 6.807511329650879, 7.080747604370117, 7.3539838790893555, 7.6272196769714355, 7.900455951690674, 8.173691749572754, 8.446928024291992]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 9.0, 10.0, 9.0, 9.0, 13.0, 31.0, 30.0, 44.0, 53.0, 49.0, 44.0, 72.0, 55.0, 65.0, 63.0, 56.0, 63.0, 50.0, 44.0, 31.0, 31.0, 40.0, 31.0, 23.0, 15.0, 15.0, 15.0, 4.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.088855266571045, -3.9363560676574707, -3.7838568687438965, -3.6313576698303223, -3.478858709335327, -3.326359510421753, -3.1738603115081787, -3.0213613510131836, -2.8688621520996094, -2.716362953186035, -2.563863754272461, -2.4113645553588867, -2.2588655948638916, -2.1063663959503174, -1.9538671970367432, -1.8013681173324585, -1.6488687992095947, -1.4963696002960205, -1.3438705205917358, -1.1913713216781616, -1.038872241973877, -0.8863730430603027, -0.7338738441467285, -0.5813747644424438, -0.42887556552886963, -0.2763764262199402, -0.12387725710868835, 0.028621912002563477, 0.18112105131149292, 0.33362019062042236, 0.4861193895339966, 0.6386184692382812, 0.7911176681518555, 0.9436168074607849, 1.0961159467697144, 1.2486151456832886, 1.4011142253875732, 1.5536134243011475, 1.7061126232147217, 1.8586117029190063, 2.011110782623291, 2.1636099815368652, 2.3161091804504395, 2.4686083793640137, 2.621107339859009, 2.773606538772583, 2.9261057376861572, 3.0786046981811523, 3.2311041355133057, 3.38360333442688, 3.536102533340454, 3.688601493835449, 3.8411006927490234, 3.9935998916625977, 4.146099090576172, 4.298598289489746, 4.45109748840332, 4.6035966873168945, 4.756095886230469, 4.908595085144043, 5.061094284057617, 5.213593482971191, 5.366092681884766, 5.518591403961182, 5.671090602874756]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 6.0, 8.0, 10.0, 16.0, 24.0, 28.0, 26.0, 51.0, 83.0, 145.0, 330.0, 755.0, 2197.0, 9832.0, 99282.0, 750103.0, 166919.0, 14320.0, 2698.0, 861.0, 359.0, 177.0, 95.0, 62.0, 49.0, 27.0, 27.0, 8.0, 13.0, 6.0, 9.0, 4.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.12109375, -5.94415283203125, -5.7672119140625, -5.59027099609375, -5.413330078125, -5.23638916015625, -5.0594482421875, -4.88250732421875, -4.70556640625, -4.52862548828125, -4.3516845703125, -4.17474365234375, -3.997802734375, -3.82086181640625, -3.6439208984375, -3.46697998046875, -3.2900390625, -3.11309814453125, -2.9361572265625, -2.75921630859375, -2.582275390625, -2.40533447265625, -2.2283935546875, -2.05145263671875, -1.87451171875, -1.69757080078125, -1.5206298828125, -1.34368896484375, -1.166748046875, -0.98980712890625, -0.8128662109375, -0.63592529296875, -0.458984375, -0.28204345703125, -0.1051025390625, 0.07183837890625, 0.248779296875, 0.42572021484375, 0.6026611328125, 0.77960205078125, 0.95654296875, 1.13348388671875, 1.3104248046875, 1.48736572265625, 1.664306640625, 1.84124755859375, 2.0181884765625, 2.19512939453125, 2.3720703125, 2.54901123046875, 2.7259521484375, 2.90289306640625, 3.079833984375, 3.25677490234375, 3.4337158203125, 3.61065673828125, 3.78759765625, 3.96453857421875, 4.1414794921875, 4.31842041015625, 4.495361328125, 4.67230224609375, 4.8492431640625, 5.02618408203125, 5.203125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 11.0, 11.0, 32.0, 51.0, 65.0, 103.0, 134.0, 142.0, 124.0, 108.0, 95.0, 65.0, 27.0, 17.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8125, -0.76104736328125, -0.7095947265625, -0.65814208984375, -0.606689453125, -0.55523681640625, -0.5037841796875, -0.45233154296875, -0.40087890625, -0.34942626953125, -0.2979736328125, -0.24652099609375, -0.195068359375, -0.14361572265625, -0.0921630859375, -0.04071044921875, 0.0107421875, 0.06219482421875, 0.1136474609375, 0.16510009765625, 0.216552734375, 0.26800537109375, 0.3194580078125, 0.37091064453125, 0.42236328125, 0.47381591796875, 0.5252685546875, 0.57672119140625, 0.628173828125, 0.67962646484375, 0.7310791015625, 0.78253173828125, 0.833984375, 0.88543701171875, 0.9368896484375, 0.98834228515625, 1.039794921875, 1.09124755859375, 1.1427001953125, 1.19415283203125, 1.24560546875, 1.29705810546875, 1.3485107421875, 1.39996337890625, 1.451416015625, 1.50286865234375, 1.5543212890625, 1.60577392578125, 1.6572265625, 1.70867919921875, 1.7601318359375, 1.81158447265625, 1.863037109375, 1.91448974609375, 1.9659423828125, 2.01739501953125, 2.06884765625, 2.12030029296875, 2.1717529296875, 2.22320556640625, 2.274658203125, 2.32611083984375, 2.3775634765625, 2.42901611328125, 2.48046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 1.0, 3.0, 4.0, 4.0, 12.0, 11.0, 12.0, 29.0, 27.0, 55.0, 101.0, 151.0, 267.0, 517.0, 970.0, 2656.0, 9421.0, 46540.0, 327991.0, 546868.0, 90155.0, 15964.0, 4010.0, 1322.0, 629.0, 352.0, 174.0, 109.0, 74.0, 43.0, 31.0, 12.0, 11.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.30078125, -3.1746826171875, -3.048583984375, -2.9224853515625, -2.79638671875, -2.6702880859375, -2.544189453125, -2.4180908203125, -2.2919921875, -2.1658935546875, -2.039794921875, -1.9136962890625, -1.78759765625, -1.6614990234375, -1.535400390625, -1.4093017578125, -1.283203125, -1.1571044921875, -1.031005859375, -0.9049072265625, -0.77880859375, -0.6527099609375, -0.526611328125, -0.4005126953125, -0.2744140625, -0.1483154296875, -0.022216796875, 0.1038818359375, 0.22998046875, 0.3560791015625, 0.482177734375, 0.6082763671875, 0.734375, 0.8604736328125, 0.986572265625, 1.1126708984375, 1.23876953125, 1.3648681640625, 1.490966796875, 1.6170654296875, 1.7431640625, 1.8692626953125, 1.995361328125, 2.1214599609375, 2.24755859375, 2.3736572265625, 2.499755859375, 2.6258544921875, 2.751953125, 2.8780517578125, 3.004150390625, 3.1302490234375, 3.25634765625, 3.3824462890625, 3.508544921875, 3.6346435546875, 3.7607421875, 3.8868408203125, 4.012939453125, 4.1390380859375, 4.26513671875, 4.3912353515625, 4.517333984375, 4.6434326171875, 4.76953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 7.0, 10.0, 19.0, 14.0, 25.0, 20.0, 32.0, 41.0, 53.0, 44.0, 59.0, 47.0, 62.0, 57.0, 47.0, 63.0, 60.0, 56.0, 55.0, 43.0, 34.0, 33.0, 23.0, 18.0, 10.0, 14.0, 12.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.798828125, -2.677520751953125, -2.55621337890625, -2.434906005859375, -2.3135986328125, -2.192291259765625, -2.07098388671875, -1.949676513671875, -1.828369140625, -1.707061767578125, -1.58575439453125, -1.464447021484375, -1.3431396484375, -1.221832275390625, -1.10052490234375, -0.979217529296875, -0.85791015625, -0.736602783203125, -0.61529541015625, -0.493988037109375, -0.3726806640625, -0.251373291015625, -0.13006591796875, -0.008758544921875, 0.112548828125, 0.233856201171875, 0.35516357421875, 0.476470947265625, 0.5977783203125, 0.719085693359375, 0.84039306640625, 0.961700439453125, 1.0830078125, 1.204315185546875, 1.32562255859375, 1.446929931640625, 1.5682373046875, 1.689544677734375, 1.81085205078125, 1.932159423828125, 2.053466796875, 2.174774169921875, 2.29608154296875, 2.417388916015625, 2.5386962890625, 2.660003662109375, 2.78131103515625, 2.902618408203125, 3.02392578125, 3.145233154296875, 3.26654052734375, 3.387847900390625, 3.5091552734375, 3.630462646484375, 3.75177001953125, 3.873077392578125, 3.994384765625, 4.115692138671875, 4.23699951171875, 4.358306884765625, 4.4796142578125, 4.600921630859375, 4.72222900390625, 4.843536376953125, 4.96484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 10.0, 19.0, 31.0, 48.0, 76.0, 118.0, 218.0, 416.0, 918.0, 2282.0, 6307.0, 21903.0, 104266.0, 524549.0, 312916.0, 54399.0, 12975.0, 4069.0, 1588.0, 702.0, 322.0, 160.0, 108.0, 47.0, 38.0, 24.0, 17.0, 8.0, 10.0, 10.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3640289306640625, -1.314971923828125, -1.2659149169921875, -1.21685791015625, -1.1678009033203125, -1.118743896484375, -1.0696868896484375, -1.0206298828125, -0.9715728759765625, -0.922515869140625, -0.8734588623046875, -0.82440185546875, -0.7753448486328125, -0.726287841796875, -0.6772308349609375, -0.628173828125, -0.5791168212890625, -0.530059814453125, -0.4810028076171875, -0.43194580078125, -0.3828887939453125, -0.333831787109375, -0.2847747802734375, -0.2357177734375, -0.1866607666015625, -0.137603759765625, -0.0885467529296875, -0.03948974609375, 0.0095672607421875, 0.058624267578125, 0.1076812744140625, 0.15673828125, 0.2057952880859375, 0.254852294921875, 0.3039093017578125, 0.35296630859375, 0.4020233154296875, 0.451080322265625, 0.5001373291015625, 0.5491943359375, 0.5982513427734375, 0.647308349609375, 0.6963653564453125, 0.74542236328125, 0.7944793701171875, 0.843536376953125, 0.8925933837890625, 0.941650390625, 0.9907073974609375, 1.039764404296875, 1.0888214111328125, 1.13787841796875, 1.1869354248046875, 1.235992431640625, 1.2850494384765625, 1.3341064453125, 1.3831634521484375, 1.432220458984375, 1.4812774658203125, 1.53033447265625, 1.5793914794921875, 1.628448486328125, 1.6775054931640625, 1.7265625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 5.0, 13.0, 9.0, 15.0, 18.0, 22.0, 21.0, 27.0, 44.0, 38.0, 59.0, 72.0, 75.0, 90.0, 85.0, 60.0, 83.0, 47.0, 35.0, 29.0, 25.0, 23.0, 20.0, 14.0, 10.0, 7.0, 8.0, 3.0, 6.0, 7.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.00023102760314941406, -0.00022437795996665955, -0.00021772831678390503, -0.0002110786736011505, -0.000204429030418396, -0.00019777938723564148, -0.00019112974405288696, -0.00018448010087013245, -0.00017783045768737793, -0.0001711808145046234, -0.0001645311713218689, -0.00015788152813911438, -0.00015123188495635986, -0.00014458224177360535, -0.00013793259859085083, -0.0001312829554080963, -0.0001246333122253418, -0.00011798366904258728, -0.00011133402585983276, -0.00010468438267707825, -9.803473949432373e-05, -9.138509631156921e-05, -8.47354531288147e-05, -7.808580994606018e-05, -7.143616676330566e-05, -6.478652358055115e-05, -5.813688039779663e-05, -5.1487237215042114e-05, -4.48375940322876e-05, -3.818795084953308e-05, -3.1538307666778564e-05, -2.4888664484024048e-05, -1.823902130126953e-05, -1.1589378118515015e-05, -4.939734935760498e-06, 1.7099082469940186e-06, 8.359551429748535e-06, 1.5009194612503052e-05, 2.165883779525757e-05, 2.8308480978012085e-05, 3.49581241607666e-05, 4.160776734352112e-05, 4.8257410526275635e-05, 5.490705370903015e-05, 6.155669689178467e-05, 6.820634007453918e-05, 7.48559832572937e-05, 8.150562644004822e-05, 8.815526962280273e-05, 9.480491280555725e-05, 0.00010145455598831177, 0.00010810419917106628, 0.0001147538423538208, 0.00012140348553657532, 0.00012805312871932983, 0.00013470277190208435, 0.00014135241508483887, 0.00014800205826759338, 0.0001546517014503479, 0.00016130134463310242, 0.00016795098781585693, 0.00017460063099861145, 0.00018125027418136597, 0.00018789991736412048, 0.000194549560546875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 16.0, 26.0, 49.0, 89.0, 135.0, 251.0, 672.0, 1718.0, 6053.0, 31353.0, 283612.0, 630491.0, 77709.0, 11718.0, 2776.0, 1025.0, 440.0, 187.0, 110.0, 47.0, 33.0, 16.0, 7.0, 7.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.45159912109375, -2.3778076171875, -2.30401611328125, -2.230224609375, -2.15643310546875, -2.0826416015625, -2.00885009765625, -1.93505859375, -1.86126708984375, -1.7874755859375, -1.71368408203125, -1.639892578125, -1.56610107421875, -1.4923095703125, -1.41851806640625, -1.3447265625, -1.27093505859375, -1.1971435546875, -1.12335205078125, -1.049560546875, -0.97576904296875, -0.9019775390625, -0.82818603515625, -0.75439453125, -0.68060302734375, -0.6068115234375, -0.53302001953125, -0.459228515625, -0.38543701171875, -0.3116455078125, -0.23785400390625, -0.1640625, -0.09027099609375, -0.0164794921875, 0.05731201171875, 0.131103515625, 0.20489501953125, 0.2786865234375, 0.35247802734375, 0.42626953125, 0.50006103515625, 0.5738525390625, 0.64764404296875, 0.721435546875, 0.79522705078125, 0.8690185546875, 0.94281005859375, 1.0166015625, 1.09039306640625, 1.1641845703125, 1.23797607421875, 1.311767578125, 1.38555908203125, 1.4593505859375, 1.53314208984375, 1.60693359375, 1.68072509765625, 1.7545166015625, 1.82830810546875, 1.902099609375, 1.97589111328125, 2.0496826171875, 2.12347412109375, 2.197265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 15.0, 20.0, 22.0, 27.0, 32.0, 38.0, 57.0, 52.0, 64.0, 89.0, 71.0, 67.0, 84.0, 74.0, 50.0, 52.0, 33.0, 27.0, 21.0, 23.0, 17.0, 7.0, 11.0, 9.0, 7.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2802734375, -1.2455673217773438, -1.2108612060546875, -1.1761550903320312, -1.141448974609375, -1.1067428588867188, -1.0720367431640625, -1.0373306274414062, -1.00262451171875, -0.9679183959960938, -0.9332122802734375, -0.8985061645507812, -0.863800048828125, -0.8290939331054688, -0.7943878173828125, -0.7596817016601562, -0.7249755859375, -0.6902694702148438, -0.6555633544921875, -0.6208572387695312, -0.586151123046875, -0.5514450073242188, -0.5167388916015625, -0.48203277587890625, -0.44732666015625, -0.41262054443359375, -0.3779144287109375, -0.34320831298828125, -0.308502197265625, -0.27379608154296875, -0.2390899658203125, -0.20438385009765625, -0.169677734375, -0.13497161865234375, -0.1002655029296875, -0.06555938720703125, -0.030853271484375, 0.00385284423828125, 0.0385589599609375, 0.07326507568359375, 0.10797119140625, 0.14267730712890625, 0.1773834228515625, 0.21208953857421875, 0.246795654296875, 0.28150177001953125, 0.3162078857421875, 0.35091400146484375, 0.3856201171875, 0.42032623291015625, 0.4550323486328125, 0.48973846435546875, 0.524444580078125, 0.5591506958007812, 0.5938568115234375, 0.6285629272460938, 0.66326904296875, 0.6979751586914062, 0.7326812744140625, 0.7673873901367188, 0.802093505859375, 0.8367996215820312, 0.8715057373046875, 0.9062118530273438, 0.94091796875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 6.0, 15.0, 14.0, 19.0, 46.0, 50.0, 95.0, 111.0, 148.0, 143.0, 130.0, 71.0, 58.0, 34.0, 16.0, 12.0, 7.0, 14.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.20459747314453, -21.58837127685547, -20.97214698791504, -20.355920791625977, -19.739694595336914, -19.12346839904785, -18.507244110107422, -17.89101791381836, -17.274791717529297, -16.658565521240234, -16.042341232299805, -15.426115036010742, -14.80988883972168, -14.193663597106934, -13.577438354492188, -12.961212158203125, -12.344986915588379, -11.728761672973633, -11.11253547668457, -10.496310234069824, -9.880084037780762, -9.263858795166016, -8.647632598876953, -8.031407356262207, -7.415181636810303, -6.798955917358398, -6.182730197906494, -5.56650447845459, -4.950279235839844, -4.334053039550781, -3.717827796936035, -3.101602077484131, -2.4853763580322266, -1.8691506385803223, -1.2529250383377075, -0.6366994380950928, -0.020473718643188477, 0.5957520008087158, 1.211977481842041, 1.8282032012939453, 2.4444289207458496, 3.060654640197754, 3.676880359649658, 4.2931060791015625, 4.909331321716309, 5.525557518005371, 6.141782760620117, 6.7580084800720215, 7.374234199523926, 7.99045991897583, 8.606685638427734, 9.22291088104248, 9.839137077331543, 10.455362319946289, 11.071588516235352, 11.687813758850098, 12.304039001464844, 12.92026424407959, 13.536490440368652, 14.152715682983398, 14.768941879272461, 15.385167121887207, 16.001392364501953, 16.617618560791016, 17.233844757080078]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 8.0, 9.0, 4.0, 17.0, 11.0, 19.0, 20.0, 23.0, 15.0, 29.0, 27.0, 29.0, 41.0, 49.0, 44.0, 42.0, 37.0, 50.0, 56.0, 53.0, 42.0, 53.0, 35.0, 36.0, 24.0, 21.0, 27.0, 33.0, 24.0, 28.0, 14.0, 13.0, 11.0, 9.0, 8.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-18.857324600219727, -18.321470260620117, -17.785614013671875, -17.249759674072266, -16.713905334472656, -16.178050994873047, -15.642195701599121, -15.106340408325195, -14.570486068725586, -14.034631729125977, -13.49877643585205, -12.962921142578125, -12.427066802978516, -11.891212463378906, -11.35535717010498, -10.819501876831055, -10.283647537231445, -9.747793197631836, -9.21193790435791, -8.676082611083984, -8.140228271484375, -7.604373455047607, -7.06851863861084, -6.532663822174072, -5.996809005737305, -5.460954189300537, -4.9250993728637695, -4.389244556427002, -3.8533897399902344, -3.317534923553467, -2.781680107116699, -2.2458252906799316, -1.7099723815917969, -1.1741175651550293, -0.6382627487182617, -0.10240793228149414, 0.43344688415527344, 0.969301700592041, 1.5051565170288086, 2.041011333465576, 2.5768661499023438, 3.1127209663391113, 3.648575782775879, 4.1844305992126465, 4.720285415649414, 5.256140232086182, 5.791995048522949, 6.327849864959717, 6.863704681396484, 7.399559497833252, 7.9354143142700195, 8.471269607543945, 9.007123947143555, 9.542978286743164, 10.07883358001709, 10.614688873291016, 11.150543212890625, 11.686397552490234, 12.22225284576416, 12.758108139038086, 13.293962478637695, 13.829816818237305, 14.36567211151123, 14.901527404785156, 15.437381744384766]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 11.0, 14.0, 26.0, 85.0, 217.0, 490.0, 1533.0, 5886.0, 39418.0, 3638888.0, 478921.0, 21874.0, 4061.0, 1273.0, 588.0, 298.0, 192.0, 130.0, 87.0, 73.0, 50.0, 38.0, 30.0, 18.0, 14.0, 14.0, 18.0, 8.0, 8.0, 6.0, 1.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.919921875, -2.651397705078125, -2.38287353515625, -2.114349365234375, -1.8458251953125, -1.577301025390625, -1.30877685546875, -1.040252685546875, -0.771728515625, -0.503204345703125, -0.23468017578125, 0.033843994140625, 0.3023681640625, 0.570892333984375, 0.83941650390625, 1.107940673828125, 1.37646484375, 1.644989013671875, 1.91351318359375, 2.182037353515625, 2.4505615234375, 2.719085693359375, 2.98760986328125, 3.256134033203125, 3.524658203125, 3.793182373046875, 4.06170654296875, 4.330230712890625, 4.5987548828125, 4.867279052734375, 5.13580322265625, 5.404327392578125, 5.6728515625, 5.941375732421875, 6.20989990234375, 6.478424072265625, 6.7469482421875, 7.015472412109375, 7.28399658203125, 7.552520751953125, 7.821044921875, 8.089569091796875, 8.35809326171875, 8.626617431640625, 8.8951416015625, 9.163665771484375, 9.43218994140625, 9.700714111328125, 9.96923828125, 10.237762451171875, 10.50628662109375, 10.774810791015625, 11.0433349609375, 11.311859130859375, 11.58038330078125, 11.848907470703125, 12.117431640625, 12.385955810546875, 12.65447998046875, 12.923004150390625, 13.1915283203125, 13.460052490234375, 13.72857666015625, 13.997100830078125, 14.265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 9.0, 11.0, 23.0, 37.0, 73.0, 105.0, 118.0, 140.0, 133.0, 114.0, 101.0, 62.0, 30.0, 28.0, 15.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5429153442382812, -0.4886627197265625, -0.43441009521484375, -0.380157470703125, -0.32590484619140625, -0.2716522216796875, -0.21739959716796875, -0.16314697265625, -0.10889434814453125, -0.0546417236328125, -0.00038909912109375, 0.053863525390625, 0.10811614990234375, 0.1623687744140625, 0.21662139892578125, 0.2708740234375, 0.32512664794921875, 0.3793792724609375, 0.43363189697265625, 0.487884521484375, 0.5421371459960938, 0.5963897705078125, 0.6506423950195312, 0.70489501953125, 0.7591476440429688, 0.8134002685546875, 0.8676528930664062, 0.921905517578125, 0.9761581420898438, 1.0304107666015625, 1.0846633911132812, 1.138916015625, 1.1931686401367188, 1.2474212646484375, 1.3016738891601562, 1.355926513671875, 1.4101791381835938, 1.4644317626953125, 1.5186843872070312, 1.57293701171875, 1.6271896362304688, 1.6814422607421875, 1.7356948852539062, 1.789947509765625, 1.8442001342773438, 1.8984527587890625, 1.9527053833007812, 2.0069580078125, 2.0612106323242188, 2.1154632568359375, 2.1697158813476562, 2.223968505859375, 2.2782211303710938, 2.3324737548828125, 2.3867263793945312, 2.44097900390625, 2.4952316284179688, 2.5494842529296875, 2.6037368774414062, 2.657989501953125, 2.7122421264648438, 2.7664947509765625, 2.8207473754882812, 2.875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 10.0, 20.0, 27.0, 54.0, 67.0, 135.0, 211.0, 458.0, 1029.0, 2988.0, 13429.0, 870584.0, 3279741.0, 18614.0, 4186.0, 1441.0, 570.0, 293.0, 169.0, 101.0, 63.0, 37.0, 23.0, 17.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.59375, -14.1773681640625, -13.760986328125, -13.3446044921875, -12.92822265625, -12.5118408203125, -12.095458984375, -11.6790771484375, -11.2626953125, -10.8463134765625, -10.429931640625, -10.0135498046875, -9.59716796875, -9.1807861328125, -8.764404296875, -8.3480224609375, -7.931640625, -7.5152587890625, -7.098876953125, -6.6824951171875, -6.26611328125, -5.8497314453125, -5.433349609375, -5.0169677734375, -4.6005859375, -4.1842041015625, -3.767822265625, -3.3514404296875, -2.93505859375, -2.5186767578125, -2.102294921875, -1.6859130859375, -1.26953125, -0.8531494140625, -0.436767578125, -0.0203857421875, 0.39599609375, 0.8123779296875, 1.228759765625, 1.6451416015625, 2.0615234375, 2.4779052734375, 2.894287109375, 3.3106689453125, 3.72705078125, 4.1434326171875, 4.559814453125, 4.9761962890625, 5.392578125, 5.8089599609375, 6.225341796875, 6.6417236328125, 7.05810546875, 7.4744873046875, 7.890869140625, 8.3072509765625, 8.7236328125, 9.1400146484375, 9.556396484375, 9.9727783203125, 10.38916015625, 10.8055419921875, 11.221923828125, 11.6383056640625, 12.0546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 16.0, 23.0, 85.0, 387.0, 2941.0, 400.0, 110.0, 44.0, 23.0, 6.0, 12.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.1715087890625, -4.983642578125, -4.7957763671875, -4.60791015625, -4.4200439453125, -4.232177734375, -4.0443115234375, -3.8564453125, -3.6685791015625, -3.480712890625, -3.2928466796875, -3.10498046875, -2.9171142578125, -2.729248046875, -2.5413818359375, -2.353515625, -2.1656494140625, -1.977783203125, -1.7899169921875, -1.60205078125, -1.4141845703125, -1.226318359375, -1.0384521484375, -0.8505859375, -0.6627197265625, -0.474853515625, -0.2869873046875, -0.09912109375, 0.0887451171875, 0.276611328125, 0.4644775390625, 0.65234375, 0.8402099609375, 1.028076171875, 1.2159423828125, 1.40380859375, 1.5916748046875, 1.779541015625, 1.9674072265625, 2.1552734375, 2.3431396484375, 2.531005859375, 2.7188720703125, 2.90673828125, 3.0946044921875, 3.282470703125, 3.4703369140625, 3.658203125, 3.8460693359375, 4.033935546875, 4.2218017578125, 4.40966796875, 4.5975341796875, 4.785400390625, 4.9732666015625, 5.1611328125, 5.3489990234375, 5.536865234375, 5.7247314453125, 5.91259765625, 6.1004638671875, 6.288330078125, 6.4761962890625, 6.6640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 133.0, 647.0, 190.0, 17.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.46897888183594, -106.36431884765625, -104.25965881347656, -102.1550064086914, -100.05034637451172, -97.94568634033203, -95.84102630615234, -93.73637390136719, -91.6317138671875, -89.52705383300781, -87.42239379882812, -85.31774139404297, -83.21308135986328, -81.1084213256836, -79.0037612915039, -76.89910888671875, -74.79444885253906, -72.68978881835938, -70.58512878417969, -68.48047637939453, -66.37581634521484, -64.27115631103516, -62.16649627685547, -60.06184005737305, -57.957176208496094, -55.852516174316406, -53.747859954833984, -51.6431999206543, -49.538543701171875, -47.43388366699219, -45.3292236328125, -43.22456741333008, -41.11990737915039, -39.0152473449707, -36.91059112548828, -34.805931091308594, -32.70127487182617, -30.596614837646484, -28.49195671081543, -26.387298583984375, -24.28264045715332, -22.177982330322266, -20.07332420349121, -17.968666076660156, -15.864006996154785, -13.75934886932373, -11.65468978881836, -9.550031661987305, -7.44537353515625, -5.340715408325195, -3.2360568046569824, -1.1313982009887695, 0.9732599258422852, 3.07791805267334, 5.182577133178711, 7.287235260009766, 9.39189338684082, 11.496551513671875, 13.60120964050293, 15.7058687210083, 17.810527801513672, 19.915184020996094, 22.01984405517578, 24.124502182006836, 26.22916030883789]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 17.0, 29.0, 43.0, 77.0, 142.0, 133.0, 157.0, 140.0, 97.0, 88.0, 41.0, 18.0, 13.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.270702362060547, -28.42811393737793, -27.585525512695312, -26.742937088012695, -25.900348663330078, -25.05776023864746, -24.215171813964844, -23.372583389282227, -22.52999496459961, -21.687406539916992, -20.844818115234375, -20.002229690551758, -19.15964126586914, -18.317052841186523, -17.474464416503906, -16.63187599182129, -15.789287567138672, -14.946699142456055, -14.104110717773438, -13.26152229309082, -12.418933868408203, -11.576345443725586, -10.733757019042969, -9.891168594360352, -9.048580169677734, -8.205991744995117, -7.3634033203125, -6.520814895629883, -5.678226470947266, -4.835638046264648, -3.9930496215820312, -3.150461196899414, -2.307870864868164, -1.4652824401855469, -0.6226940155029297, 0.2198944091796875, 1.0624828338623047, 1.9050712585449219, 2.747659683227539, 3.5902481079101562, 4.432836532592773, 5.275424957275391, 6.118013381958008, 6.960601806640625, 7.803190231323242, 8.64577865600586, 9.488367080688477, 10.330955505371094, 11.173543930053711, 12.016132354736328, 12.858720779418945, 13.701309204101562, 14.54389762878418, 15.386486053466797, 16.229074478149414, 17.07166290283203, 17.91425132751465, 18.756839752197266, 19.599428176879883, 20.4420166015625, 21.284605026245117, 22.127193450927734, 22.96978187561035, 23.81237030029297, 24.654958724975586]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 15.0, 16.0, 32.0, 36.0, 45.0, 68.0, 85.0, 109.0, 177.0, 295.0, 470.0, 868.0, 1699.0, 4186.0, 13080.0, 57922.0, 333322.0, 507906.0, 97552.0, 20009.0, 5874.0, 2115.0, 1056.0, 528.0, 334.0, 197.0, 148.0, 92.0, 77.0, 55.0, 51.0, 27.0, 27.0, 12.0, 12.0, 6.0, 4.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0], "bins": [-4.8203125, -4.6749267578125, -4.529541015625, -4.3841552734375, -4.23876953125, -4.0933837890625, -3.947998046875, -3.8026123046875, -3.6572265625, -3.5118408203125, -3.366455078125, -3.2210693359375, -3.07568359375, -2.9302978515625, -2.784912109375, -2.6395263671875, -2.494140625, -2.3487548828125, -2.203369140625, -2.0579833984375, -1.91259765625, -1.7672119140625, -1.621826171875, -1.4764404296875, -1.3310546875, -1.1856689453125, -1.040283203125, -0.8948974609375, -0.74951171875, -0.6041259765625, -0.458740234375, -0.3133544921875, -0.16796875, -0.0225830078125, 0.122802734375, 0.2681884765625, 0.41357421875, 0.5589599609375, 0.704345703125, 0.8497314453125, 0.9951171875, 1.1405029296875, 1.285888671875, 1.4312744140625, 1.57666015625, 1.7220458984375, 1.867431640625, 2.0128173828125, 2.158203125, 2.3035888671875, 2.448974609375, 2.5943603515625, 2.73974609375, 2.8851318359375, 3.030517578125, 3.1759033203125, 3.3212890625, 3.4666748046875, 3.612060546875, 3.7574462890625, 3.90283203125, 4.0482177734375, 4.193603515625, 4.3389892578125, 4.484375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 1.0, 8.0, 6.0, 16.0, 20.0, 44.0, 55.0, 75.0, 95.0, 108.0, 99.0, 102.0, 113.0, 80.0, 65.0, 38.0, 31.0, 18.0, 14.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.91943359375, -0.8728408813476562, -0.8262481689453125, -0.7796554565429688, -0.733062744140625, -0.6864700317382812, -0.6398773193359375, -0.5932846069335938, -0.54669189453125, -0.5000991821289062, -0.4535064697265625, -0.40691375732421875, -0.360321044921875, -0.31372833251953125, -0.2671356201171875, -0.22054290771484375, -0.1739501953125, -0.12735748291015625, -0.0807647705078125, -0.03417205810546875, 0.012420654296875, 0.05901336669921875, 0.1056060791015625, 0.15219879150390625, 0.19879150390625, 0.24538421630859375, 0.2919769287109375, 0.33856964111328125, 0.385162353515625, 0.43175506591796875, 0.4783477783203125, 0.5249404907226562, 0.571533203125, 0.6181259155273438, 0.6647186279296875, 0.7113113403320312, 0.757904052734375, 0.8044967651367188, 0.8510894775390625, 0.8976821899414062, 0.94427490234375, 0.9908676147460938, 1.0374603271484375, 1.0840530395507812, 1.130645751953125, 1.1772384643554688, 1.2238311767578125, 1.2704238891601562, 1.3170166015625, 1.3636093139648438, 1.4102020263671875, 1.4567947387695312, 1.503387451171875, 1.5499801635742188, 1.5965728759765625, 1.6431655883789062, 1.68975830078125, 1.7363510131835938, 1.7829437255859375, 1.8295364379882812, 1.876129150390625, 1.9227218627929688, 1.9693145751953125, 2.0159072875976562, 2.0625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 12.0, 4.0, 20.0, 23.0, 34.0, 58.0, 89.0, 131.0, 244.0, 374.0, 735.0, 1436.0, 3156.0, 7580.0, 20527.0, 60562.0, 190990.0, 421691.0, 227500.0, 72646.0, 24312.0, 9088.0, 3731.0, 1653.0, 788.0, 445.0, 254.0, 154.0, 114.0, 65.0, 35.0, 27.0, 28.0, 13.0, 11.0, 6.0, 6.0, 5.0, 3.0, 0.0, 2.0], "bins": [-3.26953125, -3.18896484375, -3.1083984375, -3.02783203125, -2.947265625, -2.86669921875, -2.7861328125, -2.70556640625, -2.625, -2.54443359375, -2.4638671875, -2.38330078125, -2.302734375, -2.22216796875, -2.1416015625, -2.06103515625, -1.98046875, -1.89990234375, -1.8193359375, -1.73876953125, -1.658203125, -1.57763671875, -1.4970703125, -1.41650390625, -1.3359375, -1.25537109375, -1.1748046875, -1.09423828125, -1.013671875, -0.93310546875, -0.8525390625, -0.77197265625, -0.69140625, -0.61083984375, -0.5302734375, -0.44970703125, -0.369140625, -0.28857421875, -0.2080078125, -0.12744140625, -0.046875, 0.03369140625, 0.1142578125, 0.19482421875, 0.275390625, 0.35595703125, 0.4365234375, 0.51708984375, 0.59765625, 0.67822265625, 0.7587890625, 0.83935546875, 0.919921875, 1.00048828125, 1.0810546875, 1.16162109375, 1.2421875, 1.32275390625, 1.4033203125, 1.48388671875, 1.564453125, 1.64501953125, 1.7255859375, 1.80615234375, 1.88671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 11.0, 6.0, 12.0, 8.0, 11.0, 16.0, 18.0, 14.0, 20.0, 23.0, 23.0, 28.0, 30.0, 34.0, 31.0, 38.0, 36.0, 46.0, 53.0, 42.0, 37.0, 37.0, 56.0, 50.0, 29.0, 35.0, 31.0, 37.0, 39.0, 23.0, 21.0, 17.0, 10.0, 21.0, 12.0, 6.0, 5.0, 9.0, 11.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.9296875, -2.839385986328125, -2.74908447265625, -2.658782958984375, -2.5684814453125, -2.478179931640625, -2.38787841796875, -2.297576904296875, -2.207275390625, -2.116973876953125, -2.02667236328125, -1.936370849609375, -1.8460693359375, -1.755767822265625, -1.66546630859375, -1.575164794921875, -1.48486328125, -1.394561767578125, -1.30426025390625, -1.213958740234375, -1.1236572265625, -1.033355712890625, -0.94305419921875, -0.852752685546875, -0.762451171875, -0.672149658203125, -0.58184814453125, -0.491546630859375, -0.4012451171875, -0.310943603515625, -0.22064208984375, -0.130340576171875, -0.0400390625, 0.050262451171875, 0.14056396484375, 0.230865478515625, 0.3211669921875, 0.411468505859375, 0.50177001953125, 0.592071533203125, 0.682373046875, 0.772674560546875, 0.86297607421875, 0.953277587890625, 1.0435791015625, 1.133880615234375, 1.22418212890625, 1.314483642578125, 1.40478515625, 1.495086669921875, 1.58538818359375, 1.675689697265625, 1.7659912109375, 1.856292724609375, 1.94659423828125, 2.036895751953125, 2.127197265625, 2.217498779296875, 2.30780029296875, 2.398101806640625, 2.4884033203125, 2.578704833984375, 2.66900634765625, 2.759307861328125, 2.849609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 8.0, 6.0, 7.0, 15.0, 22.0, 32.0, 45.0, 81.0, 120.0, 206.0, 313.0, 630.0, 1204.0, 2230.0, 5085.0, 12832.0, 43467.0, 210864.0, 581848.0, 139754.0, 31391.0, 10122.0, 4047.0, 1924.0, 955.0, 550.0, 310.0, 168.0, 108.0, 60.0, 33.0, 39.0, 19.0, 17.0, 13.0, 5.0, 11.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.583984375, -1.5318450927734375, -1.479705810546875, -1.4275665283203125, -1.37542724609375, -1.3232879638671875, -1.271148681640625, -1.2190093994140625, -1.1668701171875, -1.1147308349609375, -1.062591552734375, -1.0104522705078125, -0.95831298828125, -0.9061737060546875, -0.854034423828125, -0.8018951416015625, -0.749755859375, -0.6976165771484375, -0.645477294921875, -0.5933380126953125, -0.54119873046875, -0.4890594482421875, -0.436920166015625, -0.3847808837890625, -0.3326416015625, -0.2805023193359375, -0.228363037109375, -0.1762237548828125, -0.12408447265625, -0.0719451904296875, -0.019805908203125, 0.0323333740234375, 0.08447265625, 0.1366119384765625, 0.188751220703125, 0.2408905029296875, 0.29302978515625, 0.3451690673828125, 0.397308349609375, 0.4494476318359375, 0.5015869140625, 0.5537261962890625, 0.605865478515625, 0.6580047607421875, 0.71014404296875, 0.7622833251953125, 0.814422607421875, 0.8665618896484375, 0.918701171875, 0.9708404541015625, 1.022979736328125, 1.0751190185546875, 1.12725830078125, 1.1793975830078125, 1.231536865234375, 1.2836761474609375, 1.3358154296875, 1.3879547119140625, 1.440093994140625, 1.4922332763671875, 1.54437255859375, 1.5965118408203125, 1.648651123046875, 1.7007904052734375, 1.7529296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 9.0, 9.0, 18.0, 24.0, 41.0, 65.0, 65.0, 140.0, 194.0, 181.0, 77.0, 61.0, 26.0, 26.0, 19.0, 5.0, 11.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041103363037109375, -0.0003988109529018402, -0.00038658827543258667, -0.00037436559796333313, -0.0003621429204940796, -0.00034992024302482605, -0.0003376975655555725, -0.00032547488808631897, -0.00031325221061706543, -0.0003010295331478119, -0.00028880685567855835, -0.0002765841782093048, -0.00026436150074005127, -0.00025213882327079773, -0.0002399161458015442, -0.00022769346833229065, -0.0002154707908630371, -0.00020324811339378357, -0.00019102543592453003, -0.0001788027584552765, -0.00016658008098602295, -0.0001543574035167694, -0.00014213472604751587, -0.00012991204857826233, -0.00011768937110900879, -0.00010546669363975525, -9.324401617050171e-05, -8.102133870124817e-05, -6.879866123199463e-05, -5.657598376274109e-05, -4.435330629348755e-05, -3.213062882423401e-05, -1.990795135498047e-05, -7.685273885726929e-06, 4.537403583526611e-06, 1.676008105278015e-05, 2.898275852203369e-05, 4.120543599128723e-05, 5.342811346054077e-05, 6.565079092979431e-05, 7.787346839904785e-05, 9.009614586830139e-05, 0.00010231882333755493, 0.00011454150080680847, 0.000126764178276062, 0.00013898685574531555, 0.0001512095332145691, 0.00016343221068382263, 0.00017565488815307617, 0.0001878775656223297, 0.00020010024309158325, 0.0002123229205608368, 0.00022454559803009033, 0.00023676827549934387, 0.0002489909529685974, 0.00026121363043785095, 0.0002734363079071045, 0.00028565898537635803, 0.00029788166284561157, 0.0003101043403148651, 0.00032232701778411865, 0.0003345496952533722, 0.00034677237272262573, 0.00035899505019187927, 0.0003712177276611328]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 9.0, 8.0, 12.0, 20.0, 35.0, 33.0, 65.0, 92.0, 157.0, 263.0, 476.0, 828.0, 1578.0, 3380.0, 8682.0, 26002.0, 98274.0, 473201.0, 333614.0, 69740.0, 19300.0, 6812.0, 2825.0, 1370.0, 745.0, 416.0, 238.0, 137.0, 72.0, 56.0, 33.0, 24.0, 14.0, 11.0, 14.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.611328125, -1.557403564453125, -1.50347900390625, -1.449554443359375, -1.3956298828125, -1.341705322265625, -1.28778076171875, -1.233856201171875, -1.179931640625, -1.126007080078125, -1.07208251953125, -1.018157958984375, -0.9642333984375, -0.910308837890625, -0.85638427734375, -0.802459716796875, -0.74853515625, -0.694610595703125, -0.64068603515625, -0.586761474609375, -0.5328369140625, -0.478912353515625, -0.42498779296875, -0.371063232421875, -0.317138671875, -0.263214111328125, -0.20928955078125, -0.155364990234375, -0.1014404296875, -0.047515869140625, 0.00640869140625, 0.060333251953125, 0.1142578125, 0.168182373046875, 0.22210693359375, 0.276031494140625, 0.3299560546875, 0.383880615234375, 0.43780517578125, 0.491729736328125, 0.545654296875, 0.599578857421875, 0.65350341796875, 0.707427978515625, 0.7613525390625, 0.815277099609375, 0.86920166015625, 0.923126220703125, 0.97705078125, 1.030975341796875, 1.08489990234375, 1.138824462890625, 1.1927490234375, 1.246673583984375, 1.30059814453125, 1.354522705078125, 1.408447265625, 1.462371826171875, 1.51629638671875, 1.570220947265625, 1.6241455078125, 1.678070068359375, 1.73199462890625, 1.785919189453125, 1.83984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 14.0, 10.0, 27.0, 44.0, 49.0, 78.0, 113.0, 147.0, 139.0, 117.0, 78.0, 50.0, 33.0, 19.0, 13.0, 16.0, 13.0, 3.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01171875, -1.94451904296875, -1.8773193359375, -1.81011962890625, -1.742919921875, -1.67572021484375, -1.6085205078125, -1.54132080078125, -1.47412109375, -1.40692138671875, -1.3397216796875, -1.27252197265625, -1.205322265625, -1.13812255859375, -1.0709228515625, -1.00372314453125, -0.9365234375, -0.86932373046875, -0.8021240234375, -0.73492431640625, -0.667724609375, -0.60052490234375, -0.5333251953125, -0.46612548828125, -0.39892578125, -0.33172607421875, -0.2645263671875, -0.19732666015625, -0.130126953125, -0.06292724609375, 0.0042724609375, 0.07147216796875, 0.138671875, 0.20587158203125, 0.2730712890625, 0.34027099609375, 0.407470703125, 0.47467041015625, 0.5418701171875, 0.60906982421875, 0.67626953125, 0.74346923828125, 0.8106689453125, 0.87786865234375, 0.945068359375, 1.01226806640625, 1.0794677734375, 1.14666748046875, 1.2138671875, 1.28106689453125, 1.3482666015625, 1.41546630859375, 1.482666015625, 1.54986572265625, 1.6170654296875, 1.68426513671875, 1.75146484375, 1.81866455078125, 1.8858642578125, 1.95306396484375, 2.020263671875, 2.08746337890625, 2.1546630859375, 2.22186279296875, 2.2890625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 10.0, 6.0, 20.0, 44.0, 86.0, 189.0, 275.0, 184.0, 107.0, 40.0, 25.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.461505889892578, -23.28386878967285, -22.106229782104492, -20.928592681884766, -19.750953674316406, -18.57331657409668, -17.395679473876953, -16.218040466308594, -15.040403366088867, -13.862765312194824, -12.685127258300781, -11.507490158081055, -10.329852104187012, -9.152214050292969, -7.974576473236084, -6.796938896179199, -5.619300842285156, -4.441662788391113, -3.2640252113342285, -2.0863873958587646, -0.9087495803833008, 0.2688884735107422, 1.446526050567627, 2.6241636276245117, 3.8018016815185547, 4.979439735412598, 6.157077312469482, 7.334714889526367, 8.51235294342041, 9.689990997314453, 10.86762809753418, 12.045266151428223, 13.222900390625, 14.400538444519043, 15.578176498413086, 16.755813598632812, 17.933452606201172, 19.1110897064209, 20.288726806640625, 21.466365814208984, 22.64400291442871, 23.821640014648438, 24.999279022216797, 26.176916122436523, 27.35455322265625, 28.53219223022461, 29.709829330444336, 30.887466430664062, 32.06510543823242, 33.24274444580078, 34.420379638671875, 35.598018646240234, 36.775657653808594, 37.95329284667969, 39.13093185424805, 40.308570861816406, 41.4862060546875, 42.66384506225586, 43.84148025512695, 45.01911926269531, 46.19675827026367, 47.37439727783203, 48.552032470703125, 49.729671478271484, 50.907310485839844]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 7.0, 7.0, 11.0, 14.0, 24.0, 34.0, 26.0, 36.0, 47.0, 45.0, 42.0, 52.0, 51.0, 49.0, 66.0, 70.0, 54.0, 49.0, 44.0, 53.0, 46.0, 36.0, 31.0, 25.0, 21.0, 18.0, 13.0, 9.0, 8.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.97154998779297, -24.275362014770508, -23.579174041748047, -22.882986068725586, -22.186798095703125, -21.490610122680664, -20.794422149658203, -20.098236083984375, -19.40204620361328, -18.70585823059082, -18.00967025756836, -17.3134822845459, -16.617294311523438, -15.921106338500977, -15.224919319152832, -14.528731346130371, -13.832544326782227, -13.136356353759766, -12.440168380737305, -11.743980407714844, -11.047792434692383, -10.351604461669922, -9.655417442321777, -8.959229469299316, -8.263041496276855, -7.5668535232543945, -6.870665550231934, -6.174478054046631, -5.47829008102417, -4.782102108001709, -4.085914611816406, -3.3897266387939453, -2.693540573120117, -1.9973527193069458, -1.3011648654937744, -0.6049771308898926, 0.09121084213256836, 0.7873988151550293, 1.483586311340332, 2.179774284362793, 2.875962257385254, 3.572150230407715, 4.268338203430176, 4.9645256996154785, 5.6607136726379395, 6.3569016456604, 7.053089141845703, 7.749277114868164, 8.445465087890625, 9.141653060913086, 9.837841033935547, 10.534029006958008, 11.230216979980469, 11.92640495300293, 12.622591972351074, 13.318779945373535, 14.014967918395996, 14.711155891418457, 15.407343864440918, 16.103530883789062, 16.799718856811523, 17.495906829833984, 18.192094802856445, 18.888282775878906, 19.584470748901367]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 13.0, 10.0, 21.0, 16.0, 25.0, 45.0, 63.0, 120.0, 195.0, 377.0, 758.0, 1704.0, 4984.0, 20221.0, 327143.0, 3789889.0, 36664.0, 7255.0, 2412.0, 1029.0, 486.0, 268.0, 194.0, 94.0, 77.0, 39.0, 42.0, 37.0, 20.0, 24.0, 10.0, 10.0, 7.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.91015625, -6.7017822265625, -6.493408203125, -6.2850341796875, -6.07666015625, -5.8682861328125, -5.659912109375, -5.4515380859375, -5.2431640625, -5.0347900390625, -4.826416015625, -4.6180419921875, -4.40966796875, -4.2012939453125, -3.992919921875, -3.7845458984375, -3.576171875, -3.3677978515625, -3.159423828125, -2.9510498046875, -2.74267578125, -2.5343017578125, -2.325927734375, -2.1175537109375, -1.9091796875, -1.7008056640625, -1.492431640625, -1.2840576171875, -1.07568359375, -0.8673095703125, -0.658935546875, -0.4505615234375, -0.2421875, -0.0338134765625, 0.174560546875, 0.3829345703125, 0.59130859375, 0.7996826171875, 1.008056640625, 1.2164306640625, 1.4248046875, 1.6331787109375, 1.841552734375, 2.0499267578125, 2.25830078125, 2.4666748046875, 2.675048828125, 2.8834228515625, 3.091796875, 3.3001708984375, 3.508544921875, 3.7169189453125, 3.92529296875, 4.1336669921875, 4.342041015625, 4.5504150390625, 4.7587890625, 4.9671630859375, 5.175537109375, 5.3839111328125, 5.59228515625, 5.8006591796875, 6.009033203125, 6.2174072265625, 6.42578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 11.0, 7.0, 16.0, 14.0, 42.0, 43.0, 63.0, 73.0, 74.0, 102.0, 80.0, 86.0, 67.0, 75.0, 70.0, 60.0, 34.0, 28.0, 12.0, 21.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86279296875, -0.8211593627929688, -0.7795257568359375, -0.7378921508789062, -0.696258544921875, -0.6546249389648438, -0.6129913330078125, -0.5713577270507812, -0.52972412109375, -0.48809051513671875, -0.4464569091796875, -0.40482330322265625, -0.363189697265625, -0.32155609130859375, -0.2799224853515625, -0.23828887939453125, -0.1966552734375, -0.15502166748046875, -0.1133880615234375, -0.07175445556640625, -0.030120849609375, 0.01151275634765625, 0.0531463623046875, 0.09477996826171875, 0.13641357421875, 0.17804718017578125, 0.2196807861328125, 0.26131439208984375, 0.302947998046875, 0.34458160400390625, 0.3862152099609375, 0.42784881591796875, 0.469482421875, 0.5111160278320312, 0.5527496337890625, 0.5943832397460938, 0.636016845703125, 0.6776504516601562, 0.7192840576171875, 0.7609176635742188, 0.80255126953125, 0.8441848754882812, 0.8858184814453125, 0.9274520874023438, 0.969085693359375, 1.0107192993164062, 1.0523529052734375, 1.0939865112304688, 1.1356201171875, 1.1772537231445312, 1.2188873291015625, 1.2605209350585938, 1.302154541015625, 1.3437881469726562, 1.3854217529296875, 1.4270553588867188, 1.46868896484375, 1.5103225708007812, 1.5519561767578125, 1.5935897827148438, 1.635223388671875, 1.6768569946289062, 1.7184906005859375, 1.7601242065429688, 1.8017578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 3.0, 9.0, 13.0, 11.0, 18.0, 18.0, 35.0, 49.0, 55.0, 93.0, 90.0, 158.0, 215.0, 317.0, 582.0, 1016.0, 1801.0, 3758.0, 8146.0, 20981.0, 77525.0, 1039301.0, 2887475.0, 107297.0, 26448.0, 9674.0, 4341.0, 2131.0, 1134.0, 619.0, 328.0, 204.0, 132.0, 78.0, 70.0, 48.0, 28.0, 19.0, 10.0, 13.0, 14.0, 4.0, 3.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.087890625, -2.98858642578125, -2.8892822265625, -2.78997802734375, -2.690673828125, -2.59136962890625, -2.4920654296875, -2.39276123046875, -2.29345703125, -2.19415283203125, -2.0948486328125, -1.99554443359375, -1.896240234375, -1.79693603515625, -1.6976318359375, -1.59832763671875, -1.4990234375, -1.39971923828125, -1.3004150390625, -1.20111083984375, -1.101806640625, -1.00250244140625, -0.9031982421875, -0.80389404296875, -0.70458984375, -0.60528564453125, -0.5059814453125, -0.40667724609375, -0.307373046875, -0.20806884765625, -0.1087646484375, -0.00946044921875, 0.08984375, 0.18914794921875, 0.2884521484375, 0.38775634765625, 0.487060546875, 0.58636474609375, 0.6856689453125, 0.78497314453125, 0.88427734375, 0.98358154296875, 1.0828857421875, 1.18218994140625, 1.281494140625, 1.38079833984375, 1.4801025390625, 1.57940673828125, 1.6787109375, 1.77801513671875, 1.8773193359375, 1.97662353515625, 2.075927734375, 2.17523193359375, 2.2745361328125, 2.37384033203125, 2.47314453125, 2.57244873046875, 2.6717529296875, 2.77105712890625, 2.870361328125, 2.96966552734375, 3.0689697265625, 3.16827392578125, 3.267578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 7.0, 8.0, 5.0, 7.0, 11.0, 16.0, 31.0, 48.0, 85.0, 186.0, 482.0, 2102.0, 636.0, 196.0, 84.0, 56.0, 34.0, 26.0, 18.0, 9.0, 9.0, 6.0, 2.0, 2.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.34375, -2.2912445068359375, -2.238739013671875, -2.1862335205078125, -2.13372802734375, -2.0812225341796875, -2.028717041015625, -1.9762115478515625, -1.9237060546875, -1.8712005615234375, -1.818695068359375, -1.7661895751953125, -1.71368408203125, -1.6611785888671875, -1.608673095703125, -1.5561676025390625, -1.503662109375, -1.4511566162109375, -1.398651123046875, -1.3461456298828125, -1.29364013671875, -1.2411346435546875, -1.188629150390625, -1.1361236572265625, -1.0836181640625, -1.0311126708984375, -0.978607177734375, -0.9261016845703125, -0.87359619140625, -0.8210906982421875, -0.768585205078125, -0.7160797119140625, -0.66357421875, -0.6110687255859375, -0.558563232421875, -0.5060577392578125, -0.45355224609375, -0.4010467529296875, -0.348541259765625, -0.2960357666015625, -0.2435302734375, -0.1910247802734375, -0.138519287109375, -0.0860137939453125, -0.03350830078125, 0.0189971923828125, 0.071502685546875, 0.1240081787109375, 0.176513671875, 0.2290191650390625, 0.281524658203125, 0.3340301513671875, 0.38653564453125, 0.4390411376953125, 0.491546630859375, 0.5440521240234375, 0.5965576171875, 0.6490631103515625, 0.701568603515625, 0.7540740966796875, 0.80657958984375, 0.8590850830078125, 0.911590576171875, 0.9640960693359375, 1.0166015625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 12.0, 41.0, 197.0, 445.0, 242.0, 64.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.0708122253418, -42.25343704223633, -41.436065673828125, -40.618690490722656, -39.80131530761719, -38.98394012451172, -38.166568756103516, -37.34919357299805, -36.53181838989258, -35.71444320678711, -34.897071838378906, -34.07969665527344, -33.26232147216797, -32.4449462890625, -31.627573013305664, -30.810199737548828, -29.99282455444336, -29.175451278686523, -28.358076095581055, -27.54070281982422, -26.72332763671875, -25.905954360961914, -25.088579177856445, -24.27120590209961, -23.453832626342773, -22.636459350585938, -21.81908416748047, -21.001710891723633, -20.184335708618164, -19.366962432861328, -18.54958724975586, -17.732213973999023, -16.914838790893555, -16.09746551513672, -15.28009033203125, -14.462716102600098, -13.645341873168945, -12.82796859741211, -12.01059341430664, -11.193220138549805, -10.375844955444336, -9.558470726013184, -8.741096496582031, -7.923722267150879, -7.106348037719727, -6.288974285125732, -5.47160005569458, -4.654225826263428, -3.8368520736694336, -3.0194778442382812, -2.202103614807129, -1.3847296237945557, -0.5673553943634033, 0.2500185966491699, 1.0673928260803223, 1.8847670555114746, 2.702141284942627, 3.5195155143737793, 4.336889743804932, 5.154263496398926, 5.971637725830078, 6.7890119552612305, 7.606386184692383, 8.423760414123535, 9.241134643554688]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 9.0, 21.0, 21.0, 20.0, 25.0, 28.0, 31.0, 38.0, 42.0, 51.0, 62.0, 70.0, 62.0, 63.0, 54.0, 56.0, 48.0, 41.0, 47.0, 30.0, 30.0, 28.0, 22.0, 22.0, 23.0, 6.0, 6.0, 10.0, 12.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.072479248046875, -5.903938293457031, -5.735397815704346, -5.566856861114502, -5.398316383361816, -5.229775428771973, -5.061234474182129, -4.892693996429443, -4.724153518676758, -4.555612564086914, -4.3870720863342285, -4.218531131744385, -4.049990653991699, -3.8814496994018555, -3.712908983230591, -3.544368267059326, -3.3758273124694824, -3.2072865962982178, -3.038745880126953, -2.8702049255371094, -2.701664447784424, -2.53312349319458, -2.3645827770233154, -2.196042060852051, -2.027501344680786, -1.8589606285095215, -1.6904199123382568, -1.5218790769577026, -1.353338360786438, -1.1847976446151733, -1.0162568092346191, -0.8477160930633545, -0.679175853729248, -0.5106351375579834, -0.342094361782074, -0.17355358600616455, -0.005012869834899902, 0.16352784633636475, 0.33206868171691895, 0.5006093978881836, 0.6691501140594482, 0.8376908302307129, 1.0062315464019775, 1.1747723817825317, 1.3433130979537964, 1.511853814125061, 1.6803946495056152, 1.8489353656768799, 2.0174760818481445, 2.186016798019409, 2.354557514190674, 2.5230984687805176, 2.691638946533203, 2.860179901123047, 3.0287206172943115, 3.197261333465576, 3.365802049636841, 3.5343427658081055, 3.70288348197937, 3.8714241981506348, 4.0399651527404785, 4.208505630493164, 4.377046585083008, 4.545587539672852, 4.714128017425537]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 12.0, 16.0, 22.0, 14.0, 39.0, 41.0, 64.0, 82.0, 142.0, 190.0, 252.0, 407.0, 707.0, 1364.0, 2744.0, 6669.0, 19671.0, 70631.0, 283531.0, 462337.0, 143415.0, 36327.0, 11134.0, 4278.0, 1865.0, 979.0, 594.0, 348.0, 191.0, 148.0, 83.0, 67.0, 54.0, 32.0, 31.0, 17.0, 5.0, 7.0, 11.0, 3.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.880859375, -3.760528564453125, -3.64019775390625, -3.519866943359375, -3.3995361328125, -3.279205322265625, -3.15887451171875, -3.038543701171875, -2.918212890625, -2.797882080078125, -2.67755126953125, -2.557220458984375, -2.4368896484375, -2.316558837890625, -2.19622802734375, -2.075897216796875, -1.95556640625, -1.835235595703125, -1.71490478515625, -1.594573974609375, -1.4742431640625, -1.353912353515625, -1.23358154296875, -1.113250732421875, -0.992919921875, -0.872589111328125, -0.75225830078125, -0.631927490234375, -0.5115966796875, -0.391265869140625, -0.27093505859375, -0.150604248046875, -0.0302734375, 0.090057373046875, 0.21038818359375, 0.330718994140625, 0.4510498046875, 0.571380615234375, 0.69171142578125, 0.812042236328125, 0.932373046875, 1.052703857421875, 1.17303466796875, 1.293365478515625, 1.4136962890625, 1.534027099609375, 1.65435791015625, 1.774688720703125, 1.89501953125, 2.015350341796875, 2.13568115234375, 2.256011962890625, 2.3763427734375, 2.496673583984375, 2.61700439453125, 2.737335205078125, 2.857666015625, 2.977996826171875, 3.09832763671875, 3.218658447265625, 3.3389892578125, 3.459320068359375, 3.57965087890625, 3.699981689453125, 3.8203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 12.0, 13.0, 27.0, 42.0, 52.0, 63.0, 79.0, 92.0, 81.0, 91.0, 85.0, 73.0, 78.0, 62.0, 54.0, 28.0, 22.0, 12.0, 15.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9462890625, -0.902130126953125, -0.85797119140625, -0.813812255859375, -0.7696533203125, -0.725494384765625, -0.68133544921875, -0.637176513671875, -0.593017578125, -0.548858642578125, -0.50469970703125, -0.460540771484375, -0.4163818359375, -0.372222900390625, -0.32806396484375, -0.283905029296875, -0.23974609375, -0.195587158203125, -0.15142822265625, -0.107269287109375, -0.0631103515625, -0.018951416015625, 0.02520751953125, 0.069366455078125, 0.113525390625, 0.157684326171875, 0.20184326171875, 0.246002197265625, 0.2901611328125, 0.334320068359375, 0.37847900390625, 0.422637939453125, 0.466796875, 0.510955810546875, 0.55511474609375, 0.599273681640625, 0.6434326171875, 0.687591552734375, 0.73175048828125, 0.775909423828125, 0.820068359375, 0.864227294921875, 0.90838623046875, 0.952545166015625, 0.9967041015625, 1.040863037109375, 1.08502197265625, 1.129180908203125, 1.17333984375, 1.217498779296875, 1.26165771484375, 1.305816650390625, 1.3499755859375, 1.394134521484375, 1.43829345703125, 1.482452392578125, 1.526611328125, 1.570770263671875, 1.61492919921875, 1.659088134765625, 1.7032470703125, 1.747406005859375, 1.79156494140625, 1.835723876953125, 1.8798828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 6.0, 10.0, 8.0, 17.0, 17.0, 23.0, 25.0, 48.0, 61.0, 87.0, 114.0, 180.0, 244.0, 410.0, 618.0, 1123.0, 2058.0, 3780.0, 7549.0, 16356.0, 37818.0, 93632.0, 228504.0, 343705.0, 181758.0, 73326.0, 29977.0, 13296.0, 6327.0, 3153.0, 1671.0, 945.0, 587.0, 367.0, 218.0, 154.0, 96.0, 63.0, 72.0, 32.0, 27.0, 19.0, 11.0, 21.0, 12.0, 2.0, 7.0, 5.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-2.111328125, -2.0480499267578125, -1.984771728515625, -1.9214935302734375, -1.85821533203125, -1.7949371337890625, -1.731658935546875, -1.6683807373046875, -1.6051025390625, -1.5418243408203125, -1.478546142578125, -1.4152679443359375, -1.35198974609375, -1.2887115478515625, -1.225433349609375, -1.1621551513671875, -1.098876953125, -1.0355987548828125, -0.972320556640625, -0.9090423583984375, -0.84576416015625, -0.7824859619140625, -0.719207763671875, -0.6559295654296875, -0.5926513671875, -0.5293731689453125, -0.466094970703125, -0.4028167724609375, -0.33953857421875, -0.2762603759765625, -0.212982177734375, -0.1497039794921875, -0.08642578125, -0.0231475830078125, 0.040130615234375, 0.1034088134765625, 0.16668701171875, 0.2299652099609375, 0.293243408203125, 0.3565216064453125, 0.4197998046875, 0.4830780029296875, 0.546356201171875, 0.6096343994140625, 0.67291259765625, 0.7361907958984375, 0.799468994140625, 0.8627471923828125, 0.926025390625, 0.9893035888671875, 1.052581787109375, 1.1158599853515625, 1.17913818359375, 1.2424163818359375, 1.305694580078125, 1.3689727783203125, 1.4322509765625, 1.4955291748046875, 1.558807373046875, 1.6220855712890625, 1.68536376953125, 1.7486419677734375, 1.811920166015625, 1.8751983642578125, 1.9384765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 16.0, 14.0, 21.0, 14.0, 17.0, 22.0, 16.0, 36.0, 28.0, 32.0, 39.0, 35.0, 39.0, 48.0, 42.0, 54.0, 57.0, 47.0, 44.0, 43.0, 50.0, 36.0, 35.0, 25.0, 32.0, 17.0, 26.0, 15.0, 12.0, 12.0, 9.0, 9.0, 10.0, 7.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.928070068359375, -2.82489013671875, -2.721710205078125, -2.6185302734375, -2.515350341796875, -2.41217041015625, -2.308990478515625, -2.205810546875, -2.102630615234375, -1.99945068359375, -1.896270751953125, -1.7930908203125, -1.689910888671875, -1.58673095703125, -1.483551025390625, -1.38037109375, -1.277191162109375, -1.17401123046875, -1.070831298828125, -0.9676513671875, -0.864471435546875, -0.76129150390625, -0.658111572265625, -0.554931640625, -0.451751708984375, -0.34857177734375, -0.245391845703125, -0.1422119140625, -0.039031982421875, 0.06414794921875, 0.167327880859375, 0.2705078125, 0.373687744140625, 0.47686767578125, 0.580047607421875, 0.6832275390625, 0.786407470703125, 0.88958740234375, 0.992767333984375, 1.095947265625, 1.199127197265625, 1.30230712890625, 1.405487060546875, 1.5086669921875, 1.611846923828125, 1.71502685546875, 1.818206787109375, 1.92138671875, 2.024566650390625, 2.12774658203125, 2.230926513671875, 2.3341064453125, 2.437286376953125, 2.54046630859375, 2.643646240234375, 2.746826171875, 2.850006103515625, 2.95318603515625, 3.056365966796875, 3.1595458984375, 3.262725830078125, 3.36590576171875, 3.469085693359375, 3.572265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 12.0, 13.0, 20.0, 26.0, 25.0, 48.0, 70.0, 132.0, 188.0, 346.0, 581.0, 1145.0, 2374.0, 5563.0, 16081.0, 66674.0, 632546.0, 269462.0, 34975.0, 10606.0, 3978.0, 1694.0, 848.0, 392.0, 273.0, 163.0, 96.0, 62.0, 50.0, 23.0, 26.0, 19.0, 10.0, 6.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.958984375, -2.880706787109375, -2.80242919921875, -2.724151611328125, -2.6458740234375, -2.567596435546875, -2.48931884765625, -2.411041259765625, -2.332763671875, -2.254486083984375, -2.17620849609375, -2.097930908203125, -2.0196533203125, -1.941375732421875, -1.86309814453125, -1.784820556640625, -1.70654296875, -1.628265380859375, -1.54998779296875, -1.471710205078125, -1.3934326171875, -1.315155029296875, -1.23687744140625, -1.158599853515625, -1.080322265625, -1.002044677734375, -0.92376708984375, -0.845489501953125, -0.7672119140625, -0.688934326171875, -0.61065673828125, -0.532379150390625, -0.4541015625, -0.375823974609375, -0.29754638671875, -0.219268798828125, -0.1409912109375, -0.062713623046875, 0.01556396484375, 0.093841552734375, 0.172119140625, 0.250396728515625, 0.32867431640625, 0.406951904296875, 0.4852294921875, 0.563507080078125, 0.64178466796875, 0.720062255859375, 0.79833984375, 0.876617431640625, 0.95489501953125, 1.033172607421875, 1.1114501953125, 1.189727783203125, 1.26800537109375, 1.346282958984375, 1.424560546875, 1.502838134765625, 1.58111572265625, 1.659393310546875, 1.7376708984375, 1.815948486328125, 1.89422607421875, 1.972503662109375, 2.05078125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 12.0, 9.0, 11.0, 23.0, 40.0, 42.0, 65.0, 87.0, 175.0, 179.0, 130.0, 61.0, 45.0, 31.0, 30.0, 15.0, 10.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003161430358886719, -0.00030185282230377197, -0.00028756260871887207, -0.00027327239513397217, -0.00025898218154907227, -0.00024469196796417236, -0.00023040175437927246, -0.00021611154079437256, -0.00020182132720947266, -0.00018753111362457275, -0.00017324090003967285, -0.00015895068645477295, -0.00014466047286987305, -0.00013037025928497314, -0.00011608004570007324, -0.00010178983211517334, -8.749961853027344e-05, -7.320940494537354e-05, -5.891919136047363e-05, -4.462897777557373e-05, -3.0338764190673828e-05, -1.6048550605773926e-05, -1.7583370208740234e-06, 1.2531876564025879e-05, 2.682209014892578e-05, 4.1112303733825684e-05, 5.5402517318725586e-05, 6.969273090362549e-05, 8.398294448852539e-05, 9.827315807342529e-05, 0.0001125633716583252, 0.0001268535852432251, 0.000141143798828125, 0.0001554340124130249, 0.0001697242259979248, 0.0001840144395828247, 0.0001983046531677246, 0.0002125948667526245, 0.00022688508033752441, 0.00024117529392242432, 0.0002554655075073242, 0.0002697557210922241, 0.000284045934677124, 0.0002983361482620239, 0.00031262636184692383, 0.00032691657543182373, 0.00034120678901672363, 0.00035549700260162354, 0.00036978721618652344, 0.00038407742977142334, 0.00039836764335632324, 0.00041265785694122314, 0.00042694807052612305, 0.00044123828411102295, 0.00045552849769592285, 0.00046981871128082275, 0.00048410892486572266, 0.0004983991384506226, 0.0005126893520355225, 0.0005269795656204224, 0.0005412697792053223, 0.0005555599927902222, 0.0005698502063751221, 0.000584140419960022, 0.0005984306335449219]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 5.0, 6.0, 6.0, 10.0, 15.0, 17.0, 27.0, 36.0, 81.0, 97.0, 134.0, 230.0, 397.0, 773.0, 1365.0, 2818.0, 5917.0, 14091.0, 42130.0, 442136.0, 468286.0, 43496.0, 14558.0, 5920.0, 2787.0, 1366.0, 719.0, 413.0, 252.0, 159.0, 103.0, 62.0, 37.0, 23.0, 16.0, 18.0, 13.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.08203125, -2.985748291015625, -2.88946533203125, -2.793182373046875, -2.6968994140625, -2.600616455078125, -2.50433349609375, -2.408050537109375, -2.311767578125, -2.215484619140625, -2.11920166015625, -2.022918701171875, -1.9266357421875, -1.830352783203125, -1.73406982421875, -1.637786865234375, -1.54150390625, -1.445220947265625, -1.34893798828125, -1.252655029296875, -1.1563720703125, -1.060089111328125, -0.96380615234375, -0.867523193359375, -0.771240234375, -0.674957275390625, -0.57867431640625, -0.482391357421875, -0.3861083984375, -0.289825439453125, -0.19354248046875, -0.097259521484375, -0.0009765625, 0.095306396484375, 0.19158935546875, 0.287872314453125, 0.3841552734375, 0.480438232421875, 0.57672119140625, 0.673004150390625, 0.769287109375, 0.865570068359375, 0.96185302734375, 1.058135986328125, 1.1544189453125, 1.250701904296875, 1.34698486328125, 1.443267822265625, 1.53955078125, 1.635833740234375, 1.73211669921875, 1.828399658203125, 1.9246826171875, 2.020965576171875, 2.11724853515625, 2.213531494140625, 2.309814453125, 2.406097412109375, 2.50238037109375, 2.598663330078125, 2.6949462890625, 2.791229248046875, 2.88751220703125, 2.983795166015625, 3.080078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 10.0, 3.0, 9.0, 7.0, 9.0, 11.0, 11.0, 14.0, 28.0, 48.0, 84.0, 176.0, 206.0, 136.0, 92.0, 46.0, 23.0, 21.0, 12.0, 10.0, 11.0, 6.0, 9.0, 3.0, 1.0, 6.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.47265625, -2.388427734375, -2.30419921875, -2.219970703125, -2.1357421875, -2.051513671875, -1.96728515625, -1.883056640625, -1.798828125, -1.714599609375, -1.63037109375, -1.546142578125, -1.4619140625, -1.377685546875, -1.29345703125, -1.209228515625, -1.125, -1.040771484375, -0.95654296875, -0.872314453125, -0.7880859375, -0.703857421875, -0.61962890625, -0.535400390625, -0.451171875, -0.366943359375, -0.28271484375, -0.198486328125, -0.1142578125, -0.030029296875, 0.05419921875, 0.138427734375, 0.22265625, 0.306884765625, 0.39111328125, 0.475341796875, 0.5595703125, 0.643798828125, 0.72802734375, 0.812255859375, 0.896484375, 0.980712890625, 1.06494140625, 1.149169921875, 1.2333984375, 1.317626953125, 1.40185546875, 1.486083984375, 1.5703125, 1.654541015625, 1.73876953125, 1.822998046875, 1.9072265625, 1.991455078125, 2.07568359375, 2.159912109375, 2.244140625, 2.328369140625, 2.41259765625, 2.496826171875, 2.5810546875, 2.665283203125, 2.74951171875, 2.833740234375, 2.91796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 11.0, 37.0, 110.0, 319.0, 356.0, 125.0, 33.0, 13.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.36107635498047, -54.985172271728516, -52.60926818847656, -50.23336410522461, -47.857460021972656, -45.4815559387207, -43.10565185546875, -40.72975158691406, -38.353843688964844, -35.97793960571289, -33.60203552246094, -31.226131439208984, -28.85022735595703, -26.474323272705078, -24.098421096801758, -21.722517013549805, -19.346614837646484, -16.97071075439453, -14.594806671142578, -12.218903541564941, -9.842999458312988, -7.467095375061035, -5.091192245483398, -2.7152881622314453, -0.3393840789794922, 2.036519765853882, 4.412423610687256, 6.788327217102051, 9.164231300354004, 11.540135383605957, 13.916038513183594, 16.291942596435547, 18.6678466796875, 21.043750762939453, 23.419654846191406, 25.79555892944336, 28.171463012695312, 30.547367095947266, 32.92327117919922, 35.299171447753906, 37.675079345703125, 40.05098342895508, 42.42688751220703, 44.802791595458984, 47.17869567871094, 49.55459976196289, 51.930503845214844, 54.30640411376953, 56.682308197021484, 59.05821228027344, 61.43411636352539, 63.810020446777344, 66.18592071533203, 68.56182861328125, 70.93772888183594, 73.31363677978516, 75.68953704833984, 78.06543731689453, 80.44134521484375, 82.81724548339844, 85.19315338134766, 87.56905364990234, 89.94496154785156, 92.32086181640625, 94.69676971435547]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 3.0, 4.0, 5.0, 8.0, 9.0, 6.0, 12.0, 19.0, 18.0, 13.0, 14.0, 14.0, 23.0, 33.0, 28.0, 33.0, 39.0, 29.0, 36.0, 38.0, 38.0, 47.0, 52.0, 38.0, 47.0, 50.0, 43.0, 36.0, 32.0, 31.0, 30.0, 23.0, 27.0, 18.0, 20.0, 18.0, 17.0, 8.0, 9.0, 10.0, 4.0, 3.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-20.422222137451172, -19.8066463470459, -19.191070556640625, -18.57549476623535, -17.959918975830078, -17.344341278076172, -16.7287654876709, -16.113189697265625, -15.497613906860352, -14.882038116455078, -14.266462326049805, -13.650885581970215, -13.035309791564941, -12.419734001159668, -11.804157257080078, -11.188581466674805, -10.573005676269531, -9.957429885864258, -9.341854095458984, -8.726277351379395, -8.110701560974121, -7.495125770568848, -6.879549503326416, -6.263973236083984, -5.648397445678711, -5.0328216552734375, -4.417245388031006, -3.8016693592071533, -3.186093330383301, -2.5705173015594482, -1.9549412727355957, -1.339365005493164, -0.7237892150878906, -0.10821318626403809, 0.5073628425598145, 1.122938871383667, 1.7385149002075195, 2.354090929031372, 2.9696669578552246, 3.5852432250976562, 4.20081901550293, 4.816394805908203, 5.431971073150635, 6.047547340393066, 6.66312313079834, 7.278698921203613, 7.894275188446045, 8.509851455688477, 9.12542724609375, 9.741003036499023, 10.356578826904297, 10.972155570983887, 11.58773136138916, 12.203307151794434, 12.818883895874023, 13.434459686279297, 14.05003547668457, 14.665611267089844, 15.281187057495117, 15.896763801574707, 16.512340545654297, 17.12791633605957, 17.743492126464844, 18.359067916870117, 18.97464370727539]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 12.0, 10.0, 18.0, 31.0, 47.0, 74.0, 139.0, 222.0, 435.0, 995.0, 2572.0, 8824.0, 52974.0, 3854162.0, 246680.0, 19262.0, 4501.0, 1617.0, 719.0, 391.0, 204.0, 118.0, 94.0, 51.0, 41.0, 27.0, 12.0, 10.0, 9.0, 8.0, 3.0, 5.0, 7.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.51953125, -6.314208984375, -6.10888671875, -5.903564453125, -5.6982421875, -5.492919921875, -5.28759765625, -5.082275390625, -4.876953125, -4.671630859375, -4.46630859375, -4.260986328125, -4.0556640625, -3.850341796875, -3.64501953125, -3.439697265625, -3.234375, -3.029052734375, -2.82373046875, -2.618408203125, -2.4130859375, -2.207763671875, -2.00244140625, -1.797119140625, -1.591796875, -1.386474609375, -1.18115234375, -0.975830078125, -0.7705078125, -0.565185546875, -0.35986328125, -0.154541015625, 0.05078125, 0.256103515625, 0.46142578125, 0.666748046875, 0.8720703125, 1.077392578125, 1.28271484375, 1.488037109375, 1.693359375, 1.898681640625, 2.10400390625, 2.309326171875, 2.5146484375, 2.719970703125, 2.92529296875, 3.130615234375, 3.3359375, 3.541259765625, 3.74658203125, 3.951904296875, 4.1572265625, 4.362548828125, 4.56787109375, 4.773193359375, 4.978515625, 5.183837890625, 5.38916015625, 5.594482421875, 5.7998046875, 6.005126953125, 6.21044921875, 6.415771484375, 6.62109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 5.0, 10.0, 18.0, 13.0, 28.0, 33.0, 64.0, 81.0, 75.0, 105.0, 82.0, 80.0, 88.0, 72.0, 74.0, 46.0, 43.0, 31.0, 15.0, 11.0, 10.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0514984130859375, -1.003387451171875, -0.9552764892578125, -0.90716552734375, -0.8590545654296875, -0.810943603515625, -0.7628326416015625, -0.7147216796875, -0.6666107177734375, -0.618499755859375, -0.5703887939453125, -0.52227783203125, -0.4741668701171875, -0.426055908203125, -0.3779449462890625, -0.329833984375, -0.2817230224609375, -0.233612060546875, -0.1855010986328125, -0.13739013671875, -0.0892791748046875, -0.041168212890625, 0.0069427490234375, 0.0550537109375, 0.1031646728515625, 0.151275634765625, 0.1993865966796875, 0.24749755859375, 0.2956085205078125, 0.343719482421875, 0.3918304443359375, 0.43994140625, 0.4880523681640625, 0.536163330078125, 0.5842742919921875, 0.63238525390625, 0.6804962158203125, 0.728607177734375, 0.7767181396484375, 0.8248291015625, 0.8729400634765625, 0.921051025390625, 0.9691619873046875, 1.01727294921875, 1.0653839111328125, 1.113494873046875, 1.1616058349609375, 1.209716796875, 1.2578277587890625, 1.305938720703125, 1.3540496826171875, 1.40216064453125, 1.4502716064453125, 1.498382568359375, 1.5464935302734375, 1.5946044921875, 1.6427154541015625, 1.690826416015625, 1.7389373779296875, 1.78704833984375, 1.8351593017578125, 1.883270263671875, 1.9313812255859375, 1.9794921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 6.0, 3.0, 15.0, 9.0, 19.0, 34.0, 73.0, 93.0, 131.0, 193.0, 389.0, 800.0, 2110.0, 7247.0, 36094.0, 1158994.0, 2931711.0, 44025.0, 8222.0, 2268.0, 909.0, 375.0, 208.0, 121.0, 79.0, 60.0, 35.0, 22.0, 16.0, 10.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.51385498046875, -6.3167724609375, -6.11968994140625, -5.922607421875, -5.72552490234375, -5.5284423828125, -5.33135986328125, -5.13427734375, -4.93719482421875, -4.7401123046875, -4.54302978515625, -4.345947265625, -4.14886474609375, -3.9517822265625, -3.75469970703125, -3.5576171875, -3.36053466796875, -3.1634521484375, -2.96636962890625, -2.769287109375, -2.57220458984375, -2.3751220703125, -2.17803955078125, -1.98095703125, -1.78387451171875, -1.5867919921875, -1.38970947265625, -1.192626953125, -0.99554443359375, -0.7984619140625, -0.60137939453125, -0.404296875, -0.20721435546875, -0.0101318359375, 0.18695068359375, 0.384033203125, 0.58111572265625, 0.7781982421875, 0.97528076171875, 1.17236328125, 1.36944580078125, 1.5665283203125, 1.76361083984375, 1.960693359375, 2.15777587890625, 2.3548583984375, 2.55194091796875, 2.7490234375, 2.94610595703125, 3.1431884765625, 3.34027099609375, 3.537353515625, 3.73443603515625, 3.9315185546875, 4.12860107421875, 4.32568359375, 4.52276611328125, 4.7198486328125, 4.91693115234375, 5.114013671875, 5.31109619140625, 5.5081787109375, 5.70526123046875, 5.90234375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 14.0, 11.0, 14.0, 42.0, 86.0, 171.0, 974.0, 2242.0, 307.0, 107.0, 55.0, 17.0, 17.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62109375, -3.51202392578125, -3.4029541015625, -3.29388427734375, -3.184814453125, -3.07574462890625, -2.9666748046875, -2.85760498046875, -2.74853515625, -2.63946533203125, -2.5303955078125, -2.42132568359375, -2.312255859375, -2.20318603515625, -2.0941162109375, -1.98504638671875, -1.8759765625, -1.76690673828125, -1.6578369140625, -1.54876708984375, -1.439697265625, -1.33062744140625, -1.2215576171875, -1.11248779296875, -1.00341796875, -0.89434814453125, -0.7852783203125, -0.67620849609375, -0.567138671875, -0.45806884765625, -0.3489990234375, -0.23992919921875, -0.130859375, -0.02178955078125, 0.0872802734375, 0.19635009765625, 0.305419921875, 0.41448974609375, 0.5235595703125, 0.63262939453125, 0.74169921875, 0.85076904296875, 0.9598388671875, 1.06890869140625, 1.177978515625, 1.28704833984375, 1.3961181640625, 1.50518798828125, 1.6142578125, 1.72332763671875, 1.8323974609375, 1.94146728515625, 2.050537109375, 2.15960693359375, 2.2686767578125, 2.37774658203125, 2.48681640625, 2.59588623046875, 2.7049560546875, 2.81402587890625, 2.923095703125, 3.03216552734375, 3.1412353515625, 3.25030517578125, 3.359375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 21.0, 377.0, 564.0, 51.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.98536682128906, -114.86746978759766, -112.74957275390625, -110.63166809082031, -108.5137710571289, -106.3958740234375, -104.27796936035156, -102.16007232666016, -100.04217529296875, -97.92427825927734, -95.80638122558594, -93.6884765625, -91.5705795288086, -89.45268249511719, -87.33477783203125, -85.21688079833984, -83.09898376464844, -80.98108673095703, -78.86318969726562, -76.74528503417969, -74.62738800048828, -72.50949096679688, -70.39158630371094, -68.27368927001953, -66.15579223632812, -64.03789520263672, -61.91999435424805, -59.802093505859375, -57.68419647216797, -55.56629943847656, -53.44839859008789, -51.33049774169922, -49.212608337402344, -47.09471130371094, -44.976810455322266, -42.858909606933594, -40.74101257324219, -38.62311553955078, -36.50521469116211, -34.38731384277344, -32.26941680908203, -30.151517868041992, -28.033618927001953, -25.915719985961914, -23.797821044921875, -21.679922103881836, -19.562023162841797, -17.444124221801758, -15.326223373413086, -13.208324432373047, -11.090425491333008, -8.972526550292969, -6.85462760925293, -4.736728668212891, -2.6188297271728516, -0.5009307861328125, 1.6169681549072266, 3.7348670959472656, 5.852766036987305, 7.970664978027344, 10.088563919067383, 12.206462860107422, 14.324361801147461, 16.4422607421875, 18.56015968322754]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 9.0, 15.0, 14.0, 18.0, 29.0, 57.0, 64.0, 63.0, 56.0, 83.0, 77.0, 63.0, 87.0, 75.0, 69.0, 64.0, 38.0, 34.0, 26.0, 18.0, 20.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.015313148498535, -11.670171737670898, -11.325031280517578, -10.979890823364258, -10.634749412536621, -10.289608001708984, -9.944467544555664, -9.599327087402344, -9.254185676574707, -8.90904426574707, -8.56390380859375, -8.21876335144043, -7.873621940612793, -7.5284810066223145, -7.183340072631836, -6.838199138641357, -6.493058204650879, -6.1479172706604, -5.802776336669922, -5.457635402679443, -5.112494468688965, -4.767353534698486, -4.422212600708008, -4.077071666717529, -3.731930732727051, -3.3867897987365723, -3.0416488647460938, -2.6965079307556152, -2.3513669967651367, -2.006226062774658, -1.6610851287841797, -1.3159441947937012, -0.9708042144775391, -0.6256632804870605, -0.28052234649658203, 0.06461858749389648, 0.409759521484375, 0.7549004554748535, 1.100041389465332, 1.4451823234558105, 1.790323257446289, 2.1354641914367676, 2.480605125427246, 2.8257460594177246, 3.170886993408203, 3.5160279273986816, 3.86116886138916, 4.206309795379639, 4.551450729370117, 4.896591663360596, 5.241732597351074, 5.586873531341553, 5.932014465332031, 6.27715539932251, 6.622296333312988, 6.967437267303467, 7.312578201293945, 7.657719135284424, 8.002860069274902, 8.348001480102539, 8.69314193725586, 9.03828239440918, 9.383423805236816, 9.728565216064453, 10.073705673217773]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 15.0, 25.0, 14.0, 28.0, 50.0, 80.0, 122.0, 199.0, 322.0, 582.0, 1081.0, 2159.0, 4893.0, 12517.0, 41556.0, 171589.0, 540817.0, 200753.0, 47264.0, 14106.0, 5368.0, 2390.0, 1095.0, 618.0, 314.0, 208.0, 106.0, 69.0, 62.0, 37.0, 31.0, 15.0, 16.0, 12.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.2142333984375, -4.088623046875, -3.9630126953125, -3.83740234375, -3.7117919921875, -3.586181640625, -3.4605712890625, -3.3349609375, -3.2093505859375, -3.083740234375, -2.9581298828125, -2.83251953125, -2.7069091796875, -2.581298828125, -2.4556884765625, -2.330078125, -2.2044677734375, -2.078857421875, -1.9532470703125, -1.82763671875, -1.7020263671875, -1.576416015625, -1.4508056640625, -1.3251953125, -1.1995849609375, -1.073974609375, -0.9483642578125, -0.82275390625, -0.6971435546875, -0.571533203125, -0.4459228515625, -0.3203125, -0.1947021484375, -0.069091796875, 0.0565185546875, 0.18212890625, 0.3077392578125, 0.433349609375, 0.5589599609375, 0.6845703125, 0.8101806640625, 0.935791015625, 1.0614013671875, 1.18701171875, 1.3126220703125, 1.438232421875, 1.5638427734375, 1.689453125, 1.8150634765625, 1.940673828125, 2.0662841796875, 2.19189453125, 2.3175048828125, 2.443115234375, 2.5687255859375, 2.6943359375, 2.8199462890625, 2.945556640625, 3.0711669921875, 3.19677734375, 3.3223876953125, 3.447998046875, 3.5736083984375, 3.69921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 13.0, 12.0, 13.0, 24.0, 40.0, 38.0, 56.0, 88.0, 75.0, 84.0, 70.0, 80.0, 81.0, 66.0, 54.0, 58.0, 41.0, 36.0, 20.0, 10.0, 15.0, 7.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9697265625, -0.925140380859375, -0.88055419921875, -0.835968017578125, -0.7913818359375, -0.746795654296875, -0.70220947265625, -0.657623291015625, -0.613037109375, -0.568450927734375, -0.52386474609375, -0.479278564453125, -0.4346923828125, -0.390106201171875, -0.34552001953125, -0.300933837890625, -0.25634765625, -0.211761474609375, -0.16717529296875, -0.122589111328125, -0.0780029296875, -0.033416748046875, 0.01116943359375, 0.055755615234375, 0.100341796875, 0.144927978515625, 0.18951416015625, 0.234100341796875, 0.2786865234375, 0.323272705078125, 0.36785888671875, 0.412445068359375, 0.45703125, 0.501617431640625, 0.54620361328125, 0.590789794921875, 0.6353759765625, 0.679962158203125, 0.72454833984375, 0.769134521484375, 0.813720703125, 0.858306884765625, 0.90289306640625, 0.947479248046875, 0.9920654296875, 1.036651611328125, 1.08123779296875, 1.125823974609375, 1.17041015625, 1.214996337890625, 1.25958251953125, 1.304168701171875, 1.3487548828125, 1.393341064453125, 1.43792724609375, 1.482513427734375, 1.527099609375, 1.571685791015625, 1.61627197265625, 1.660858154296875, 1.7054443359375, 1.750030517578125, 1.79461669921875, 1.839202880859375, 1.8837890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 4.0, 14.0, 13.0, 20.0, 25.0, 27.0, 35.0, 46.0, 75.0, 111.0, 138.0, 179.0, 285.0, 406.0, 603.0, 989.0, 1803.0, 3012.0, 5853.0, 11942.0, 27325.0, 69907.0, 195623.0, 412036.0, 195579.0, 69640.0, 27329.0, 12009.0, 5861.0, 2954.0, 1671.0, 1010.0, 620.0, 400.0, 279.0, 189.0, 137.0, 105.0, 80.0, 54.0, 40.0, 33.0, 23.0, 17.0, 10.0, 10.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.46875, -2.395050048828125, -2.32135009765625, -2.247650146484375, -2.1739501953125, -2.100250244140625, -2.02655029296875, -1.952850341796875, -1.879150390625, -1.805450439453125, -1.73175048828125, -1.658050537109375, -1.5843505859375, -1.510650634765625, -1.43695068359375, -1.363250732421875, -1.28955078125, -1.215850830078125, -1.14215087890625, -1.068450927734375, -0.9947509765625, -0.921051025390625, -0.84735107421875, -0.773651123046875, -0.699951171875, -0.626251220703125, -0.55255126953125, -0.478851318359375, -0.4051513671875, -0.331451416015625, -0.25775146484375, -0.184051513671875, -0.1103515625, -0.036651611328125, 0.03704833984375, 0.110748291015625, 0.1844482421875, 0.258148193359375, 0.33184814453125, 0.405548095703125, 0.479248046875, 0.552947998046875, 0.62664794921875, 0.700347900390625, 0.7740478515625, 0.847747802734375, 0.92144775390625, 0.995147705078125, 1.06884765625, 1.142547607421875, 1.21624755859375, 1.289947509765625, 1.3636474609375, 1.437347412109375, 1.51104736328125, 1.584747314453125, 1.658447265625, 1.732147216796875, 1.80584716796875, 1.879547119140625, 1.9532470703125, 2.026947021484375, 2.10064697265625, 2.174346923828125, 2.248046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 6.0, 4.0, 11.0, 11.0, 16.0, 22.0, 27.0, 26.0, 43.0, 24.0, 43.0, 51.0, 60.0, 60.0, 54.0, 63.0, 59.0, 56.0, 58.0, 59.0, 43.0, 32.0, 43.0, 22.0, 25.0, 21.0, 16.0, 12.0, 8.0, 4.0, 12.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.796875, -4.6531982421875, -4.509521484375, -4.3658447265625, -4.22216796875, -4.0784912109375, -3.934814453125, -3.7911376953125, -3.6474609375, -3.5037841796875, -3.360107421875, -3.2164306640625, -3.07275390625, -2.9290771484375, -2.785400390625, -2.6417236328125, -2.498046875, -2.3543701171875, -2.210693359375, -2.0670166015625, -1.92333984375, -1.7796630859375, -1.635986328125, -1.4923095703125, -1.3486328125, -1.2049560546875, -1.061279296875, -0.9176025390625, -0.77392578125, -0.6302490234375, -0.486572265625, -0.3428955078125, -0.19921875, -0.0555419921875, 0.088134765625, 0.2318115234375, 0.37548828125, 0.5191650390625, 0.662841796875, 0.8065185546875, 0.9501953125, 1.0938720703125, 1.237548828125, 1.3812255859375, 1.52490234375, 1.6685791015625, 1.812255859375, 1.9559326171875, 2.099609375, 2.2432861328125, 2.386962890625, 2.5306396484375, 2.67431640625, 2.8179931640625, 2.961669921875, 3.1053466796875, 3.2490234375, 3.3927001953125, 3.536376953125, 3.6800537109375, 3.82373046875, 3.9674072265625, 4.111083984375, 4.2547607421875, 4.3984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 6.0, 2.0, 7.0, 8.0, 3.0, 14.0, 18.0, 17.0, 22.0, 39.0, 78.0, 101.0, 153.0, 287.0, 594.0, 1380.0, 3984.0, 14041.0, 129536.0, 844340.0, 41659.0, 7781.0, 2490.0, 944.0, 442.0, 234.0, 139.0, 73.0, 43.0, 36.0, 22.0, 17.0, 8.0, 7.0, 11.0, 3.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150390625, -3.034942626953125, -2.91949462890625, -2.804046630859375, -2.6885986328125, -2.573150634765625, -2.45770263671875, -2.342254638671875, -2.226806640625, -2.111358642578125, -1.99591064453125, -1.880462646484375, -1.7650146484375, -1.649566650390625, -1.53411865234375, -1.418670654296875, -1.30322265625, -1.187774658203125, -1.07232666015625, -0.956878662109375, -0.8414306640625, -0.725982666015625, -0.61053466796875, -0.495086669921875, -0.379638671875, -0.264190673828125, -0.14874267578125, -0.033294677734375, 0.0821533203125, 0.197601318359375, 0.31304931640625, 0.428497314453125, 0.5439453125, 0.659393310546875, 0.77484130859375, 0.890289306640625, 1.0057373046875, 1.121185302734375, 1.23663330078125, 1.352081298828125, 1.467529296875, 1.582977294921875, 1.69842529296875, 1.813873291015625, 1.9293212890625, 2.044769287109375, 2.16021728515625, 2.275665283203125, 2.39111328125, 2.506561279296875, 2.62200927734375, 2.737457275390625, 2.8529052734375, 2.968353271484375, 3.08380126953125, 3.199249267578125, 3.314697265625, 3.430145263671875, 3.54559326171875, 3.661041259765625, 3.7764892578125, 3.891937255859375, 4.00738525390625, 4.122833251953125, 4.23828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 5.0, 15.0, 15.0, 21.0, 39.0, 70.0, 226.0, 337.0, 117.0, 56.0, 29.0, 14.0, 15.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005965232849121094, -0.0005737990140914917, -0.000551074743270874, -0.0005283504724502563, -0.0005056262016296387, -0.000482901930809021, -0.0004601776599884033, -0.00043745338916778564, -0.00041472911834716797, -0.0003920048475265503, -0.0003692805767059326, -0.00034655630588531494, -0.00032383203506469727, -0.0003011077642440796, -0.0002783834934234619, -0.00025565922260284424, -0.00023293495178222656, -0.0002102106809616089, -0.0001874864101409912, -0.00016476213932037354, -0.00014203786849975586, -0.00011931359767913818, -9.658932685852051e-05, -7.386505603790283e-05, -5.1140785217285156e-05, -2.841651439666748e-05, -5.692243576049805e-06, 1.703202724456787e-05, 3.975629806518555e-05, 6.248056888580322e-05, 8.52048397064209e-05, 0.00010792911052703857, 0.00013065338134765625, 0.00015337765216827393, 0.0001761019229888916, 0.00019882619380950928, 0.00022155046463012695, 0.00024427473545074463, 0.0002669990062713623, 0.00028972327709198, 0.00031244754791259766, 0.00033517181873321533, 0.000357896089553833, 0.0003806203603744507, 0.00040334463119506836, 0.00042606890201568604, 0.0004487931728363037, 0.0004715174436569214, 0.0004942417144775391, 0.0005169659852981567, 0.0005396902561187744, 0.0005624145269393921, 0.0005851387977600098, 0.0006078630685806274, 0.0006305873394012451, 0.0006533116102218628, 0.0006760358810424805, 0.0006987601518630981, 0.0007214844226837158, 0.0007442086935043335, 0.0007669329643249512, 0.0007896572351455688, 0.0008123815059661865, 0.0008351057767868042, 0.0008578300476074219]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 22.0, 22.0, 37.0, 66.0, 109.0, 181.0, 492.0, 1732.0, 14014.0, 875501.0, 147846.0, 6652.0, 1117.0, 352.0, 155.0, 84.0, 43.0, 33.0, 26.0, 18.0, 8.0, 5.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.7857666015625, -6.501220703125, -6.2166748046875, -5.93212890625, -5.6475830078125, -5.363037109375, -5.0784912109375, -4.7939453125, -4.5093994140625, -4.224853515625, -3.9403076171875, -3.65576171875, -3.3712158203125, -3.086669921875, -2.8021240234375, -2.517578125, -2.2330322265625, -1.948486328125, -1.6639404296875, -1.37939453125, -1.0948486328125, -0.810302734375, -0.5257568359375, -0.2412109375, 0.0433349609375, 0.327880859375, 0.6124267578125, 0.89697265625, 1.1815185546875, 1.466064453125, 1.7506103515625, 2.03515625, 2.3197021484375, 2.604248046875, 2.8887939453125, 3.17333984375, 3.4578857421875, 3.742431640625, 4.0269775390625, 4.3115234375, 4.5960693359375, 4.880615234375, 5.1651611328125, 5.44970703125, 5.7342529296875, 6.018798828125, 6.3033447265625, 6.587890625, 6.8724365234375, 7.156982421875, 7.4415283203125, 7.72607421875, 8.0106201171875, 8.295166015625, 8.5797119140625, 8.8642578125, 9.1488037109375, 9.433349609375, 9.7178955078125, 10.00244140625, 10.2869873046875, 10.571533203125, 10.8560791015625, 11.140625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 9.0, 10.0, 9.0, 6.0, 10.0, 16.0, 27.0, 23.0, 36.0, 78.0, 145.0, 217.0, 160.0, 72.0, 41.0, 25.0, 21.0, 19.0, 9.0, 12.0, 13.0, 5.0, 11.0, 6.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.790618896484375, -2.71405029296875, -2.637481689453125, -2.5609130859375, -2.484344482421875, -2.40777587890625, -2.331207275390625, -2.254638671875, -2.178070068359375, -2.10150146484375, -2.024932861328125, -1.9483642578125, -1.871795654296875, -1.79522705078125, -1.718658447265625, -1.64208984375, -1.565521240234375, -1.48895263671875, -1.412384033203125, -1.3358154296875, -1.259246826171875, -1.18267822265625, -1.106109619140625, -1.029541015625, -0.952972412109375, -0.87640380859375, -0.799835205078125, -0.7232666015625, -0.646697998046875, -0.57012939453125, -0.493560791015625, -0.4169921875, -0.340423583984375, -0.26385498046875, -0.187286376953125, -0.1107177734375, -0.034149169921875, 0.04241943359375, 0.118988037109375, 0.195556640625, 0.272125244140625, 0.34869384765625, 0.425262451171875, 0.5018310546875, 0.578399658203125, 0.65496826171875, 0.731536865234375, 0.80810546875, 0.884674072265625, 0.96124267578125, 1.037811279296875, 1.1143798828125, 1.190948486328125, 1.26751708984375, 1.344085693359375, 1.420654296875, 1.497222900390625, 1.57379150390625, 1.650360107421875, 1.7269287109375, 1.803497314453125, 1.88006591796875, 1.956634521484375, 2.033203125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 29.0, 162.0, 477.0, 260.0, 56.0, 13.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.69691467285156, -63.147361755371094, -59.597808837890625, -56.048255920410156, -52.49870300292969, -48.94915008544922, -45.39959716796875, -41.85004425048828, -38.30049133300781, -34.750938415527344, -31.201385498046875, -27.651832580566406, -24.102279663085938, -20.5527286529541, -17.003175735473633, -13.453622817993164, -9.904071807861328, -6.354518890380859, -2.804966449737549, 0.7445859909057617, 4.2941389083862305, 7.843690872192383, 11.393243789672852, 14.94279670715332, 18.49234962463379, 22.041902542114258, 25.591455459594727, 29.141006469726562, 32.69055938720703, 36.2401123046875, 39.78966522216797, 43.33921813964844, 46.888771057128906, 50.438323974609375, 53.987876892089844, 57.53742980957031, 61.08698272705078, 64.63653564453125, 68.18608856201172, 71.73564147949219, 75.28519439697266, 78.83474731445312, 82.3843002319336, 85.93385314941406, 89.48340606689453, 93.032958984375, 96.58251190185547, 100.13206481933594, 103.68161010742188, 107.23116302490234, 110.78071594238281, 114.33026885986328, 117.87982177734375, 121.42937469482422, 124.97892761230469, 128.52847290039062, 132.07803344726562, 135.62757873535156, 139.17713928222656, 142.7266845703125, 146.2762451171875, 149.82579040527344, 153.37535095214844, 156.92489624023438, 160.47445678710938]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 8.0, 4.0, 4.0, 1.0, 9.0, 10.0, 11.0, 12.0, 12.0, 23.0, 20.0, 23.0, 21.0, 35.0, 34.0, 27.0, 24.0, 37.0, 39.0, 45.0, 29.0, 50.0, 50.0, 51.0, 43.0, 40.0, 42.0, 31.0, 34.0, 36.0, 25.0, 26.0, 20.0, 28.0, 18.0, 12.0, 12.0, 11.0, 6.0, 4.0, 4.0, 7.0, 8.0, 2.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.784160614013672, -20.155826568603516, -19.52749252319336, -18.899158477783203, -18.270822525024414, -17.642488479614258, -17.0141544342041, -16.385820388793945, -15.757486343383789, -15.129152297973633, -14.50081729888916, -13.872483253479004, -13.244149208068848, -12.615814208984375, -11.987480163574219, -11.359146118164062, -10.73081111907959, -10.102477073669434, -9.474142074584961, -8.845808029174805, -8.217473983764648, -7.589139461517334, -6.9608049392700195, -6.332470893859863, -5.704136371612549, -5.075801849365234, -4.447467803955078, -3.8191332817077637, -3.1907989978790283, -2.562464714050293, -1.9341301918029785, -1.3057961463928223, -0.6774616241455078, -0.049127280712127686, 0.5792070627212524, 1.2075414657592773, 1.8358757495880127, 2.464210033416748, 3.0925445556640625, 3.7208786010742188, 4.349213123321533, 4.977547645568848, 5.605881690979004, 6.234216213226318, 6.862550735473633, 7.490884780883789, 8.119218826293945, 8.747552871704102, 9.375887870788574, 10.00422191619873, 10.632556915283203, 11.26089096069336, 11.889225006103516, 12.517559051513672, 13.145894050598145, 13.7742280960083, 14.402563095092773, 15.03089714050293, 15.659232139587402, 16.287567138671875, 16.91590118408203, 17.544235229492188, 18.172569274902344, 18.8009033203125, 19.429237365722656]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 9.0, 4.0, 10.0, 13.0, 14.0, 34.0, 57.0, 93.0, 118.0, 186.0, 319.0, 662.0, 1382.0, 3414.0, 9851.0, 39130.0, 1375472.0, 2708145.0, 39333.0, 9553.0, 3312.0, 1362.0, 674.0, 398.0, 195.0, 138.0, 106.0, 87.0, 48.0, 38.0, 30.0, 14.0, 20.0, 12.0, 10.0, 10.0, 2.0, 12.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.48870849609375, -5.3172607421875, -5.14581298828125, -4.974365234375, -4.80291748046875, -4.6314697265625, -4.46002197265625, -4.28857421875, -4.11712646484375, -3.9456787109375, -3.77423095703125, -3.602783203125, -3.43133544921875, -3.2598876953125, -3.08843994140625, -2.9169921875, -2.74554443359375, -2.5740966796875, -2.40264892578125, -2.231201171875, -2.05975341796875, -1.8883056640625, -1.71685791015625, -1.54541015625, -1.37396240234375, -1.2025146484375, -1.03106689453125, -0.859619140625, -0.68817138671875, -0.5167236328125, -0.34527587890625, -0.173828125, -0.00238037109375, 0.1690673828125, 0.34051513671875, 0.511962890625, 0.68341064453125, 0.8548583984375, 1.02630615234375, 1.19775390625, 1.36920166015625, 1.5406494140625, 1.71209716796875, 1.883544921875, 2.05499267578125, 2.2264404296875, 2.39788818359375, 2.5693359375, 2.74078369140625, 2.9122314453125, 3.08367919921875, 3.255126953125, 3.42657470703125, 3.5980224609375, 3.76947021484375, 3.94091796875, 4.11236572265625, 4.2838134765625, 4.45526123046875, 4.626708984375, 4.79815673828125, 4.9696044921875, 5.14105224609375, 5.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 8.0, 13.0, 12.0, 15.0, 25.0, 34.0, 39.0, 43.0, 52.0, 78.0, 55.0, 85.0, 60.0, 82.0, 69.0, 66.0, 59.0, 48.0, 33.0, 34.0, 30.0, 16.0, 14.0, 10.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95556640625, -0.9109573364257812, -0.8663482666015625, -0.8217391967773438, -0.777130126953125, -0.7325210571289062, -0.6879119873046875, -0.6433029174804688, -0.59869384765625, -0.5540847778320312, -0.5094757080078125, -0.46486663818359375, -0.420257568359375, -0.37564849853515625, -0.3310394287109375, -0.28643035888671875, -0.2418212890625, -0.19721221923828125, -0.1526031494140625, -0.10799407958984375, -0.063385009765625, -0.01877593994140625, 0.0258331298828125, 0.07044219970703125, 0.11505126953125, 0.15966033935546875, 0.2042694091796875, 0.24887847900390625, 0.293487548828125, 0.33809661865234375, 0.3827056884765625, 0.42731475830078125, 0.471923828125, 0.5165328979492188, 0.5611419677734375, 0.6057510375976562, 0.650360107421875, 0.6949691772460938, 0.7395782470703125, 0.7841873168945312, 0.82879638671875, 0.8734054565429688, 0.9180145263671875, 0.9626235961914062, 1.007232666015625, 1.0518417358398438, 1.0964508056640625, 1.1410598754882812, 1.1856689453125, 1.2302780151367188, 1.2748870849609375, 1.3194961547851562, 1.364105224609375, 1.4087142944335938, 1.4533233642578125, 1.4979324340820312, 1.54254150390625, 1.5871505737304688, 1.6317596435546875, 1.6763687133789062, 1.720977783203125, 1.7655868530273438, 1.8101959228515625, 1.8548049926757812, 1.8994140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 13.0, 12.0, 15.0, 17.0, 19.0, 36.0, 40.0, 38.0, 87.0, 138.0, 420.0, 1802.0, 15670.0, 3989873.0, 177932.0, 6507.0, 1053.0, 278.0, 106.0, 46.0, 43.0, 24.0, 24.0, 20.0, 11.0, 16.0, 10.0, 8.0, 10.0, 3.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-17.671875, -17.2388916015625, -16.805908203125, -16.3729248046875, -15.93994140625, -15.5069580078125, -15.073974609375, -14.6409912109375, -14.2080078125, -13.7750244140625, -13.342041015625, -12.9090576171875, -12.47607421875, -12.0430908203125, -11.610107421875, -11.1771240234375, -10.744140625, -10.3111572265625, -9.878173828125, -9.4451904296875, -9.01220703125, -8.5792236328125, -8.146240234375, -7.7132568359375, -7.2802734375, -6.8472900390625, -6.414306640625, -5.9813232421875, -5.54833984375, -5.1153564453125, -4.682373046875, -4.2493896484375, -3.81640625, -3.3834228515625, -2.950439453125, -2.5174560546875, -2.08447265625, -1.6514892578125, -1.218505859375, -0.7855224609375, -0.3525390625, 0.0804443359375, 0.513427734375, 0.9464111328125, 1.37939453125, 1.8123779296875, 2.245361328125, 2.6783447265625, 3.111328125, 3.5443115234375, 3.977294921875, 4.4102783203125, 4.84326171875, 5.2762451171875, 5.709228515625, 6.1422119140625, 6.5751953125, 7.0081787109375, 7.441162109375, 7.8741455078125, 8.30712890625, 8.7401123046875, 9.173095703125, 9.6060791015625, 10.0390625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 3.0, 11.0, 11.0, 14.0, 31.0, 38.0, 73.0, 119.0, 279.0, 1541.0, 1394.0, 261.0, 100.0, 49.0, 37.0, 23.0, 10.0, 18.0, 8.0, 11.0, 6.0, 3.0, 3.0, 8.0, 0.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.05078125, -1.99530029296875, -1.9398193359375, -1.88433837890625, -1.828857421875, -1.77337646484375, -1.7178955078125, -1.66241455078125, -1.60693359375, -1.55145263671875, -1.4959716796875, -1.44049072265625, -1.385009765625, -1.32952880859375, -1.2740478515625, -1.21856689453125, -1.1630859375, -1.10760498046875, -1.0521240234375, -0.99664306640625, -0.941162109375, -0.88568115234375, -0.8302001953125, -0.77471923828125, -0.71923828125, -0.66375732421875, -0.6082763671875, -0.55279541015625, -0.497314453125, -0.44183349609375, -0.3863525390625, -0.33087158203125, -0.275390625, -0.21990966796875, -0.1644287109375, -0.10894775390625, -0.053466796875, 0.00201416015625, 0.0574951171875, 0.11297607421875, 0.16845703125, 0.22393798828125, 0.2794189453125, 0.33489990234375, 0.390380859375, 0.44586181640625, 0.5013427734375, 0.55682373046875, 0.6123046875, 0.66778564453125, 0.7232666015625, 0.77874755859375, 0.834228515625, 0.88970947265625, 0.9451904296875, 1.00067138671875, 1.05615234375, 1.11163330078125, 1.1671142578125, 1.22259521484375, 1.278076171875, 1.33355712890625, 1.3890380859375, 1.44451904296875, 1.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 18.0, 43.0, 98.0, 188.0, 267.0, 199.0, 103.0, 43.0, 18.0, 4.0, 9.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.94827651977539, -10.363204956054688, -9.778132438659668, -9.193060874938965, -8.607988357543945, -8.022916793823242, -7.437844753265381, -6.8527727127075195, -6.267700672149658, -5.682628631591797, -5.0975565910339355, -4.512484550476074, -3.927412748336792, -3.3423407077789307, -2.7572689056396484, -2.172196865081787, -1.5871248245239258, -1.0020527839660645, -0.4169808626174927, 0.1680910587310791, 0.7531630992889404, 1.3382351398468018, 1.923306941986084, 2.5083789825439453, 3.0934510231018066, 3.678523063659668, 4.263595104217529, 4.848667144775391, 5.433738708496094, 6.018811225891113, 6.603882789611816, 7.188954830169678, 7.774026870727539, 8.359098434448242, 8.944170951843262, 9.529242515563965, 10.114315032958984, 10.699386596679688, 11.28445816040039, 11.86953067779541, 12.45460319519043, 13.039674758911133, 13.624747276306152, 14.209818840026855, 14.794891357421875, 15.379962921142578, 15.965034484863281, 16.550106048583984, 17.135177612304688, 17.72024917602539, 18.305320739746094, 18.89039421081543, 19.475465774536133, 20.060537338256836, 20.64560890197754, 21.230682373046875, 21.815753936767578, 22.40082550048828, 22.985897064208984, 23.57097053527832, 24.156042098999023, 24.741113662719727, 25.32618522644043, 25.911258697509766, 26.49633026123047]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 11.0, 11.0, 16.0, 14.0, 16.0, 25.0, 29.0, 39.0, 29.0, 37.0, 50.0, 51.0, 57.0, 49.0, 50.0, 62.0, 51.0, 60.0, 44.0, 42.0, 50.0, 28.0, 31.0, 33.0, 21.0, 24.0, 17.0, 12.0, 10.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.238128662109375, -5.049185276031494, -4.860241889953613, -4.671298980712891, -4.48235559463501, -4.293412208557129, -4.104469299316406, -3.9155259132385254, -3.7265825271606445, -3.5376391410827637, -3.348695993423462, -3.15975284576416, -2.9708094596862793, -2.7818660736083984, -2.5929229259490967, -2.403979778289795, -2.215036392211914, -2.026093006134033, -1.8371498584747314, -1.6482065916061401, -1.4592633247375488, -1.2703200578689575, -1.0813767910003662, -0.8924335241317749, -0.7034902572631836, -0.5145469903945923, -0.325603723526001, -0.13666045665740967, 0.05228281021118164, 0.24122607707977295, 0.43016934394836426, 0.6191126108169556, 0.8080554008483887, 0.99699866771698, 1.1859419345855713, 1.3748852014541626, 1.563828468322754, 1.7527717351913452, 1.9417150020599365, 2.1306581497192383, 2.319601535797119, 2.508544921875, 2.6974880695343018, 2.8864312171936035, 3.0753746032714844, 3.2643179893493652, 3.453261137008667, 3.6422042846679688, 3.8311476707458496, 4.0200910568237305, 4.209033966064453, 4.397977352142334, 4.586920738220215, 4.775864124298096, 4.964807510375977, 5.153750419616699, 5.34269380569458, 5.531637191772461, 5.720580101013184, 5.9095234870910645, 6.098466873168945, 6.287410259246826, 6.476353645324707, 6.66529655456543, 6.8542399406433105]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 9.0, 29.0, 53.0, 86.0, 167.0, 372.0, 1096.0, 4897.0, 37596.0, 479056.0, 480506.0, 37838.0, 4966.0, 1098.0, 364.0, 180.0, 74.0, 51.0, 37.0, 23.0, 12.0, 6.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.5706787109375, -5.305419921875, -5.0401611328125, -4.77490234375, -4.5096435546875, -4.244384765625, -3.9791259765625, -3.7138671875, -3.4486083984375, -3.183349609375, -2.9180908203125, -2.65283203125, -2.3875732421875, -2.122314453125, -1.8570556640625, -1.591796875, -1.3265380859375, -1.061279296875, -0.7960205078125, -0.53076171875, -0.2655029296875, -0.000244140625, 0.2650146484375, 0.5302734375, 0.7955322265625, 1.060791015625, 1.3260498046875, 1.59130859375, 1.8565673828125, 2.121826171875, 2.3870849609375, 2.65234375, 2.9176025390625, 3.182861328125, 3.4481201171875, 3.71337890625, 3.9786376953125, 4.243896484375, 4.5091552734375, 4.7744140625, 5.0396728515625, 5.304931640625, 5.5701904296875, 5.83544921875, 6.1007080078125, 6.365966796875, 6.6312255859375, 6.896484375, 7.1617431640625, 7.427001953125, 7.6922607421875, 7.95751953125, 8.2227783203125, 8.488037109375, 8.7532958984375, 9.0185546875, 9.2838134765625, 9.549072265625, 9.8143310546875, 10.07958984375, 10.3448486328125, 10.610107421875, 10.8753662109375, 11.140625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 6.0, 15.0, 15.0, 34.0, 32.0, 48.0, 56.0, 67.0, 79.0, 74.0, 78.0, 87.0, 62.0, 70.0, 66.0, 57.0, 47.0, 35.0, 22.0, 14.0, 10.0, 10.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.8909912109375, -0.840576171875, -0.7901611328125, -0.73974609375, -0.6893310546875, -0.638916015625, -0.5885009765625, -0.5380859375, -0.4876708984375, -0.437255859375, -0.3868408203125, -0.33642578125, -0.2860107421875, -0.235595703125, -0.1851806640625, -0.134765625, -0.0843505859375, -0.033935546875, 0.0164794921875, 0.06689453125, 0.1173095703125, 0.167724609375, 0.2181396484375, 0.2685546875, 0.3189697265625, 0.369384765625, 0.4197998046875, 0.47021484375, 0.5206298828125, 0.571044921875, 0.6214599609375, 0.671875, 0.7222900390625, 0.772705078125, 0.8231201171875, 0.87353515625, 0.9239501953125, 0.974365234375, 1.0247802734375, 1.0751953125, 1.1256103515625, 1.176025390625, 1.2264404296875, 1.27685546875, 1.3272705078125, 1.377685546875, 1.4281005859375, 1.478515625, 1.5289306640625, 1.579345703125, 1.6297607421875, 1.68017578125, 1.7305908203125, 1.781005859375, 1.8314208984375, 1.8818359375, 1.9322509765625, 1.982666015625, 2.0330810546875, 2.08349609375, 2.1339111328125, 2.184326171875, 2.2347412109375, 2.28515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 14.0, 11.0, 22.0, 26.0, 33.0, 42.0, 72.0, 102.0, 170.0, 329.0, 605.0, 1241.0, 3142.0, 8453.0, 27110.0, 99268.0, 428664.0, 360852.0, 82758.0, 23085.0, 7336.0, 2724.0, 1146.0, 542.0, 284.0, 183.0, 107.0, 80.0, 33.0, 29.0, 21.0, 20.0, 9.0, 8.0, 13.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.905059814453125, -3.78277587890625, -3.660491943359375, -3.5382080078125, -3.415924072265625, -3.29364013671875, -3.171356201171875, -3.049072265625, -2.926788330078125, -2.80450439453125, -2.682220458984375, -2.5599365234375, -2.437652587890625, -2.31536865234375, -2.193084716796875, -2.07080078125, -1.948516845703125, -1.82623291015625, -1.703948974609375, -1.5816650390625, -1.459381103515625, -1.33709716796875, -1.214813232421875, -1.092529296875, -0.970245361328125, -0.84796142578125, -0.725677490234375, -0.6033935546875, -0.481109619140625, -0.35882568359375, -0.236541748046875, -0.1142578125, 0.008026123046875, 0.13031005859375, 0.252593994140625, 0.3748779296875, 0.497161865234375, 0.61944580078125, 0.741729736328125, 0.864013671875, 0.986297607421875, 1.10858154296875, 1.230865478515625, 1.3531494140625, 1.475433349609375, 1.59771728515625, 1.720001220703125, 1.84228515625, 1.964569091796875, 2.08685302734375, 2.209136962890625, 2.3314208984375, 2.453704833984375, 2.57598876953125, 2.698272705078125, 2.820556640625, 2.942840576171875, 3.06512451171875, 3.187408447265625, 3.3096923828125, 3.431976318359375, 3.55426025390625, 3.676544189453125, 3.798828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 9.0, 3.0, 12.0, 8.0, 15.0, 16.0, 24.0, 19.0, 23.0, 13.0, 26.0, 33.0, 33.0, 39.0, 51.0, 38.0, 46.0, 48.0, 47.0, 46.0, 39.0, 40.0, 48.0, 38.0, 46.0, 34.0, 33.0, 33.0, 21.0, 21.0, 14.0, 26.0, 12.0, 8.0, 6.0, 7.0, 7.0, 4.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0], "bins": [-4.546875, -4.424285888671875, -4.30169677734375, -4.179107666015625, -4.0565185546875, -3.933929443359375, -3.81134033203125, -3.688751220703125, -3.566162109375, -3.443572998046875, -3.32098388671875, -3.198394775390625, -3.0758056640625, -2.953216552734375, -2.83062744140625, -2.708038330078125, -2.58544921875, -2.462860107421875, -2.34027099609375, -2.217681884765625, -2.0950927734375, -1.972503662109375, -1.84991455078125, -1.727325439453125, -1.604736328125, -1.482147216796875, -1.35955810546875, -1.236968994140625, -1.1143798828125, -0.991790771484375, -0.86920166015625, -0.746612548828125, -0.6240234375, -0.501434326171875, -0.37884521484375, -0.256256103515625, -0.1336669921875, -0.011077880859375, 0.11151123046875, 0.234100341796875, 0.356689453125, 0.479278564453125, 0.60186767578125, 0.724456787109375, 0.8470458984375, 0.969635009765625, 1.09222412109375, 1.214813232421875, 1.33740234375, 1.459991455078125, 1.58258056640625, 1.705169677734375, 1.8277587890625, 1.950347900390625, 2.07293701171875, 2.195526123046875, 2.318115234375, 2.440704345703125, 2.56329345703125, 2.685882568359375, 2.8084716796875, 2.931060791015625, 3.05364990234375, 3.176239013671875, 3.298828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 15.0, 22.0, 39.0, 77.0, 145.0, 375.0, 978.0, 2934.0, 10930.0, 74444.0, 893931.0, 51779.0, 8980.0, 2472.0, 824.0, 320.0, 139.0, 61.0, 38.0, 18.0, 11.0, 8.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.90936279296875, -3.7718505859375, -3.63433837890625, -3.496826171875, -3.35931396484375, -3.2218017578125, -3.08428955078125, -2.94677734375, -2.80926513671875, -2.6717529296875, -2.53424072265625, -2.396728515625, -2.25921630859375, -2.1217041015625, -1.98419189453125, -1.8466796875, -1.70916748046875, -1.5716552734375, -1.43414306640625, -1.296630859375, -1.15911865234375, -1.0216064453125, -0.88409423828125, -0.74658203125, -0.60906982421875, -0.4715576171875, -0.33404541015625, -0.196533203125, -0.05902099609375, 0.0784912109375, 0.21600341796875, 0.353515625, 0.49102783203125, 0.6285400390625, 0.76605224609375, 0.903564453125, 1.04107666015625, 1.1785888671875, 1.31610107421875, 1.45361328125, 1.59112548828125, 1.7286376953125, 1.86614990234375, 2.003662109375, 2.14117431640625, 2.2786865234375, 2.41619873046875, 2.5537109375, 2.69122314453125, 2.8287353515625, 2.96624755859375, 3.103759765625, 3.24127197265625, 3.3787841796875, 3.51629638671875, 3.65380859375, 3.79132080078125, 3.9288330078125, 4.06634521484375, 4.203857421875, 4.34136962890625, 4.4788818359375, 4.61639404296875, 4.75390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 2.0, 7.0, 9.0, 13.0, 22.0, 38.0, 66.0, 211.0, 316.0, 151.0, 60.0, 25.0, 20.0, 6.0, 16.0, 8.0, 5.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006799697875976562, -0.000658869743347168, -0.0006377696990966797, -0.0006166696548461914, -0.0005955696105957031, -0.0005744695663452148, -0.0005533695220947266, -0.0005322694778442383, -0.00051116943359375, -0.0004900693893432617, -0.00046896934509277344, -0.00044786930084228516, -0.0004267692565917969, -0.0004056692123413086, -0.0003845691680908203, -0.00036346912384033203, -0.00034236907958984375, -0.00032126903533935547, -0.0003001689910888672, -0.0002790689468383789, -0.0002579689025878906, -0.00023686885833740234, -0.00021576881408691406, -0.00019466876983642578, -0.0001735687255859375, -0.00015246868133544922, -0.00013136863708496094, -0.00011026859283447266, -8.916854858398438e-05, -6.80685043334961e-05, -4.696846008300781e-05, -2.586841583251953e-05, -4.76837158203125e-06, 1.633167266845703e-05, 3.743171691894531e-05, 5.8531761169433594e-05, 7.963180541992188e-05, 0.00010073184967041016, 0.00012183189392089844, 0.00014293193817138672, 0.000164031982421875, 0.00018513202667236328, 0.00020623207092285156, 0.00022733211517333984, 0.0002484321594238281, 0.0002695322036743164, 0.0002906322479248047, 0.00031173229217529297, 0.00033283233642578125, 0.00035393238067626953, 0.0003750324249267578, 0.0003961324691772461, 0.0004172325134277344, 0.00043833255767822266, 0.00045943260192871094, 0.0004805326461791992, 0.0005016326904296875, 0.0005227327346801758, 0.0005438327789306641, 0.0005649328231811523, 0.0005860328674316406, 0.0006071329116821289, 0.0006282329559326172, 0.0006493330001831055, 0.0006704330444335938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 12.0, 14.0, 22.0, 15.0, 32.0, 33.0, 54.0, 85.0, 140.0, 204.0, 304.0, 405.0, 702.0, 1084.0, 1848.0, 3165.0, 5733.0, 11543.0, 26098.0, 88103.0, 673804.0, 167486.0, 36332.0, 14538.0, 7117.0, 3819.0, 2229.0, 1280.0, 822.0, 506.0, 312.0, 224.0, 161.0, 90.0, 50.0, 45.0, 36.0, 39.0, 18.0, 17.0, 6.0, 6.0, 6.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.294921875, -2.222442626953125, -2.14996337890625, -2.077484130859375, -2.0050048828125, -1.932525634765625, -1.86004638671875, -1.787567138671875, -1.715087890625, -1.642608642578125, -1.57012939453125, -1.497650146484375, -1.4251708984375, -1.352691650390625, -1.28021240234375, -1.207733154296875, -1.13525390625, -1.062774658203125, -0.99029541015625, -0.917816162109375, -0.8453369140625, -0.772857666015625, -0.70037841796875, -0.627899169921875, -0.555419921875, -0.482940673828125, -0.41046142578125, -0.337982177734375, -0.2655029296875, -0.193023681640625, -0.12054443359375, -0.048065185546875, 0.0244140625, 0.096893310546875, 0.16937255859375, 0.241851806640625, 0.3143310546875, 0.386810302734375, 0.45928955078125, 0.531768798828125, 0.604248046875, 0.676727294921875, 0.74920654296875, 0.821685791015625, 0.8941650390625, 0.966644287109375, 1.03912353515625, 1.111602783203125, 1.18408203125, 1.256561279296875, 1.32904052734375, 1.401519775390625, 1.4739990234375, 1.546478271484375, 1.61895751953125, 1.691436767578125, 1.763916015625, 1.836395263671875, 1.90887451171875, 1.981353759765625, 2.0538330078125, 2.126312255859375, 2.19879150390625, 2.271270751953125, 2.34375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 7.0, 7.0, 10.0, 14.0, 17.0, 32.0, 47.0, 52.0, 92.0, 197.0, 205.0, 92.0, 60.0, 43.0, 23.0, 27.0, 18.0, 10.0, 6.0, 8.0, 3.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.207122802734375, -2.11541748046875, -2.023712158203125, -1.9320068359375, -1.840301513671875, -1.74859619140625, -1.656890869140625, -1.565185546875, -1.473480224609375, -1.38177490234375, -1.290069580078125, -1.1983642578125, -1.106658935546875, -1.01495361328125, -0.923248291015625, -0.83154296875, -0.739837646484375, -0.64813232421875, -0.556427001953125, -0.4647216796875, -0.373016357421875, -0.28131103515625, -0.189605712890625, -0.097900390625, -0.006195068359375, 0.08551025390625, 0.177215576171875, 0.2689208984375, 0.360626220703125, 0.45233154296875, 0.544036865234375, 0.6357421875, 0.727447509765625, 0.81915283203125, 0.910858154296875, 1.0025634765625, 1.094268798828125, 1.18597412109375, 1.277679443359375, 1.369384765625, 1.461090087890625, 1.55279541015625, 1.644500732421875, 1.7362060546875, 1.827911376953125, 1.91961669921875, 2.011322021484375, 2.10302734375, 2.194732666015625, 2.28643798828125, 2.378143310546875, 2.4698486328125, 2.561553955078125, 2.65325927734375, 2.744964599609375, 2.836669921875, 2.928375244140625, 3.02008056640625, 3.111785888671875, 3.2034912109375, 3.295196533203125, 3.38690185546875, 3.478607177734375, 3.5703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 15.0, 16.0, 18.0, 44.0, 44.0, 54.0, 105.0, 96.0, 140.0, 117.0, 103.0, 93.0, 58.0, 38.0, 25.0, 14.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.38622283935547, -41.479339599609375, -40.57245635986328, -39.66557312011719, -38.758689880371094, -37.851806640625, -36.944923400878906, -36.03804016113281, -35.13115692138672, -34.224273681640625, -33.31739044189453, -32.41050720214844, -31.503623962402344, -30.59674072265625, -29.689855575561523, -28.78297233581543, -27.876087188720703, -26.96920394897461, -26.062320709228516, -25.155437469482422, -24.248554229736328, -23.341670989990234, -22.434785842895508, -21.527902603149414, -20.62101936340332, -19.714136123657227, -18.807252883911133, -17.90036964416504, -16.993484497070312, -16.08660125732422, -15.179718017578125, -14.272834777832031, -13.365949630737305, -12.459066390991211, -11.552183151245117, -10.645298957824707, -9.738415718078613, -8.83153247833252, -7.924648761749268, -7.017765045166016, -6.110881805419922, -5.203998565673828, -4.297114849090576, -3.3902313709259033, -2.4833478927612305, -1.5764646530151367, -0.6695809364318848, 0.2373027801513672, 1.144186019897461, 2.051069498062134, 2.9579529762268066, 3.8648364543914795, 4.771719932556152, 5.678603172302246, 6.585486888885498, 7.49237060546875, 8.399253845214844, 9.306137084960938, 10.213020324707031, 11.119904518127441, 12.026787757873535, 12.933670997619629, 13.840555191040039, 14.747438430786133, 15.654321670532227]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 3.0, 11.0, 16.0, 18.0, 8.0, 19.0, 24.0, 15.0, 29.0, 40.0, 38.0, 45.0, 38.0, 39.0, 38.0, 42.0, 34.0, 51.0, 44.0, 38.0, 46.0, 36.0, 46.0, 40.0, 35.0, 23.0, 21.0, 24.0, 17.0, 29.0, 27.0, 14.0, 10.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.68540382385254, -17.069652557373047, -16.453901290893555, -15.838150024414062, -15.22239875793457, -14.606647491455078, -13.990897178649902, -13.37514591217041, -12.759394645690918, -12.143643379211426, -11.527892112731934, -10.912140846252441, -10.296390533447266, -9.680639266967773, -9.064888000488281, -8.449136734008789, -7.833385467529297, -7.217634201049805, -6.6018829345703125, -5.9861321449279785, -5.370380878448486, -4.754629611968994, -4.13887882232666, -3.523127555847168, -2.907376289367676, -2.2916250228881836, -1.6758739948272705, -1.0601228475570679, -0.44437170028686523, 0.17137956619262695, 0.78713059425354, 1.4028816223144531, 2.018634796142578, 2.6343860626220703, 3.2501370906829834, 3.8658881187438965, 4.481639385223389, 5.097390651702881, 5.713141441345215, 6.328892707824707, 6.944643974304199, 7.560395240783691, 8.176146507263184, 8.791897773742676, 9.407648086547852, 10.023399353027344, 10.639150619506836, 11.254901885986328, 11.87065315246582, 12.486404418945312, 13.102155685424805, 13.717906951904297, 14.333658218383789, 14.949409484863281, 15.565159797668457, 16.180912017822266, 16.796661376953125, 17.412412643432617, 18.02816390991211, 18.6439151763916, 19.259666442871094, 19.875417709350586, 20.491168975830078, 21.106918334960938, 21.722671508789062]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 9.0, 14.0, 24.0, 34.0, 65.0, 110.0, 136.0, 279.0, 536.0, 1395.0, 5595.0, 48390.0, 4093177.0, 36991.0, 4957.0, 1351.0, 548.0, 245.0, 169.0, 96.0, 53.0, 41.0, 28.0, 11.0, 14.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.34375, -19.828125, -19.3125, -18.796875, -18.28125, -17.765625, -17.25, -16.734375, -16.21875, -15.703125, -15.1875, -14.671875, -14.15625, -13.640625, -13.125, -12.609375, -12.09375, -11.578125, -11.0625, -10.546875, -10.03125, -9.515625, -9.0, -8.484375, -7.96875, -7.453125, -6.9375, -6.421875, -5.90625, -5.390625, -4.875, -4.359375, -3.84375, -3.328125, -2.8125, -2.296875, -1.78125, -1.265625, -0.75, -0.234375, 0.28125, 0.796875, 1.3125, 1.828125, 2.34375, 2.859375, 3.375, 3.890625, 4.40625, 4.921875, 5.4375, 5.953125, 6.46875, 6.984375, 7.5, 8.015625, 8.53125, 9.046875, 9.5625, 10.078125, 10.59375, 11.109375, 11.625, 12.140625, 12.65625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 9.0, 8.0, 11.0, 18.0, 26.0, 26.0, 34.0, 36.0, 52.0, 62.0, 61.0, 66.0, 55.0, 65.0, 65.0, 74.0, 51.0, 61.0, 50.0, 47.0, 31.0, 31.0, 22.0, 13.0, 10.0, 4.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0290679931640625, -0.982940673828125, -0.9368133544921875, -0.89068603515625, -0.8445587158203125, -0.798431396484375, -0.7523040771484375, -0.7061767578125, -0.6600494384765625, -0.613922119140625, -0.5677947998046875, -0.52166748046875, -0.4755401611328125, -0.429412841796875, -0.3832855224609375, -0.337158203125, -0.2910308837890625, -0.244903564453125, -0.1987762451171875, -0.15264892578125, -0.1065216064453125, -0.060394287109375, -0.0142669677734375, 0.0318603515625, 0.0779876708984375, 0.124114990234375, 0.1702423095703125, 0.21636962890625, 0.2624969482421875, 0.308624267578125, 0.3547515869140625, 0.40087890625, 0.4470062255859375, 0.493133544921875, 0.5392608642578125, 0.58538818359375, 0.6315155029296875, 0.677642822265625, 0.7237701416015625, 0.7698974609375, 0.8160247802734375, 0.862152099609375, 0.9082794189453125, 0.95440673828125, 1.0005340576171875, 1.046661376953125, 1.0927886962890625, 1.138916015625, 1.1850433349609375, 1.231170654296875, 1.2772979736328125, 1.32342529296875, 1.3695526123046875, 1.415679931640625, 1.4618072509765625, 1.5079345703125, 1.5540618896484375, 1.600189208984375, 1.6463165283203125, 1.69244384765625, 1.7385711669921875, 1.784698486328125, 1.8308258056640625, 1.876953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 4.0, 9.0, 19.0, 22.0, 28.0, 38.0, 59.0, 73.0, 121.0, 212.0, 325.0, 492.0, 804.0, 1461.0, 2625.0, 5510.0, 13576.0, 45880.0, 581181.0, 3446955.0, 64181.0, 17173.0, 6565.0, 3039.0, 1538.0, 933.0, 548.0, 316.0, 189.0, 125.0, 75.0, 64.0, 37.0, 42.0, 25.0, 13.0, 8.0, 4.0, 3.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.92083740234375, -4.7166748046875, -4.51251220703125, -4.308349609375, -4.10418701171875, -3.9000244140625, -3.69586181640625, -3.49169921875, -3.28753662109375, -3.0833740234375, -2.87921142578125, -2.675048828125, -2.47088623046875, -2.2667236328125, -2.06256103515625, -1.8583984375, -1.65423583984375, -1.4500732421875, -1.24591064453125, -1.041748046875, -0.83758544921875, -0.6334228515625, -0.42926025390625, -0.22509765625, -0.02093505859375, 0.1832275390625, 0.38739013671875, 0.591552734375, 0.79571533203125, 0.9998779296875, 1.20404052734375, 1.408203125, 1.61236572265625, 1.8165283203125, 2.02069091796875, 2.224853515625, 2.42901611328125, 2.6331787109375, 2.83734130859375, 3.04150390625, 3.24566650390625, 3.4498291015625, 3.65399169921875, 3.858154296875, 4.06231689453125, 4.2664794921875, 4.47064208984375, 4.6748046875, 4.87896728515625, 5.0831298828125, 5.28729248046875, 5.491455078125, 5.69561767578125, 5.8997802734375, 6.10394287109375, 6.30810546875, 6.51226806640625, 6.7164306640625, 6.92059326171875, 7.124755859375, 7.32891845703125, 7.5330810546875, 7.73724365234375, 7.94140625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 1.0, 15.0, 20.0, 16.0, 35.0, 57.0, 112.0, 613.0, 2741.0, 209.0, 81.0, 51.0, 30.0, 23.0, 14.0, 8.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.319061279296875, -3.22210693359375, -3.125152587890625, -3.0281982421875, -2.931243896484375, -2.83428955078125, -2.737335205078125, -2.640380859375, -2.543426513671875, -2.44647216796875, -2.349517822265625, -2.2525634765625, -2.155609130859375, -2.05865478515625, -1.961700439453125, -1.86474609375, -1.767791748046875, -1.67083740234375, -1.573883056640625, -1.4769287109375, -1.379974365234375, -1.28302001953125, -1.186065673828125, -1.089111328125, -0.992156982421875, -0.89520263671875, -0.798248291015625, -0.7012939453125, -0.604339599609375, -0.50738525390625, -0.410430908203125, -0.3134765625, -0.216522216796875, -0.11956787109375, -0.022613525390625, 0.0743408203125, 0.171295166015625, 0.26824951171875, 0.365203857421875, 0.462158203125, 0.559112548828125, 0.65606689453125, 0.753021240234375, 0.8499755859375, 0.946929931640625, 1.04388427734375, 1.140838623046875, 1.23779296875, 1.334747314453125, 1.43170166015625, 1.528656005859375, 1.6256103515625, 1.722564697265625, 1.81951904296875, 1.916473388671875, 2.013427734375, 2.110382080078125, 2.20733642578125, 2.304290771484375, 2.4012451171875, 2.498199462890625, 2.59515380859375, 2.692108154296875, 2.7890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 8.0, 21.0, 39.0, 87.0, 135.0, 181.0, 186.0, 159.0, 86.0, 35.0, 24.0, 17.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.366625785827637, -6.812401294708252, -6.258176803588867, -5.703952312469482, -5.149727821350098, -4.595503330230713, -4.041278839111328, -3.4870543479919434, -2.9328298568725586, -2.378605365753174, -1.824380874633789, -1.2701563835144043, -0.7159318923950195, -0.16170740127563477, 0.39251708984375, 0.9467415809631348, 1.5009660720825195, 2.0551905632019043, 2.609415054321289, 3.163639545440674, 3.7178640365600586, 4.272088527679443, 4.826313018798828, 5.380537509918213, 5.934762001037598, 6.488986492156982, 7.043210983276367, 7.597435474395752, 8.151659965515137, 8.70588493347168, 9.260108947753906, 9.814332962036133, 10.36855697631836, 10.922780990600586, 11.477005958557129, 12.031230926513672, 12.585454940795898, 13.139678955078125, 13.693903923034668, 14.248128890991211, 14.802352905273438, 15.356576919555664, 15.910801887512207, 16.46502685546875, 17.019250869750977, 17.573474884033203, 18.127700805664062, 18.68192481994629, 19.236148834228516, 19.790372848510742, 20.34459686279297, 20.898822784423828, 21.453046798706055, 22.00727081298828, 22.56149673461914, 23.115720748901367, 23.669944763183594, 24.22416877746582, 24.778392791748047, 25.332618713378906, 25.886842727661133, 26.44106674194336, 26.99529266357422, 27.549516677856445, 28.103740692138672]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 9.0, 12.0, 11.0, 5.0, 16.0, 13.0, 17.0, 23.0, 30.0, 28.0, 26.0, 32.0, 36.0, 34.0, 56.0, 37.0, 46.0, 38.0, 52.0, 54.0, 52.0, 48.0, 34.0, 38.0, 40.0, 33.0, 36.0, 14.0, 23.0, 20.0, 15.0, 17.0, 12.0, 7.0, 7.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.337601184844971, -6.139631748199463, -5.941661834716797, -5.743692398071289, -5.545722961425781, -5.347753524780273, -5.149784088134766, -4.9518141746521, -4.753844738006592, -4.555875301361084, -4.357905387878418, -4.15993595123291, -3.9619665145874023, -3.7639970779418945, -3.5660274028778076, -3.3680577278137207, -3.170088291168213, -2.972118854522705, -2.774149179458618, -2.5761795043945312, -2.3782100677490234, -2.1802406311035156, -1.9822709560394287, -1.7843014001846313, -1.586331844329834, -1.3883622884750366, -1.1903927326202393, -0.9924231767654419, -0.7944536209106445, -0.5964840650558472, -0.3985145092010498, -0.20054495334625244, -0.002575397491455078, 0.19539415836334229, 0.39336371421813965, 0.591333270072937, 0.7893028259277344, 0.9872723817825317, 1.185241937637329, 1.3832114934921265, 1.5811810493469238, 1.7791506052017212, 1.9771201610565186, 2.1750898361206055, 2.3730592727661133, 2.571028709411621, 2.768998384475708, 2.966968059539795, 3.1649374961853027, 3.3629069328308105, 3.5608766078948975, 3.7588462829589844, 3.956815719604492, 4.15478515625, 4.352754592895508, 4.550724506378174, 4.748693943023682, 4.9466633796691895, 5.1446332931518555, 5.342602729797363, 5.540572166442871, 5.738541603088379, 5.936511039733887, 6.134480953216553, 6.3324503898620605]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 6.0, 13.0, 22.0, 34.0, 58.0, 67.0, 183.0, 317.0, 605.0, 1343.0, 3134.0, 8410.0, 27975.0, 125600.0, 551227.0, 257181.0, 50515.0, 13511.0, 4745.0, 1846.0, 827.0, 439.0, 187.0, 124.0, 66.0, 45.0, 22.0, 16.0, 5.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73046875, -7.50775146484375, -7.2850341796875, -7.06231689453125, -6.839599609375, -6.61688232421875, -6.3941650390625, -6.17144775390625, -5.94873046875, -5.72601318359375, -5.5032958984375, -5.28057861328125, -5.057861328125, -4.83514404296875, -4.6124267578125, -4.38970947265625, -4.1669921875, -3.94427490234375, -3.7215576171875, -3.49884033203125, -3.276123046875, -3.05340576171875, -2.8306884765625, -2.60797119140625, -2.38525390625, -2.16253662109375, -1.9398193359375, -1.71710205078125, -1.494384765625, -1.27166748046875, -1.0489501953125, -0.82623291015625, -0.603515625, -0.38079833984375, -0.1580810546875, 0.06463623046875, 0.287353515625, 0.51007080078125, 0.7327880859375, 0.95550537109375, 1.17822265625, 1.40093994140625, 1.6236572265625, 1.84637451171875, 2.069091796875, 2.29180908203125, 2.5145263671875, 2.73724365234375, 2.9599609375, 3.18267822265625, 3.4053955078125, 3.62811279296875, 3.850830078125, 4.07354736328125, 4.2962646484375, 4.51898193359375, 4.74169921875, 4.96441650390625, 5.1871337890625, 5.40985107421875, 5.632568359375, 5.85528564453125, 6.0780029296875, 6.30072021484375, 6.5234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 12.0, 17.0, 15.0, 24.0, 34.0, 32.0, 53.0, 54.0, 65.0, 76.0, 81.0, 87.0, 56.0, 62.0, 72.0, 63.0, 55.0, 38.0, 35.0, 23.0, 11.0, 15.0, 7.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.151519775390625, -1.09796142578125, -1.044403076171875, -0.9908447265625, -0.937286376953125, -0.88372802734375, -0.830169677734375, -0.776611328125, -0.723052978515625, -0.66949462890625, -0.615936279296875, -0.5623779296875, -0.508819580078125, -0.45526123046875, -0.401702880859375, -0.34814453125, -0.294586181640625, -0.24102783203125, -0.187469482421875, -0.1339111328125, -0.080352783203125, -0.02679443359375, 0.026763916015625, 0.080322265625, 0.133880615234375, 0.18743896484375, 0.240997314453125, 0.2945556640625, 0.348114013671875, 0.40167236328125, 0.455230712890625, 0.5087890625, 0.562347412109375, 0.61590576171875, 0.669464111328125, 0.7230224609375, 0.776580810546875, 0.83013916015625, 0.883697509765625, 0.937255859375, 0.990814208984375, 1.04437255859375, 1.097930908203125, 1.1514892578125, 1.205047607421875, 1.25860595703125, 1.312164306640625, 1.36572265625, 1.419281005859375, 1.47283935546875, 1.526397705078125, 1.5799560546875, 1.633514404296875, 1.68707275390625, 1.740631103515625, 1.794189453125, 1.847747802734375, 1.90130615234375, 1.954864501953125, 2.0084228515625, 2.061981201171875, 2.11553955078125, 2.169097900390625, 2.22265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 6.0, 7.0, 14.0, 9.0, 11.0, 24.0, 30.0, 42.0, 63.0, 114.0, 207.0, 456.0, 1136.0, 3940.0, 21985.0, 280247.0, 679385.0, 50911.0, 6980.0, 1697.0, 608.0, 285.0, 126.0, 74.0, 42.0, 42.0, 19.0, 21.0, 18.0, 10.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.9375, -10.63525390625, -10.3330078125, -10.03076171875, -9.728515625, -9.42626953125, -9.1240234375, -8.82177734375, -8.51953125, -8.21728515625, -7.9150390625, -7.61279296875, -7.310546875, -7.00830078125, -6.7060546875, -6.40380859375, -6.1015625, -5.79931640625, -5.4970703125, -5.19482421875, -4.892578125, -4.59033203125, -4.2880859375, -3.98583984375, -3.68359375, -3.38134765625, -3.0791015625, -2.77685546875, -2.474609375, -2.17236328125, -1.8701171875, -1.56787109375, -1.265625, -0.96337890625, -0.6611328125, -0.35888671875, -0.056640625, 0.24560546875, 0.5478515625, 0.85009765625, 1.15234375, 1.45458984375, 1.7568359375, 2.05908203125, 2.361328125, 2.66357421875, 2.9658203125, 3.26806640625, 3.5703125, 3.87255859375, 4.1748046875, 4.47705078125, 4.779296875, 5.08154296875, 5.3837890625, 5.68603515625, 5.98828125, 6.29052734375, 6.5927734375, 6.89501953125, 7.197265625, 7.49951171875, 7.8017578125, 8.10400390625, 8.40625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 7.0, 1.0, 3.0, 6.0, 9.0, 12.0, 21.0, 13.0, 28.0, 32.0, 38.0, 38.0, 38.0, 57.0, 42.0, 72.0, 65.0, 51.0, 67.0, 56.0, 39.0, 47.0, 52.0, 35.0, 31.0, 31.0, 16.0, 16.0, 16.0, 12.0, 13.0, 8.0, 7.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.375, -7.17230224609375, -6.9696044921875, -6.76690673828125, -6.564208984375, -6.36151123046875, -6.1588134765625, -5.95611572265625, -5.75341796875, -5.55072021484375, -5.3480224609375, -5.14532470703125, -4.942626953125, -4.73992919921875, -4.5372314453125, -4.33453369140625, -4.1318359375, -3.92913818359375, -3.7264404296875, -3.52374267578125, -3.321044921875, -3.11834716796875, -2.9156494140625, -2.71295166015625, -2.51025390625, -2.30755615234375, -2.1048583984375, -1.90216064453125, -1.699462890625, -1.49676513671875, -1.2940673828125, -1.09136962890625, -0.888671875, -0.68597412109375, -0.4832763671875, -0.28057861328125, -0.077880859375, 0.12481689453125, 0.3275146484375, 0.53021240234375, 0.73291015625, 0.93560791015625, 1.1383056640625, 1.34100341796875, 1.543701171875, 1.74639892578125, 1.9490966796875, 2.15179443359375, 2.3544921875, 2.55718994140625, 2.7598876953125, 2.96258544921875, 3.165283203125, 3.36798095703125, 3.5706787109375, 3.77337646484375, 3.97607421875, 4.17877197265625, 4.3814697265625, 4.58416748046875, 4.786865234375, 4.98956298828125, 5.1922607421875, 5.39495849609375, 5.59765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 2.0, 8.0, 6.0, 9.0, 17.0, 21.0, 30.0, 51.0, 68.0, 115.0, 187.0, 353.0, 725.0, 1779.0, 6305.0, 42228.0, 918828.0, 65808.0, 8049.0, 2120.0, 904.0, 395.0, 193.0, 118.0, 72.0, 44.0, 32.0, 18.0, 20.0, 15.0, 8.0, 3.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.109375, -11.71337890625, -11.3173828125, -10.92138671875, -10.525390625, -10.12939453125, -9.7333984375, -9.33740234375, -8.94140625, -8.54541015625, -8.1494140625, -7.75341796875, -7.357421875, -6.96142578125, -6.5654296875, -6.16943359375, -5.7734375, -5.37744140625, -4.9814453125, -4.58544921875, -4.189453125, -3.79345703125, -3.3974609375, -3.00146484375, -2.60546875, -2.20947265625, -1.8134765625, -1.41748046875, -1.021484375, -0.62548828125, -0.2294921875, 0.16650390625, 0.5625, 0.95849609375, 1.3544921875, 1.75048828125, 2.146484375, 2.54248046875, 2.9384765625, 3.33447265625, 3.73046875, 4.12646484375, 4.5224609375, 4.91845703125, 5.314453125, 5.71044921875, 6.1064453125, 6.50244140625, 6.8984375, 7.29443359375, 7.6904296875, 8.08642578125, 8.482421875, 8.87841796875, 9.2744140625, 9.67041015625, 10.06640625, 10.46240234375, 10.8583984375, 11.25439453125, 11.650390625, 12.04638671875, 12.4423828125, 12.83837890625, 13.234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 11.0, 13.0, 17.0, 15.0, 33.0, 61.0, 192.0, 370.0, 115.0, 71.0, 32.0, 22.0, 12.0, 9.0, 6.0, 4.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0015697479248046875, -0.0015160739421844482, -0.001462399959564209, -0.0014087259769439697, -0.0013550519943237305, -0.0013013780117034912, -0.001247704029083252, -0.0011940300464630127, -0.0011403560638427734, -0.0010866820812225342, -0.001033008098602295, -0.0009793341159820557, -0.0009256601333618164, -0.0008719861507415771, -0.0008183121681213379, -0.0007646381855010986, -0.0007109642028808594, -0.0006572902202606201, -0.0006036162376403809, -0.0005499422550201416, -0.0004962682723999023, -0.0004425942897796631, -0.00038892030715942383, -0.00033524632453918457, -0.0002815723419189453, -0.00022789835929870605, -0.0001742243766784668, -0.00012055039405822754, -6.687641143798828e-05, -1.3202428817749023e-05, 4.0471553802490234e-05, 9.414553642272949e-05, 0.00014781951904296875, 0.000201493501663208, 0.00025516748428344727, 0.0003088414669036865, 0.0003625154495239258, 0.00041618943214416504, 0.0004698634147644043, 0.0005235373973846436, 0.0005772113800048828, 0.0006308853626251221, 0.0006845593452453613, 0.0007382333278656006, 0.0007919073104858398, 0.0008455812931060791, 0.0008992552757263184, 0.0009529292583465576, 0.0010066032409667969, 0.0010602772235870361, 0.0011139512062072754, 0.0011676251888275146, 0.001221299171447754, 0.0012749731540679932, 0.0013286471366882324, 0.0013823211193084717, 0.001435995101928711, 0.0014896690845489502, 0.0015433430671691895, 0.0015970170497894287, 0.001650691032409668, 0.0017043650150299072, 0.0017580389976501465, 0.0018117129802703857, 0.001865386962890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 13.0, 28.0, 32.0, 66.0, 132.0, 256.0, 586.0, 1440.0, 5742.0, 52054.0, 936452.0, 43998.0, 5404.0, 1345.0, 495.0, 233.0, 112.0, 68.0, 35.0, 20.0, 14.0, 3.0, 8.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.28125, -19.739990234375, -19.19873046875, -18.657470703125, -18.1162109375, -17.574951171875, -17.03369140625, -16.492431640625, -15.951171875, -15.409912109375, -14.86865234375, -14.327392578125, -13.7861328125, -13.244873046875, -12.70361328125, -12.162353515625, -11.62109375, -11.079833984375, -10.53857421875, -9.997314453125, -9.4560546875, -8.914794921875, -8.37353515625, -7.832275390625, -7.291015625, -6.749755859375, -6.20849609375, -5.667236328125, -5.1259765625, -4.584716796875, -4.04345703125, -3.502197265625, -2.9609375, -2.419677734375, -1.87841796875, -1.337158203125, -0.7958984375, -0.254638671875, 0.28662109375, 0.827880859375, 1.369140625, 1.910400390625, 2.45166015625, 2.992919921875, 3.5341796875, 4.075439453125, 4.61669921875, 5.157958984375, 5.69921875, 6.240478515625, 6.78173828125, 7.322998046875, 7.8642578125, 8.405517578125, 8.94677734375, 9.488037109375, 10.029296875, 10.570556640625, 11.11181640625, 11.653076171875, 12.1943359375, 12.735595703125, 13.27685546875, 13.818115234375, 14.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 13.0, 16.0, 20.0, 42.0, 53.0, 133.0, 396.0, 132.0, 65.0, 38.0, 27.0, 22.0, 7.0, 8.0, 6.0, 2.0, 8.0, 3.0, 4.0, 1.0, 1.0, 3.0], "bins": [-16.609375, -16.26763916015625, -15.9259033203125, -15.58416748046875, -15.242431640625, -14.90069580078125, -14.5589599609375, -14.21722412109375, -13.87548828125, -13.53375244140625, -13.1920166015625, -12.85028076171875, -12.508544921875, -12.16680908203125, -11.8250732421875, -11.48333740234375, -11.1416015625, -10.79986572265625, -10.4581298828125, -10.11639404296875, -9.774658203125, -9.43292236328125, -9.0911865234375, -8.74945068359375, -8.40771484375, -8.06597900390625, -7.7242431640625, -7.38250732421875, -7.040771484375, -6.69903564453125, -6.3572998046875, -6.01556396484375, -5.673828125, -5.33209228515625, -4.9903564453125, -4.64862060546875, -4.306884765625, -3.96514892578125, -3.6234130859375, -3.28167724609375, -2.93994140625, -2.59820556640625, -2.2564697265625, -1.91473388671875, -1.572998046875, -1.23126220703125, -0.8895263671875, -0.54779052734375, -0.2060546875, 0.13568115234375, 0.4774169921875, 0.81915283203125, 1.160888671875, 1.50262451171875, 1.8443603515625, 2.18609619140625, 2.52783203125, 2.86956787109375, 3.2113037109375, 3.55303955078125, 3.894775390625, 4.23651123046875, 4.5782470703125, 4.91998291015625, 5.26171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 9.0, 10.0, 31.0, 82.0, 119.0, 147.0, 177.0, 183.0, 120.0, 57.0, 40.0, 17.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.11772155761719, -108.29843139648438, -105.47914123535156, -102.65985870361328, -99.84056854248047, -97.02127838134766, -94.20199584960938, -91.38270568847656, -88.56341552734375, -85.74412536621094, -82.92483520507812, -80.10555267333984, -77.28626251220703, -74.46697235107422, -71.64768981933594, -68.82839965820312, -66.00910949707031, -63.1898193359375, -60.37053298950195, -57.551246643066406, -54.731956481933594, -51.91266632080078, -49.093379974365234, -46.27409362792969, -43.454803466796875, -40.63551330566406, -37.816226959228516, -34.99694061279297, -32.177650451660156, -29.358362197875977, -26.539073944091797, -23.719785690307617, -20.900497436523438, -18.081209182739258, -15.261920928955078, -12.442632675170898, -9.623344421386719, -6.804056167602539, -3.9847679138183594, -1.1654796600341797, 1.65380859375, 4.47309684753418, 7.292385101318359, 10.111673355102539, 12.930961608886719, 15.750249862670898, 18.569538116455078, 21.388826370239258, 24.208114624023438, 27.027402877807617, 29.846691131591797, 32.665977478027344, 35.485267639160156, 38.30455780029297, 41.123844146728516, 43.94313049316406, 46.762420654296875, 49.58171081542969, 52.400997161865234, 55.22028350830078, 58.039573669433594, 60.858863830566406, 63.67815017700195, 66.4974365234375, 69.31672668457031]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 3.0, 13.0, 10.0, 17.0, 25.0, 25.0, 38.0, 31.0, 30.0, 51.0, 56.0, 50.0, 45.0, 46.0, 59.0, 59.0, 52.0, 52.0, 41.0, 36.0, 41.0, 38.0, 31.0, 28.0, 27.0, 14.0, 17.0, 22.0, 9.0, 8.0, 6.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.18307876586914, -45.781185150146484, -44.379295349121094, -42.97740173339844, -41.57550811767578, -40.173614501953125, -38.77172088623047, -37.36983108520508, -35.96793746948242, -34.566043853759766, -33.164154052734375, -31.76226043701172, -30.360366821289062, -28.958473205566406, -27.556581497192383, -26.15468978881836, -24.752796173095703, -23.350902557373047, -21.949010848999023, -20.547119140625, -19.145225524902344, -17.743331909179688, -16.341440200805664, -14.939547538757324, -13.537654876708984, -12.135762214660645, -10.733869552612305, -9.331976890563965, -7.930084228515625, -6.528191566467285, -5.126298904418945, -3.7244062423706055, -2.3225173950195312, -0.9206247329711914, 0.48126792907714844, 1.8831605911254883, 3.285053253173828, 4.686945915222168, 6.088838577270508, 7.490731239318848, 8.892623901367188, 10.294516563415527, 11.696409225463867, 13.098301887512207, 14.500194549560547, 15.902087211608887, 17.303979873657227, 18.70587158203125, 20.107765197753906, 21.509658813476562, 22.911550521850586, 24.31344223022461, 25.715335845947266, 27.117229461669922, 28.519121170043945, 29.92101287841797, 31.322906494140625, 32.72480010986328, 34.12669372558594, 35.52858352661133, 36.930477142333984, 38.33237075805664, 39.73426055908203, 41.13615417480469, 42.538047790527344]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 6.0, 7.0, 9.0, 5.0, 9.0, 18.0, 23.0, 41.0, 56.0, 101.0, 174.0, 280.0, 563.0, 1098.0, 2501.0, 6364.0, 18572.0, 86011.0, 3680613.0, 341844.0, 37426.0, 10714.0, 4022.0, 1776.0, 876.0, 504.0, 244.0, 126.0, 92.0, 63.0, 48.0, 22.0, 26.0, 14.0, 11.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.29412841796875, -7.0570068359375, -6.81988525390625, -6.582763671875, -6.34564208984375, -6.1085205078125, -5.87139892578125, -5.63427734375, -5.39715576171875, -5.1600341796875, -4.92291259765625, -4.685791015625, -4.44866943359375, -4.2115478515625, -3.97442626953125, -3.7373046875, -3.50018310546875, -3.2630615234375, -3.02593994140625, -2.788818359375, -2.55169677734375, -2.3145751953125, -2.07745361328125, -1.84033203125, -1.60321044921875, -1.3660888671875, -1.12896728515625, -0.891845703125, -0.65472412109375, -0.4176025390625, -0.18048095703125, 0.056640625, 0.29376220703125, 0.5308837890625, 0.76800537109375, 1.005126953125, 1.24224853515625, 1.4793701171875, 1.71649169921875, 1.95361328125, 2.19073486328125, 2.4278564453125, 2.66497802734375, 2.902099609375, 3.13922119140625, 3.3763427734375, 3.61346435546875, 3.8505859375, 4.08770751953125, 4.3248291015625, 4.56195068359375, 4.799072265625, 5.03619384765625, 5.2733154296875, 5.51043701171875, 5.74755859375, 5.98468017578125, 6.2218017578125, 6.45892333984375, 6.696044921875, 6.93316650390625, 7.1702880859375, 7.40740966796875, 7.64453125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 7.0, 10.0, 8.0, 15.0, 22.0, 19.0, 27.0, 32.0, 38.0, 56.0, 62.0, 67.0, 67.0, 60.0, 63.0, 55.0, 73.0, 59.0, 53.0, 31.0, 39.0, 31.0, 35.0, 28.0, 18.0, 12.0, 5.0, 4.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.693878173828125, -1.63189697265625, -1.569915771484375, -1.5079345703125, -1.445953369140625, -1.38397216796875, -1.321990966796875, -1.260009765625, -1.198028564453125, -1.13604736328125, -1.074066162109375, -1.0120849609375, -0.950103759765625, -0.88812255859375, -0.826141357421875, -0.76416015625, -0.702178955078125, -0.64019775390625, -0.578216552734375, -0.5162353515625, -0.454254150390625, -0.39227294921875, -0.330291748046875, -0.268310546875, -0.206329345703125, -0.14434814453125, -0.082366943359375, -0.0203857421875, 0.041595458984375, 0.10357666015625, 0.165557861328125, 0.2275390625, 0.289520263671875, 0.35150146484375, 0.413482666015625, 0.4754638671875, 0.537445068359375, 0.59942626953125, 0.661407470703125, 0.723388671875, 0.785369873046875, 0.84735107421875, 0.909332275390625, 0.9713134765625, 1.033294677734375, 1.09527587890625, 1.157257080078125, 1.21923828125, 1.281219482421875, 1.34320068359375, 1.405181884765625, 1.4671630859375, 1.529144287109375, 1.59112548828125, 1.653106689453125, 1.715087890625, 1.777069091796875, 1.83905029296875, 1.901031494140625, 1.9630126953125, 2.024993896484375, 2.08697509765625, 2.148956298828125, 2.2109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 11.0, 18.0, 16.0, 25.0, 51.0, 124.0, 253.0, 530.0, 1233.0, 3336.0, 10081.0, 48518.0, 3097905.0, 979286.0, 39064.0, 8860.0, 2909.0, 1116.0, 468.0, 229.0, 95.0, 70.0, 25.0, 24.0, 7.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.3546142578125, -7.990478515625, -7.6263427734375, -7.26220703125, -6.8980712890625, -6.533935546875, -6.1697998046875, -5.8056640625, -5.4415283203125, -5.077392578125, -4.7132568359375, -4.34912109375, -3.9849853515625, -3.620849609375, -3.2567138671875, -2.892578125, -2.5284423828125, -2.164306640625, -1.8001708984375, -1.43603515625, -1.0718994140625, -0.707763671875, -0.3436279296875, 0.0205078125, 0.3846435546875, 0.748779296875, 1.1129150390625, 1.47705078125, 1.8411865234375, 2.205322265625, 2.5694580078125, 2.93359375, 3.2977294921875, 3.661865234375, 4.0260009765625, 4.39013671875, 4.7542724609375, 5.118408203125, 5.4825439453125, 5.8466796875, 6.2108154296875, 6.574951171875, 6.9390869140625, 7.30322265625, 7.6673583984375, 8.031494140625, 8.3956298828125, 8.759765625, 9.1239013671875, 9.488037109375, 9.8521728515625, 10.21630859375, 10.5804443359375, 10.944580078125, 11.3087158203125, 11.6728515625, 12.0369873046875, 12.401123046875, 12.7652587890625, 13.12939453125, 13.4935302734375, 13.857666015625, 14.2218017578125, 14.5859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 11.0, 9.0, 20.0, 24.0, 35.0, 44.0, 80.0, 124.0, 266.0, 1210.0, 1556.0, 277.0, 134.0, 89.0, 33.0, 34.0, 18.0, 17.0, 17.0, 9.0, 6.0, 4.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.759765625, -3.645965576171875, -3.53216552734375, -3.418365478515625, -3.3045654296875, -3.190765380859375, -3.07696533203125, -2.963165283203125, -2.849365234375, -2.735565185546875, -2.62176513671875, -2.507965087890625, -2.3941650390625, -2.280364990234375, -2.16656494140625, -2.052764892578125, -1.93896484375, -1.825164794921875, -1.71136474609375, -1.597564697265625, -1.4837646484375, -1.369964599609375, -1.25616455078125, -1.142364501953125, -1.028564453125, -0.914764404296875, -0.80096435546875, -0.687164306640625, -0.5733642578125, -0.459564208984375, -0.34576416015625, -0.231964111328125, -0.1181640625, -0.004364013671875, 0.10943603515625, 0.223236083984375, 0.3370361328125, 0.450836181640625, 0.56463623046875, 0.678436279296875, 0.792236328125, 0.906036376953125, 1.01983642578125, 1.133636474609375, 1.2474365234375, 1.361236572265625, 1.47503662109375, 1.588836669921875, 1.70263671875, 1.816436767578125, 1.93023681640625, 2.044036865234375, 2.1578369140625, 2.271636962890625, 2.38543701171875, 2.499237060546875, 2.613037109375, 2.726837158203125, 2.84063720703125, 2.954437255859375, 3.0682373046875, 3.182037353515625, 3.29583740234375, 3.409637451171875, 3.5234375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 22.0, 61.0, 215.0, 373.0, 239.0, 69.0, 17.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.48078918457031, -96.53252410888672, -94.58426666259766, -92.63600158691406, -90.687744140625, -88.7394790649414, -86.79121398925781, -84.84295654296875, -82.89469146728516, -80.94642639160156, -78.9981689453125, -77.0499038696289, -75.10164642333984, -73.15338134765625, -71.20511627197266, -69.2568588256836, -67.30859375, -65.3603286743164, -63.412071228027344, -61.46380615234375, -59.51554489135742, -57.567283630371094, -55.619022369384766, -53.67076110839844, -51.72249984741211, -49.77423858642578, -47.82597732543945, -45.87771224975586, -43.92945098876953, -41.9811897277832, -40.032928466796875, -38.08466339111328, -36.13639831542969, -34.18813705444336, -32.23987579345703, -30.29161262512207, -28.34334945678711, -26.39508819580078, -24.446826934814453, -22.498563766479492, -20.550304412841797, -18.60204315185547, -16.653779983520508, -14.70551872253418, -12.757255554199219, -10.80899429321289, -8.860732078552246, -6.912469863891602, -4.964206695556641, -3.015944480895996, -1.0676825046539307, 0.8805794715881348, 2.8288416862487793, 4.777103424072266, 6.72536563873291, 8.673627853393555, 10.6218900680542, 12.570152282714844, 14.518414497375488, 16.466676712036133, 18.41493797302246, 20.363201141357422, 22.31146240234375, 24.259723663330078, 26.20798683166504]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 4.0, 3.0, 12.0, 9.0, 10.0, 9.0, 15.0, 21.0, 31.0, 18.0, 27.0, 29.0, 41.0, 36.0, 42.0, 39.0, 56.0, 49.0, 55.0, 37.0, 53.0, 54.0, 45.0, 44.0, 34.0, 39.0, 29.0, 25.0, 24.0, 27.0, 18.0, 7.0, 17.0, 9.0, 5.0, 8.0, 0.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.456963539123535, -12.078927040100098, -11.700889587402344, -11.322853088378906, -10.944816589355469, -10.566780090332031, -10.188742637634277, -9.81070613861084, -9.432668685913086, -9.054632186889648, -8.676594734191895, -8.298558235168457, -7.9205217361450195, -7.542484760284424, -7.164447784423828, -6.786411285400391, -6.408374786376953, -6.030337810516357, -5.65230131149292, -5.274264335632324, -4.896227836608887, -4.518190860748291, -4.140153884887695, -3.7621171474456787, -3.384080410003662, -3.0060436725616455, -2.628006935119629, -2.249969959259033, -1.8719332218170166, -1.493896484375, -1.1158595085144043, -0.7378227710723877, -0.3597850799560547, 0.01825171709060669, 0.39628851413726807, 0.7743253707885742, 1.1523621082305908, 1.5303988456726074, 1.9084358215332031, 2.2864725589752197, 2.6645092964172363, 3.042546033859253, 3.4205827713012695, 3.7986197471618652, 4.176656723022461, 4.554693222045898, 4.932730197906494, 5.31076717376709, 5.688803672790527, 6.066840648651123, 6.4448771476745605, 6.822914123535156, 7.200950622558594, 7.5789875984191895, 7.957024574279785, 8.335061073303223, 8.713098526000977, 9.091135025024414, 9.469172477722168, 9.847208976745605, 10.225245475769043, 10.603282928466797, 10.981319427490234, 11.359355926513672, 11.73739242553711]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 6.0, 1.0, 9.0, 10.0, 16.0, 16.0, 19.0, 42.0, 54.0, 81.0, 141.0, 221.0, 351.0, 581.0, 1118.0, 2177.0, 4201.0, 8657.0, 18486.0, 42617.0, 99061.0, 212363.0, 294595.0, 199674.0, 90868.0, 39392.0, 17205.0, 8144.0, 3837.0, 1999.0, 1050.0, 590.0, 345.0, 217.0, 133.0, 90.0, 56.0, 41.0, 29.0, 27.0, 9.0, 12.0, 7.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.515625, -3.400177001953125, -3.28472900390625, -3.169281005859375, -3.0538330078125, -2.938385009765625, -2.82293701171875, -2.707489013671875, -2.592041015625, -2.476593017578125, -2.36114501953125, -2.245697021484375, -2.1302490234375, -2.014801025390625, -1.89935302734375, -1.783905029296875, -1.66845703125, -1.553009033203125, -1.43756103515625, -1.322113037109375, -1.2066650390625, -1.091217041015625, -0.97576904296875, -0.860321044921875, -0.744873046875, -0.629425048828125, -0.51397705078125, -0.398529052734375, -0.2830810546875, -0.167633056640625, -0.05218505859375, 0.063262939453125, 0.1787109375, 0.294158935546875, 0.40960693359375, 0.525054931640625, 0.6405029296875, 0.755950927734375, 0.87139892578125, 0.986846923828125, 1.102294921875, 1.217742919921875, 1.33319091796875, 1.448638916015625, 1.5640869140625, 1.679534912109375, 1.79498291015625, 1.910430908203125, 2.02587890625, 2.141326904296875, 2.25677490234375, 2.372222900390625, 2.4876708984375, 2.603118896484375, 2.71856689453125, 2.834014892578125, 2.949462890625, 3.064910888671875, 3.18035888671875, 3.295806884765625, 3.4112548828125, 3.526702880859375, 3.64215087890625, 3.757598876953125, 3.873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 8.0, 8.0, 15.0, 12.0, 19.0, 22.0, 16.0, 37.0, 41.0, 57.0, 45.0, 54.0, 59.0, 51.0, 55.0, 74.0, 70.0, 59.0, 49.0, 44.0, 28.0, 35.0, 29.0, 24.0, 19.0, 15.0, 17.0, 11.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44140625, -1.38104248046875, -1.3206787109375, -1.26031494140625, -1.199951171875, -1.13958740234375, -1.0792236328125, -1.01885986328125, -0.95849609375, -0.89813232421875, -0.8377685546875, -0.77740478515625, -0.717041015625, -0.65667724609375, -0.5963134765625, -0.53594970703125, -0.4755859375, -0.41522216796875, -0.3548583984375, -0.29449462890625, -0.234130859375, -0.17376708984375, -0.1134033203125, -0.05303955078125, 0.00732421875, 0.06768798828125, 0.1280517578125, 0.18841552734375, 0.248779296875, 0.30914306640625, 0.3695068359375, 0.42987060546875, 0.490234375, 0.55059814453125, 0.6109619140625, 0.67132568359375, 0.731689453125, 0.79205322265625, 0.8524169921875, 0.91278076171875, 0.97314453125, 1.03350830078125, 1.0938720703125, 1.15423583984375, 1.214599609375, 1.27496337890625, 1.3353271484375, 1.39569091796875, 1.4560546875, 1.51641845703125, 1.5767822265625, 1.63714599609375, 1.697509765625, 1.75787353515625, 1.8182373046875, 1.87860107421875, 1.93896484375, 1.99932861328125, 2.0596923828125, 2.12005615234375, 2.180419921875, 2.24078369140625, 2.3011474609375, 2.36151123046875, 2.421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 14.0, 17.0, 15.0, 26.0, 49.0, 70.0, 99.0, 179.0, 388.0, 1192.0, 5675.0, 62878.0, 746297.0, 214874.0, 13520.0, 2031.0, 566.0, 255.0, 123.0, 84.0, 54.0, 28.0, 17.0, 16.0, 13.0, 20.0, 7.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.7685546875, -10.349609375, -9.9306640625, -9.51171875, -9.0927734375, -8.673828125, -8.2548828125, -7.8359375, -7.4169921875, -6.998046875, -6.5791015625, -6.16015625, -5.7412109375, -5.322265625, -4.9033203125, -4.484375, -4.0654296875, -3.646484375, -3.2275390625, -2.80859375, -2.3896484375, -1.970703125, -1.5517578125, -1.1328125, -0.7138671875, -0.294921875, 0.1240234375, 0.54296875, 0.9619140625, 1.380859375, 1.7998046875, 2.21875, 2.6376953125, 3.056640625, 3.4755859375, 3.89453125, 4.3134765625, 4.732421875, 5.1513671875, 5.5703125, 5.9892578125, 6.408203125, 6.8271484375, 7.24609375, 7.6650390625, 8.083984375, 8.5029296875, 8.921875, 9.3408203125, 9.759765625, 10.1787109375, 10.59765625, 11.0166015625, 11.435546875, 11.8544921875, 12.2734375, 12.6923828125, 13.111328125, 13.5302734375, 13.94921875, 14.3681640625, 14.787109375, 15.2060546875, 15.625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 9.0, 11.0, 16.0, 11.0, 18.0, 15.0, 18.0, 15.0, 30.0, 26.0, 26.0, 42.0, 50.0, 41.0, 36.0, 53.0, 38.0, 42.0, 53.0, 49.0, 45.0, 39.0, 33.0, 42.0, 35.0, 26.0, 27.0, 25.0, 21.0, 17.0, 14.0, 10.0, 15.0, 6.0, 12.0, 5.0, 2.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.4765625, -9.200439453125, -8.92431640625, -8.648193359375, -8.3720703125, -8.095947265625, -7.81982421875, -7.543701171875, -7.267578125, -6.991455078125, -6.71533203125, -6.439208984375, -6.1630859375, -5.886962890625, -5.61083984375, -5.334716796875, -5.05859375, -4.782470703125, -4.50634765625, -4.230224609375, -3.9541015625, -3.677978515625, -3.40185546875, -3.125732421875, -2.849609375, -2.573486328125, -2.29736328125, -2.021240234375, -1.7451171875, -1.468994140625, -1.19287109375, -0.916748046875, -0.640625, -0.364501953125, -0.08837890625, 0.187744140625, 0.4638671875, 0.739990234375, 1.01611328125, 1.292236328125, 1.568359375, 1.844482421875, 2.12060546875, 2.396728515625, 2.6728515625, 2.948974609375, 3.22509765625, 3.501220703125, 3.77734375, 4.053466796875, 4.32958984375, 4.605712890625, 4.8818359375, 5.157958984375, 5.43408203125, 5.710205078125, 5.986328125, 6.262451171875, 6.53857421875, 6.814697265625, 7.0908203125, 7.366943359375, 7.64306640625, 7.919189453125, 8.1953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 9.0, 3.0, 7.0, 8.0, 11.0, 24.0, 33.0, 54.0, 101.0, 185.0, 307.0, 651.0, 1501.0, 3805.0, 11651.0, 56074.0, 416904.0, 471979.0, 65157.0, 12873.0, 4121.0, 1570.0, 741.0, 335.0, 194.0, 99.0, 52.0, 40.0, 21.0, 10.0, 14.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01171875, -3.85150146484375, -3.6912841796875, -3.53106689453125, -3.370849609375, -3.21063232421875, -3.0504150390625, -2.89019775390625, -2.72998046875, -2.56976318359375, -2.4095458984375, -2.24932861328125, -2.089111328125, -1.92889404296875, -1.7686767578125, -1.60845947265625, -1.4482421875, -1.28802490234375, -1.1278076171875, -0.96759033203125, -0.807373046875, -0.64715576171875, -0.4869384765625, -0.32672119140625, -0.16650390625, -0.00628662109375, 0.1539306640625, 0.31414794921875, 0.474365234375, 0.63458251953125, 0.7947998046875, 0.95501708984375, 1.115234375, 1.27545166015625, 1.4356689453125, 1.59588623046875, 1.756103515625, 1.91632080078125, 2.0765380859375, 2.23675537109375, 2.39697265625, 2.55718994140625, 2.7174072265625, 2.87762451171875, 3.037841796875, 3.19805908203125, 3.3582763671875, 3.51849365234375, 3.6787109375, 3.83892822265625, 3.9991455078125, 4.15936279296875, 4.319580078125, 4.47979736328125, 4.6400146484375, 4.80023193359375, 4.96044921875, 5.12066650390625, 5.2808837890625, 5.44110107421875, 5.601318359375, 5.76153564453125, 5.9217529296875, 6.08197021484375, 6.2421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 1.0, 7.0, 7.0, 13.0, 20.0, 32.0, 48.0, 91.0, 114.0, 146.0, 171.0, 146.0, 88.0, 45.0, 22.0, 17.0, 6.0, 9.0, 2.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011777877807617188, -0.00113716721534729, -0.0010965466499328613, -0.0010559260845184326, -0.001015305519104004, -0.0009746849536895752, -0.0009340643882751465, -0.0008934438228607178, -0.0008528232574462891, -0.0008122026920318604, -0.0007715821266174316, -0.0007309615612030029, -0.0006903409957885742, -0.0006497204303741455, -0.0006090998649597168, -0.0005684792995452881, -0.0005278587341308594, -0.00048723816871643066, -0.00044661760330200195, -0.00040599703788757324, -0.00036537647247314453, -0.0003247559070587158, -0.0002841353416442871, -0.0002435147762298584, -0.0002028942108154297, -0.00016227364540100098, -0.00012165307998657227, -8.103251457214355e-05, -4.0411949157714844e-05, 2.086162567138672e-07, 4.082918167114258e-05, 8.144974708557129e-05, 0.0001220703125, 0.0001626908779144287, 0.00020331144332885742, 0.00024393200874328613, 0.00028455257415771484, 0.00032517313957214355, 0.00036579370498657227, 0.000406414270401001, 0.0004470348358154297, 0.0004876554012298584, 0.0005282759666442871, 0.0005688965320587158, 0.0006095170974731445, 0.0006501376628875732, 0.000690758228302002, 0.0007313787937164307, 0.0007719993591308594, 0.0008126199245452881, 0.0008532404899597168, 0.0008938610553741455, 0.0009344816207885742, 0.0009751021862030029, 0.0010157227516174316, 0.0010563433170318604, 0.001096963882446289, 0.0011375844478607178, 0.0011782050132751465, 0.0012188255786895752, 0.001259446144104004, 0.0013000667095184326, 0.0013406872749328613, 0.00138130784034729, 0.0014219284057617188]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 14.0, 4.0, 12.0, 16.0, 22.0, 29.0, 28.0, 47.0, 85.0, 96.0, 165.0, 304.0, 525.0, 1022.0, 1999.0, 4193.0, 9898.0, 28466.0, 111497.0, 448205.0, 331830.0, 74464.0, 20856.0, 7631.0, 3441.0, 1695.0, 888.0, 449.0, 263.0, 150.0, 82.0, 61.0, 28.0, 19.0, 17.0, 9.0, 13.0, 7.0, 7.0, 8.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.26348876953125, -4.1207275390625, -3.97796630859375, -3.835205078125, -3.69244384765625, -3.5496826171875, -3.40692138671875, -3.26416015625, -3.12139892578125, -2.9786376953125, -2.83587646484375, -2.693115234375, -2.55035400390625, -2.4075927734375, -2.26483154296875, -2.1220703125, -1.97930908203125, -1.8365478515625, -1.69378662109375, -1.551025390625, -1.40826416015625, -1.2655029296875, -1.12274169921875, -0.97998046875, -0.83721923828125, -0.6944580078125, -0.55169677734375, -0.408935546875, -0.26617431640625, -0.1234130859375, 0.01934814453125, 0.162109375, 0.30487060546875, 0.4476318359375, 0.59039306640625, 0.733154296875, 0.87591552734375, 1.0186767578125, 1.16143798828125, 1.30419921875, 1.44696044921875, 1.5897216796875, 1.73248291015625, 1.875244140625, 2.01800537109375, 2.1607666015625, 2.30352783203125, 2.4462890625, 2.58905029296875, 2.7318115234375, 2.87457275390625, 3.017333984375, 3.16009521484375, 3.3028564453125, 3.44561767578125, 3.58837890625, 3.73114013671875, 3.8739013671875, 4.01666259765625, 4.159423828125, 4.30218505859375, 4.4449462890625, 4.58770751953125, 4.73046875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 2.0, 6.0, 3.0, 6.0, 8.0, 13.0, 21.0, 27.0, 32.0, 34.0, 43.0, 60.0, 82.0, 108.0, 92.0, 101.0, 64.0, 58.0, 53.0, 31.0, 35.0, 32.0, 26.0, 10.0, 14.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.28515625, -5.12811279296875, -4.9710693359375, -4.81402587890625, -4.656982421875, -4.49993896484375, -4.3428955078125, -4.18585205078125, -4.02880859375, -3.87176513671875, -3.7147216796875, -3.55767822265625, -3.400634765625, -3.24359130859375, -3.0865478515625, -2.92950439453125, -2.7724609375, -2.61541748046875, -2.4583740234375, -2.30133056640625, -2.144287109375, -1.98724365234375, -1.8302001953125, -1.67315673828125, -1.51611328125, -1.35906982421875, -1.2020263671875, -1.04498291015625, -0.887939453125, -0.73089599609375, -0.5738525390625, -0.41680908203125, -0.259765625, -0.10272216796875, 0.0543212890625, 0.21136474609375, 0.368408203125, 0.52545166015625, 0.6824951171875, 0.83953857421875, 0.99658203125, 1.15362548828125, 1.3106689453125, 1.46771240234375, 1.624755859375, 1.78179931640625, 1.9388427734375, 2.09588623046875, 2.2529296875, 2.40997314453125, 2.5670166015625, 2.72406005859375, 2.881103515625, 3.03814697265625, 3.1951904296875, 3.35223388671875, 3.50927734375, 3.66632080078125, 3.8233642578125, 3.98040771484375, 4.137451171875, 4.29449462890625, 4.4515380859375, 4.60858154296875, 4.765625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 8.0, 14.0, 36.0, 68.0, 144.0, 232.0, 230.0, 152.0, 66.0, 31.0, 16.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.33068084716797, -54.92445755004883, -51.51823425292969, -48.11201477050781, -44.70579147338867, -41.29956817626953, -37.893348693847656, -34.487125396728516, -31.080902099609375, -27.674678802490234, -24.268457412719727, -20.86223602294922, -17.456012725830078, -14.049789428710938, -10.64356803894043, -7.237346649169922, -3.8311233520507812, -0.42490100860595703, 2.981321334838867, 6.387543678283691, 9.793766021728516, 13.199989318847656, 16.606210708618164, 20.012432098388672, 23.418655395507812, 26.824878692626953, 30.23110008239746, 33.63732147216797, 37.04354476928711, 40.44976806640625, 43.855987548828125, 47.262210845947266, 50.66844177246094, 54.07466506958008, 57.48088836669922, 60.887107849121094, 64.2933349609375, 67.69955444335938, 71.10577392578125, 74.51199340820312, 77.91822052001953, 81.3244400024414, 84.73066711425781, 88.13688659667969, 91.54310607910156, 94.94933319091797, 98.35555267333984, 101.76177978515625, 105.16799926757812, 108.57421875, 111.9804458618164, 115.38666534423828, 118.79289245605469, 122.19911193847656, 125.60533142089844, 129.0115509033203, 132.41778564453125, 135.82400512695312, 139.230224609375, 142.63645935058594, 146.0426788330078, 149.4488983154297, 152.85511779785156, 156.26133728027344, 159.6675567626953]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 8.0, 15.0, 13.0, 21.0, 23.0, 26.0, 26.0, 32.0, 29.0, 37.0, 43.0, 47.0, 44.0, 55.0, 58.0, 56.0, 53.0, 47.0, 51.0, 37.0, 34.0, 28.0, 27.0, 29.0, 11.0, 17.0, 21.0, 20.0, 11.0, 5.0, 7.0, 9.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.12413024902344, -47.650535583496094, -46.17694091796875, -44.70334243774414, -43.2297477722168, -41.75615310668945, -40.28255844116211, -38.8089599609375, -37.335365295410156, -35.86177062988281, -34.38817596435547, -32.91457748413086, -31.440982818603516, -29.967388153076172, -28.493793487548828, -27.02019691467285, -25.546602249145508, -24.073007583618164, -22.599411010742188, -21.125816345214844, -19.652219772338867, -18.178625106811523, -16.705028533935547, -15.231433868408203, -13.757838249206543, -12.284242630004883, -10.810647010803223, -9.337051391601562, -7.8634562492370605, -6.3898606300354, -4.916265487670898, -3.4426698684692383, -1.9690742492675781, -0.4954787492752075, 0.9781167507171631, 2.451712131500244, 3.9253077507019043, 5.3989033699035645, 6.872498512268066, 8.346094131469727, 9.819689750671387, 11.293285369873047, 12.766880989074707, 14.240476608276367, 15.714071273803711, 17.187667846679688, 18.66126251220703, 20.134857177734375, 21.60845375061035, 23.082048416137695, 24.555644989013672, 26.029239654541016, 27.502836227416992, 28.976430892944336, 30.450027465820312, 31.923622131347656, 33.397216796875, 34.870811462402344, 36.34440612792969, 37.8180046081543, 39.29159927368164, 40.765193939208984, 42.23878860473633, 43.71238708496094, 45.18598175048828]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 9.0, 13.0, 18.0, 20.0, 36.0, 55.0, 69.0, 112.0, 161.0, 216.0, 324.0, 544.0, 1023.0, 2118.0, 5280.0, 25419.0, 3969409.0, 169572.0, 12581.0, 3486.0, 1501.0, 822.0, 492.0, 330.0, 200.0, 147.0, 93.0, 68.0, 46.0, 35.0, 32.0, 13.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3961181640625, -8.104736328125, -7.8133544921875, -7.52197265625, -7.2305908203125, -6.939208984375, -6.6478271484375, -6.3564453125, -6.0650634765625, -5.773681640625, -5.4822998046875, -5.19091796875, -4.8995361328125, -4.608154296875, -4.3167724609375, -4.025390625, -3.7340087890625, -3.442626953125, -3.1512451171875, -2.85986328125, -2.5684814453125, -2.277099609375, -1.9857177734375, -1.6943359375, -1.4029541015625, -1.111572265625, -0.8201904296875, -0.52880859375, -0.2374267578125, 0.053955078125, 0.3453369140625, 0.63671875, 0.9281005859375, 1.219482421875, 1.5108642578125, 1.80224609375, 2.0936279296875, 2.385009765625, 2.6763916015625, 2.9677734375, 3.2591552734375, 3.550537109375, 3.8419189453125, 4.13330078125, 4.4246826171875, 4.716064453125, 5.0074462890625, 5.298828125, 5.5902099609375, 5.881591796875, 6.1729736328125, 6.46435546875, 6.7557373046875, 7.047119140625, 7.3385009765625, 7.6298828125, 7.9212646484375, 8.212646484375, 8.5040283203125, 8.79541015625, 9.0867919921875, 9.378173828125, 9.6695556640625, 9.9609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 6.0, 24.0, 10.0, 17.0, 21.0, 22.0, 28.0, 33.0, 31.0, 47.0, 51.0, 42.0, 50.0, 69.0, 55.0, 39.0, 60.0, 53.0, 51.0, 45.0, 39.0, 31.0, 26.0, 28.0, 16.0, 19.0, 17.0, 11.0, 8.0, 9.0, 9.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.6064910888671875, -1.542083740234375, -1.4776763916015625, -1.41326904296875, -1.3488616943359375, -1.284454345703125, -1.2200469970703125, -1.1556396484375, -1.0912322998046875, -1.026824951171875, -0.9624176025390625, -0.89801025390625, -0.8336029052734375, -0.769195556640625, -0.7047882080078125, -0.640380859375, -0.5759735107421875, -0.511566162109375, -0.4471588134765625, -0.38275146484375, -0.3183441162109375, -0.253936767578125, -0.1895294189453125, -0.1251220703125, -0.0607147216796875, 0.003692626953125, 0.0680999755859375, 0.13250732421875, 0.1969146728515625, 0.261322021484375, 0.3257293701171875, 0.39013671875, 0.4545440673828125, 0.518951416015625, 0.5833587646484375, 0.64776611328125, 0.7121734619140625, 0.776580810546875, 0.8409881591796875, 0.9053955078125, 0.9698028564453125, 1.034210205078125, 1.0986175537109375, 1.16302490234375, 1.2274322509765625, 1.291839599609375, 1.3562469482421875, 1.420654296875, 1.4850616455078125, 1.549468994140625, 1.6138763427734375, 1.67828369140625, 1.7426910400390625, 1.807098388671875, 1.8715057373046875, 1.9359130859375, 2.0003204345703125, 2.064727783203125, 2.1291351318359375, 2.19354248046875, 2.2579498291015625, 2.322357177734375, 2.3867645263671875, 2.451171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 10.0, 19.0, 17.0, 27.0, 28.0, 30.0, 51.0, 75.0, 97.0, 134.0, 156.0, 210.0, 340.0, 515.0, 1210.0, 2968.0, 12812.0, 131376.0, 3984520.0, 47973.0, 7242.0, 2035.0, 905.0, 437.0, 307.0, 200.0, 122.0, 110.0, 87.0, 79.0, 46.0, 40.0, 27.0, 25.0, 12.0, 19.0, 4.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9287109375, -10.568359375, -10.2080078125, -9.84765625, -9.4873046875, -9.126953125, -8.7666015625, -8.40625, -8.0458984375, -7.685546875, -7.3251953125, -6.96484375, -6.6044921875, -6.244140625, -5.8837890625, -5.5234375, -5.1630859375, -4.802734375, -4.4423828125, -4.08203125, -3.7216796875, -3.361328125, -3.0009765625, -2.640625, -2.2802734375, -1.919921875, -1.5595703125, -1.19921875, -0.8388671875, -0.478515625, -0.1181640625, 0.2421875, 0.6025390625, 0.962890625, 1.3232421875, 1.68359375, 2.0439453125, 2.404296875, 2.7646484375, 3.125, 3.4853515625, 3.845703125, 4.2060546875, 4.56640625, 4.9267578125, 5.287109375, 5.6474609375, 6.0078125, 6.3681640625, 6.728515625, 7.0888671875, 7.44921875, 7.8095703125, 8.169921875, 8.5302734375, 8.890625, 9.2509765625, 9.611328125, 9.9716796875, 10.33203125, 10.6923828125, 11.052734375, 11.4130859375, 11.7734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 5.0, 13.0, 29.0, 48.0, 93.0, 495.0, 3066.0, 184.0, 56.0, 28.0, 25.0, 14.0, 1.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.0625, -2.98828125, -2.9140625, -2.83984375, -2.765625, -2.69140625, -2.6171875, -2.54296875, -2.46875, -2.39453125, -2.3203125, -2.24609375, -2.171875, -2.09765625, -2.0234375, -1.94921875, -1.875, -1.80078125, -1.7265625, -1.65234375, -1.578125, -1.50390625, -1.4296875, -1.35546875, -1.28125, -1.20703125, -1.1328125, -1.05859375, -0.984375, -0.91015625, -0.8359375, -0.76171875, -0.6875, -0.61328125, -0.5390625, -0.46484375, -0.390625, -0.31640625, -0.2421875, -0.16796875, -0.09375, -0.01953125, 0.0546875, 0.12890625, 0.203125, 0.27734375, 0.3515625, 0.42578125, 0.5, 0.57421875, 0.6484375, 0.72265625, 0.796875, 0.87109375, 0.9453125, 1.01953125, 1.09375, 1.16796875, 1.2421875, 1.31640625, 1.390625, 1.46484375, 1.5390625, 1.61328125, 1.6875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 8.0, 14.0, 11.0, 37.0, 46.0, 55.0, 101.0, 95.0, 134.0, 120.0, 96.0, 97.0, 48.0, 44.0, 32.0, 13.0, 13.0, 6.0, 12.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.122503280639648, -8.90251636505127, -8.68252944946289, -8.462541580200195, -8.242554664611816, -8.022567749023438, -7.802580833435059, -7.58259391784668, -7.362606525421143, -7.142619609832764, -6.922632217407227, -6.702645301818848, -6.482658386230469, -6.262670993804932, -6.042684078216553, -5.822696685791016, -5.602709770202637, -5.382722854614258, -5.162735462188721, -4.942748546600342, -4.722761154174805, -4.502774238586426, -4.282787322998047, -4.062800407409668, -3.842813014984131, -3.622825860977173, -3.402838706970215, -3.182851791381836, -2.962864637374878, -2.74287748336792, -2.522890567779541, -2.302903413772583, -2.082915782928467, -1.8629286289215088, -1.6429415941238403, -1.4229545593261719, -1.2029674053192139, -0.9829802513122559, -0.7629932165145874, -0.543006181716919, -0.32301902770996094, -0.1030319333076477, 0.11695516109466553, 0.33694225549697876, 0.556929349899292, 0.77691650390625, 0.9969035387039185, 1.216890573501587, 1.436877727508545, 1.656864881515503, 1.8768519163131714, 2.09683895111084, 2.316826105117798, 2.536813259124756, 2.7568001747131348, 2.9767873287200928, 3.196774482727051, 3.416761636734009, 3.636748790740967, 3.8567357063293457, 4.076723098754883, 4.296710014343262, 4.516696929931641, 4.7366838455200195, 4.956671237945557]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 9.0, 5.0, 12.0, 11.0, 15.0, 18.0, 9.0, 23.0, 28.0, 26.0, 26.0, 40.0, 36.0, 39.0, 27.0, 33.0, 45.0, 37.0, 41.0, 28.0, 37.0, 25.0, 31.0, 37.0, 38.0, 38.0, 31.0, 27.0, 21.0, 31.0, 21.0, 21.0, 17.0, 20.0, 8.0, 16.0, 10.0, 15.0, 5.0, 7.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9954991340637207, -2.896855115890503, -2.7982113361358643, -2.6995673179626465, -2.6009232997894287, -2.50227952003479, -2.4036355018615723, -2.3049917221069336, -2.206347703933716, -2.107703685760498, -2.0090599060058594, -1.9104158878326416, -1.8117719888687134, -1.7131280899047852, -1.6144840717315674, -1.5158401727676392, -1.4171961545944214, -1.3185522556304932, -1.2199082374572754, -1.1212643384933472, -1.022620439529419, -0.923976480960846, -0.825332522392273, -0.7266886234283447, -0.6280446648597717, -0.5294007062911987, -0.4307568073272705, -0.3321128487586975, -0.2334689199924469, -0.1348249912261963, -0.03618103265762329, 0.06246286630630493, 0.16110682487487793, 0.25975075364112854, 0.35839468240737915, 0.45703864097595215, 0.5556825399398804, 0.6543264985084534, 0.7529704570770264, 0.8516143560409546, 0.9502583146095276, 1.0489022731781006, 1.1475461721420288, 1.246190071105957, 1.3448340892791748, 1.443477988243103, 1.5421218872070312, 1.640765905380249, 1.7394098043441772, 1.8380537033081055, 1.9366977214813232, 2.035341739654541, 2.1339855194091797, 2.2326295375823975, 2.3312735557556152, 2.429917335510254, 2.5285613536834717, 2.6272053718566895, 2.725849151611328, 2.824493169784546, 2.9231371879577637, 3.0217809677124023, 3.12042498588562, 3.219069004058838, 3.3177127838134766]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 6.0, 16.0, 20.0, 41.0, 56.0, 86.0, 141.0, 254.0, 394.0, 727.0, 1371.0, 2811.0, 6144.0, 14317.0, 36039.0, 96610.0, 235727.0, 334345.0, 193930.0, 75502.0, 28454.0, 11521.0, 4975.0, 2388.0, 1146.0, 639.0, 344.0, 194.0, 131.0, 67.0, 45.0, 32.0, 21.0, 22.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.37890625, -4.24365234375, -4.1083984375, -3.97314453125, -3.837890625, -3.70263671875, -3.5673828125, -3.43212890625, -3.296875, -3.16162109375, -3.0263671875, -2.89111328125, -2.755859375, -2.62060546875, -2.4853515625, -2.35009765625, -2.21484375, -2.07958984375, -1.9443359375, -1.80908203125, -1.673828125, -1.53857421875, -1.4033203125, -1.26806640625, -1.1328125, -0.99755859375, -0.8623046875, -0.72705078125, -0.591796875, -0.45654296875, -0.3212890625, -0.18603515625, -0.05078125, 0.08447265625, 0.2197265625, 0.35498046875, 0.490234375, 0.62548828125, 0.7607421875, 0.89599609375, 1.03125, 1.16650390625, 1.3017578125, 1.43701171875, 1.572265625, 1.70751953125, 1.8427734375, 1.97802734375, 2.11328125, 2.24853515625, 2.3837890625, 2.51904296875, 2.654296875, 2.78955078125, 2.9248046875, 3.06005859375, 3.1953125, 3.33056640625, 3.4658203125, 3.60107421875, 3.736328125, 3.87158203125, 4.0068359375, 4.14208984375, 4.27734375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 5.0, 10.0, 20.0, 14.0, 27.0, 30.0, 30.0, 37.0, 55.0, 62.0, 52.0, 55.0, 69.0, 73.0, 65.0, 69.0, 54.0, 49.0, 43.0, 36.0, 28.0, 21.0, 19.0, 17.0, 12.0, 9.0, 10.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.83984375, -2.75677490234375, -2.6737060546875, -2.59063720703125, -2.507568359375, -2.42449951171875, -2.3414306640625, -2.25836181640625, -2.17529296875, -2.09222412109375, -2.0091552734375, -1.92608642578125, -1.843017578125, -1.75994873046875, -1.6768798828125, -1.59381103515625, -1.5107421875, -1.42767333984375, -1.3446044921875, -1.26153564453125, -1.178466796875, -1.09539794921875, -1.0123291015625, -0.92926025390625, -0.84619140625, -0.76312255859375, -0.6800537109375, -0.59698486328125, -0.513916015625, -0.43084716796875, -0.3477783203125, -0.26470947265625, -0.181640625, -0.09857177734375, -0.0155029296875, 0.06756591796875, 0.150634765625, 0.23370361328125, 0.3167724609375, 0.39984130859375, 0.48291015625, 0.56597900390625, 0.6490478515625, 0.73211669921875, 0.815185546875, 0.89825439453125, 0.9813232421875, 1.06439208984375, 1.1474609375, 1.23052978515625, 1.3135986328125, 1.39666748046875, 1.479736328125, 1.56280517578125, 1.6458740234375, 1.72894287109375, 1.81201171875, 1.89508056640625, 1.9781494140625, 2.06121826171875, 2.144287109375, 2.22735595703125, 2.3104248046875, 2.39349365234375, 2.4765625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 11.0, 3.0, 11.0, 11.0, 18.0, 22.0, 28.0, 62.0, 104.0, 199.0, 450.0, 1285.0, 5896.0, 62977.0, 751665.0, 208721.0, 13610.0, 2182.0, 693.0, 282.0, 123.0, 70.0, 49.0, 27.0, 12.0, 12.0, 6.0, 3.0, 5.0, 8.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.839599609375, -12.42138671875, -12.003173828125, -11.5849609375, -11.166748046875, -10.74853515625, -10.330322265625, -9.912109375, -9.493896484375, -9.07568359375, -8.657470703125, -8.2392578125, -7.821044921875, -7.40283203125, -6.984619140625, -6.56640625, -6.148193359375, -5.72998046875, -5.311767578125, -4.8935546875, -4.475341796875, -4.05712890625, -3.638916015625, -3.220703125, -2.802490234375, -2.38427734375, -1.966064453125, -1.5478515625, -1.129638671875, -0.71142578125, -0.293212890625, 0.125, 0.543212890625, 0.96142578125, 1.379638671875, 1.7978515625, 2.216064453125, 2.63427734375, 3.052490234375, 3.470703125, 3.888916015625, 4.30712890625, 4.725341796875, 5.1435546875, 5.561767578125, 5.97998046875, 6.398193359375, 6.81640625, 7.234619140625, 7.65283203125, 8.071044921875, 8.4892578125, 8.907470703125, 9.32568359375, 9.743896484375, 10.162109375, 10.580322265625, 10.99853515625, 11.416748046875, 11.8349609375, 12.253173828125, 12.67138671875, 13.089599609375, 13.5078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 1.0, 10.0, 12.0, 6.0, 10.0, 14.0, 13.0, 14.0, 23.0, 21.0, 26.0, 32.0, 27.0, 35.0, 27.0, 35.0, 36.0, 41.0, 50.0, 38.0, 49.0, 33.0, 44.0, 41.0, 35.0, 39.0, 28.0, 37.0, 24.0, 32.0, 29.0, 17.0, 19.0, 22.0, 12.0, 15.0, 9.0, 7.0, 5.0, 6.0, 7.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.329345703125, -9.01806640625, -8.706787109375, -8.3955078125, -8.084228515625, -7.77294921875, -7.461669921875, -7.150390625, -6.839111328125, -6.52783203125, -6.216552734375, -5.9052734375, -5.593994140625, -5.28271484375, -4.971435546875, -4.66015625, -4.348876953125, -4.03759765625, -3.726318359375, -3.4150390625, -3.103759765625, -2.79248046875, -2.481201171875, -2.169921875, -1.858642578125, -1.54736328125, -1.236083984375, -0.9248046875, -0.613525390625, -0.30224609375, 0.009033203125, 0.3203125, 0.631591796875, 0.94287109375, 1.254150390625, 1.5654296875, 1.876708984375, 2.18798828125, 2.499267578125, 2.810546875, 3.121826171875, 3.43310546875, 3.744384765625, 4.0556640625, 4.366943359375, 4.67822265625, 4.989501953125, 5.30078125, 5.612060546875, 5.92333984375, 6.234619140625, 6.5458984375, 6.857177734375, 7.16845703125, 7.479736328125, 7.791015625, 8.102294921875, 8.41357421875, 8.724853515625, 9.0361328125, 9.347412109375, 9.65869140625, 9.969970703125, 10.28125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 9.0, 13.0, 23.0, 31.0, 46.0, 55.0, 113.0, 220.0, 453.0, 1162.0, 4108.0, 23705.0, 260594.0, 667601.0, 77554.0, 9250.0, 2108.0, 745.0, 357.0, 165.0, 92.0, 59.0, 22.0, 23.0, 16.0, 7.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -2.97943115234375, -2.8455810546875, -2.71173095703125, -2.577880859375, -2.44403076171875, -2.3101806640625, -2.17633056640625, -2.04248046875, -1.90863037109375, -1.7747802734375, -1.64093017578125, -1.507080078125, -1.37322998046875, -1.2393798828125, -1.10552978515625, -0.9716796875, -0.83782958984375, -0.7039794921875, -0.57012939453125, -0.436279296875, -0.30242919921875, -0.1685791015625, -0.03472900390625, 0.09912109375, 0.23297119140625, 0.3668212890625, 0.50067138671875, 0.634521484375, 0.76837158203125, 0.9022216796875, 1.03607177734375, 1.169921875, 1.30377197265625, 1.4376220703125, 1.57147216796875, 1.705322265625, 1.83917236328125, 1.9730224609375, 2.10687255859375, 2.24072265625, 2.37457275390625, 2.5084228515625, 2.64227294921875, 2.776123046875, 2.90997314453125, 3.0438232421875, 3.17767333984375, 3.3115234375, 3.44537353515625, 3.5792236328125, 3.71307373046875, 3.846923828125, 3.98077392578125, 4.1146240234375, 4.24847412109375, 4.38232421875, 4.51617431640625, 4.6500244140625, 4.78387451171875, 4.917724609375, 5.05157470703125, 5.1854248046875, 5.31927490234375, 5.453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 1.0, 4.0, 2.0, 8.0, 7.0, 9.0, 12.0, 21.0, 19.0, 42.0, 40.0, 51.0, 69.0, 73.0, 79.0, 89.0, 88.0, 77.0, 60.0, 59.0, 51.0, 27.0, 22.0, 24.0, 17.0, 12.0, 8.0, 4.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006165504455566406, -0.0005993247032165527, -0.0005820989608764648, -0.000564873218536377, -0.0005476474761962891, -0.0005304217338562012, -0.0005131959915161133, -0.0004959702491760254, -0.0004787445068359375, -0.0004615187644958496, -0.0004442930221557617, -0.00042706727981567383, -0.00040984153747558594, -0.00039261579513549805, -0.00037539005279541016, -0.00035816431045532227, -0.0003409385681152344, -0.0003237128257751465, -0.0003064870834350586, -0.0002892613410949707, -0.0002720355987548828, -0.0002548098564147949, -0.00023758411407470703, -0.00022035837173461914, -0.00020313262939453125, -0.00018590688705444336, -0.00016868114471435547, -0.00015145540237426758, -0.0001342296600341797, -0.0001170039176940918, -9.97781753540039e-05, -8.255243301391602e-05, -6.532669067382812e-05, -4.8100948333740234e-05, -3.0875205993652344e-05, -1.3649463653564453e-05, 3.5762786865234375e-06, 2.0802021026611328e-05, 3.802776336669922e-05, 5.525350570678711e-05, 7.2479248046875e-05, 8.970499038696289e-05, 0.00010693073272705078, 0.00012415647506713867, 0.00014138221740722656, 0.00015860795974731445, 0.00017583370208740234, 0.00019305944442749023, 0.00021028518676757812, 0.00022751092910766602, 0.0002447366714477539, 0.0002619624137878418, 0.0002791881561279297, 0.0002964138984680176, 0.00031363964080810547, 0.00033086538314819336, 0.00034809112548828125, 0.00036531686782836914, 0.00038254261016845703, 0.0003997683525085449, 0.0004169940948486328, 0.0004342198371887207, 0.0004514455795288086, 0.0004686713218688965, 0.0004858970642089844]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 6.0, 13.0, 14.0, 30.0, 30.0, 48.0, 76.0, 109.0, 224.0, 431.0, 830.0, 1938.0, 5097.0, 17070.0, 81403.0, 446652.0, 399536.0, 71676.0, 15280.0, 4539.0, 1797.0, 859.0, 357.0, 215.0, 108.0, 72.0, 51.0, 28.0, 19.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.212890625, -3.089141845703125, -2.96539306640625, -2.841644287109375, -2.7178955078125, -2.594146728515625, -2.47039794921875, -2.346649169921875, -2.222900390625, -2.099151611328125, -1.97540283203125, -1.851654052734375, -1.7279052734375, -1.604156494140625, -1.48040771484375, -1.356658935546875, -1.23291015625, -1.109161376953125, -0.98541259765625, -0.861663818359375, -0.7379150390625, -0.614166259765625, -0.49041748046875, -0.366668701171875, -0.242919921875, -0.119171142578125, 0.00457763671875, 0.128326416015625, 0.2520751953125, 0.375823974609375, 0.49957275390625, 0.623321533203125, 0.7470703125, 0.870819091796875, 0.99456787109375, 1.118316650390625, 1.2420654296875, 1.365814208984375, 1.48956298828125, 1.613311767578125, 1.737060546875, 1.860809326171875, 1.98455810546875, 2.108306884765625, 2.2320556640625, 2.355804443359375, 2.47955322265625, 2.603302001953125, 2.72705078125, 2.850799560546875, 2.97454833984375, 3.098297119140625, 3.2220458984375, 3.345794677734375, 3.46954345703125, 3.593292236328125, 3.717041015625, 3.840789794921875, 3.96453857421875, 4.088287353515625, 4.2120361328125, 4.335784912109375, 4.45953369140625, 4.583282470703125, 4.70703125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 11.0, 7.0, 8.0, 12.0, 9.0, 29.0, 27.0, 31.0, 52.0, 60.0, 99.0, 90.0, 101.0, 107.0, 97.0, 65.0, 49.0, 41.0, 26.0, 28.0, 14.0, 13.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.9178466796875, -3.781005859375, -3.6441650390625, -3.50732421875, -3.3704833984375, -3.233642578125, -3.0968017578125, -2.9599609375, -2.8231201171875, -2.686279296875, -2.5494384765625, -2.41259765625, -2.2757568359375, -2.138916015625, -2.0020751953125, -1.865234375, -1.7283935546875, -1.591552734375, -1.4547119140625, -1.31787109375, -1.1810302734375, -1.044189453125, -0.9073486328125, -0.7705078125, -0.6336669921875, -0.496826171875, -0.3599853515625, -0.22314453125, -0.0863037109375, 0.050537109375, 0.1873779296875, 0.32421875, 0.4610595703125, 0.597900390625, 0.7347412109375, 0.87158203125, 1.0084228515625, 1.145263671875, 1.2821044921875, 1.4189453125, 1.5557861328125, 1.692626953125, 1.8294677734375, 1.96630859375, 2.1031494140625, 2.239990234375, 2.3768310546875, 2.513671875, 2.6505126953125, 2.787353515625, 2.9241943359375, 3.06103515625, 3.1978759765625, 3.334716796875, 3.4715576171875, 3.6083984375, 3.7452392578125, 3.882080078125, 4.0189208984375, 4.15576171875, 4.2926025390625, 4.429443359375, 4.5662841796875, 4.703125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 7.0, 3.0, 8.0, 27.0, 71.0, 141.0, 248.0, 244.0, 170.0, 43.0, 32.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-185.21636962890625, -181.73155212402344, -178.24673461914062, -174.7619171142578, -171.277099609375, -167.79226684570312, -164.3074493408203, -160.8226318359375, -157.3378143310547, -153.85299682617188, -150.36817932128906, -146.88336181640625, -143.39852905273438, -139.91371154785156, -136.42889404296875, -132.94407653808594, -129.45925903320312, -125.97444152832031, -122.4896240234375, -119.00479888916016, -115.51998138427734, -112.03516387939453, -108.55033874511719, -105.06552124023438, -101.58070373535156, -98.09588623046875, -94.61106872558594, -91.1262435913086, -87.64142608642578, -84.15660858154297, -80.67178344726562, -77.18696594238281, -73.70214080810547, -70.21732330322266, -66.73249816894531, -63.2476806640625, -59.76286315917969, -56.278045654296875, -52.7932243347168, -49.30840301513672, -45.823585510253906, -42.338768005371094, -38.853946685791016, -35.36912536621094, -31.884307861328125, -28.39948844909668, -24.914669036865234, -21.42984962463379, -17.945030212402344, -14.460210800170898, -10.975391387939453, -7.490571975708008, -4.0057525634765625, -0.5209331512451172, 2.963886260986328, 6.448705673217773, 9.933525085449219, 13.418344497680664, 16.90316390991211, 20.387983322143555, 23.872802734375, 27.357622146606445, 30.84244155883789, 34.32726287841797, 37.81208038330078]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 8.0, 4.0, 8.0, 8.0, 6.0, 13.0, 15.0, 20.0, 11.0, 18.0, 17.0, 19.0, 28.0, 36.0, 34.0, 39.0, 23.0, 38.0, 43.0, 52.0, 53.0, 38.0, 53.0, 44.0, 42.0, 30.0, 39.0, 58.0, 30.0, 33.0, 27.0, 19.0, 21.0, 17.0, 13.0, 9.0, 5.0, 7.0, 3.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-54.860511779785156, -53.23564147949219, -51.61076736450195, -49.985897064208984, -48.36102294921875, -46.73615264892578, -45.11128234863281, -43.48640823364258, -41.86153793334961, -40.23666763305664, -38.611793518066406, -36.98692321777344, -35.3620491027832, -33.737178802490234, -32.1123046875, -30.48743438720703, -28.86256217956543, -27.237689971923828, -25.612817764282227, -23.987945556640625, -22.363075256347656, -20.738203048706055, -19.113330841064453, -17.488460540771484, -15.863587379455566, -14.238715171813965, -12.61384391784668, -10.988971710205078, -9.364099502563477, -7.739228248596191, -6.11435604095459, -4.489484786987305, -2.864612579345703, -1.2397407293319702, 0.3851311206817627, 2.010003089904785, 3.6348748207092285, 5.259746551513672, 6.884618759155273, 8.509490013122559, 10.13436222076416, 11.759234428405762, 13.384105682373047, 15.008977890014648, 16.63385009765625, 18.25872039794922, 19.883594512939453, 21.508464813232422, 23.133337020874023, 24.758209228515625, 26.383081436157227, 28.007953643798828, 29.632823944091797, 31.2576961517334, 32.882568359375, 34.50743865966797, 36.1323127746582, 37.75718307495117, 39.382057189941406, 41.006927490234375, 42.63180160522461, 44.25667190551758, 45.88154602050781, 47.50641632080078, 49.13128662109375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 8.0, 9.0, 11.0, 23.0, 27.0, 40.0, 52.0, 67.0, 94.0, 159.0, 238.0, 408.0, 870.0, 2808.0, 16368.0, 3928066.0, 231627.0, 9578.0, 2012.0, 731.0, 367.0, 227.0, 145.0, 102.0, 55.0, 60.0, 42.0, 24.0, 17.0, 11.0, 6.0, 5.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.828125, -13.472412109375, -13.11669921875, -12.760986328125, -12.4052734375, -12.049560546875, -11.69384765625, -11.338134765625, -10.982421875, -10.626708984375, -10.27099609375, -9.915283203125, -9.5595703125, -9.203857421875, -8.84814453125, -8.492431640625, -8.13671875, -7.781005859375, -7.42529296875, -7.069580078125, -6.7138671875, -6.358154296875, -6.00244140625, -5.646728515625, -5.291015625, -4.935302734375, -4.57958984375, -4.223876953125, -3.8681640625, -3.512451171875, -3.15673828125, -2.801025390625, -2.4453125, -2.089599609375, -1.73388671875, -1.378173828125, -1.0224609375, -0.666748046875, -0.31103515625, 0.044677734375, 0.400390625, 0.756103515625, 1.11181640625, 1.467529296875, 1.8232421875, 2.178955078125, 2.53466796875, 2.890380859375, 3.24609375, 3.601806640625, 3.95751953125, 4.313232421875, 4.6689453125, 5.024658203125, 5.38037109375, 5.736083984375, 6.091796875, 6.447509765625, 6.80322265625, 7.158935546875, 7.5146484375, 7.870361328125, 8.22607421875, 8.581787109375, 8.9375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 10.0, 13.0, 9.0, 29.0, 17.0, 21.0, 30.0, 37.0, 38.0, 47.0, 47.0, 56.0, 35.0, 46.0, 44.0, 62.0, 51.0, 56.0, 45.0, 42.0, 38.0, 37.0, 31.0, 26.0, 18.0, 15.0, 12.0, 12.0, 7.0, 11.0, 5.0, 5.0, 4.0, 6.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.16796875, -2.095458984375, -2.02294921875, -1.950439453125, -1.8779296875, -1.805419921875, -1.73291015625, -1.660400390625, -1.587890625, -1.515380859375, -1.44287109375, -1.370361328125, -1.2978515625, -1.225341796875, -1.15283203125, -1.080322265625, -1.0078125, -0.935302734375, -0.86279296875, -0.790283203125, -0.7177734375, -0.645263671875, -0.57275390625, -0.500244140625, -0.427734375, -0.355224609375, -0.28271484375, -0.210205078125, -0.1376953125, -0.065185546875, 0.00732421875, 0.079833984375, 0.15234375, 0.224853515625, 0.29736328125, 0.369873046875, 0.4423828125, 0.514892578125, 0.58740234375, 0.659912109375, 0.732421875, 0.804931640625, 0.87744140625, 0.949951171875, 1.0224609375, 1.094970703125, 1.16748046875, 1.239990234375, 1.3125, 1.385009765625, 1.45751953125, 1.530029296875, 1.6025390625, 1.675048828125, 1.74755859375, 1.820068359375, 1.892578125, 1.965087890625, 2.03759765625, 2.110107421875, 2.1826171875, 2.255126953125, 2.32763671875, 2.400146484375, 2.47265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 15.0, 14.0, 31.0, 38.0, 49.0, 61.0, 82.0, 121.0, 124.0, 195.0, 294.0, 366.0, 635.0, 1158.0, 2364.0, 6742.0, 35628.0, 3426899.0, 681770.0, 27020.0, 5679.0, 2041.0, 1019.0, 581.0, 362.0, 242.0, 193.0, 141.0, 94.0, 88.0, 63.0, 33.0, 34.0, 21.0, 18.0, 10.0, 10.0, 9.0, 3.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1171875, -8.8316650390625, -8.546142578125, -8.2606201171875, -7.97509765625, -7.6895751953125, -7.404052734375, -7.1185302734375, -6.8330078125, -6.5474853515625, -6.261962890625, -5.9764404296875, -5.69091796875, -5.4053955078125, -5.119873046875, -4.8343505859375, -4.548828125, -4.2633056640625, -3.977783203125, -3.6922607421875, -3.40673828125, -3.1212158203125, -2.835693359375, -2.5501708984375, -2.2646484375, -1.9791259765625, -1.693603515625, -1.4080810546875, -1.12255859375, -0.8370361328125, -0.551513671875, -0.2659912109375, 0.01953125, 0.3050537109375, 0.590576171875, 0.8760986328125, 1.16162109375, 1.4471435546875, 1.732666015625, 2.0181884765625, 2.3037109375, 2.5892333984375, 2.874755859375, 3.1602783203125, 3.44580078125, 3.7313232421875, 4.016845703125, 4.3023681640625, 4.587890625, 4.8734130859375, 5.158935546875, 5.4444580078125, 5.72998046875, 6.0155029296875, 6.301025390625, 6.5865478515625, 6.8720703125, 7.1575927734375, 7.443115234375, 7.7286376953125, 8.01416015625, 8.2996826171875, 8.585205078125, 8.8707275390625, 9.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 10.0, 21.0, 61.0, 148.0, 948.0, 2535.0, 199.0, 65.0, 32.0, 14.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.685546875, -3.5979461669921875, -3.510345458984375, -3.4227447509765625, -3.33514404296875, -3.2475433349609375, -3.159942626953125, -3.0723419189453125, -2.9847412109375, -2.8971405029296875, -2.809539794921875, -2.7219390869140625, -2.63433837890625, -2.5467376708984375, -2.459136962890625, -2.3715362548828125, -2.283935546875, -2.1963348388671875, -2.108734130859375, -2.0211334228515625, -1.93353271484375, -1.8459320068359375, -1.758331298828125, -1.6707305908203125, -1.5831298828125, -1.4955291748046875, -1.407928466796875, -1.3203277587890625, -1.23272705078125, -1.1451263427734375, -1.057525634765625, -0.9699249267578125, -0.88232421875, -0.7947235107421875, -0.707122802734375, -0.6195220947265625, -0.53192138671875, -0.4443206787109375, -0.356719970703125, -0.2691192626953125, -0.1815185546875, -0.0939178466796875, -0.006317138671875, 0.0812835693359375, 0.16888427734375, 0.2564849853515625, 0.344085693359375, 0.4316864013671875, 0.519287109375, 0.6068878173828125, 0.694488525390625, 0.7820892333984375, 0.86968994140625, 0.9572906494140625, 1.044891357421875, 1.1324920654296875, 1.2200927734375, 1.3076934814453125, 1.395294189453125, 1.4828948974609375, 1.57049560546875, 1.6580963134765625, 1.745697021484375, 1.8332977294921875, 1.9208984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 5.0, 12.0, 12.0, 8.0, 22.0, 33.0, 45.0, 56.0, 69.0, 72.0, 75.0, 96.0, 97.0, 96.0, 69.0, 48.0, 49.0, 32.0, 30.0, 20.0, 16.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3749260902404785, -5.160675048828125, -4.94642448425293, -4.732173442840576, -4.517922878265381, -4.303671836853027, -4.089421272277832, -3.8751702308654785, -3.660919427871704, -3.4466686248779297, -3.2324178218841553, -3.018167018890381, -2.8039159774780273, -2.589665412902832, -2.3754143714904785, -2.161163568496704, -1.9469127655029297, -1.7326619625091553, -1.5184111595153809, -1.304160237312317, -1.0899094343185425, -0.8756586313247681, -0.6614077091217041, -0.4471569061279297, -0.23290610313415527, -0.01865527033805847, 0.19559556245803833, 0.4098464250564575, 0.6240972280502319, 0.8383480310440063, 1.0525989532470703, 1.2668497562408447, 1.4811010360717773, 1.6953518390655518, 1.9096026420593262, 2.1238536834716797, 2.338104248046875, 2.5523552894592285, 2.766606092453003, 2.9808568954467773, 3.1951076984405518, 3.409358501434326, 3.6236093044281006, 3.837860107421875, 4.0521111488342285, 4.266361713409424, 4.480612754821777, 4.694863319396973, 4.909114360809326, 5.12336540222168, 5.337615966796875, 5.5518670082092285, 5.766117572784424, 5.980368614196777, 6.194619178771973, 6.408870220184326, 6.62312126159668, 6.837372303009033, 7.0516228675842285, 7.265873908996582, 7.480124473571777, 7.694375514984131, 7.908626556396484, 8.12287712097168, 8.337127685546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 10.0, 9.0, 13.0, 18.0, 24.0, 12.0, 15.0, 19.0, 24.0, 34.0, 30.0, 39.0, 34.0, 30.0, 38.0, 40.0, 33.0, 42.0, 50.0, 37.0, 33.0, 36.0, 39.0, 46.0, 33.0, 32.0, 25.0, 27.0, 18.0, 17.0, 26.0, 21.0, 12.0, 11.0, 7.0, 9.0, 10.0, 4.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.16778564453125, -4.037766933441162, -3.907748222351074, -3.7777297496795654, -3.6477110385894775, -3.5176923274993896, -3.387673854827881, -3.257655143737793, -3.127636432647705, -2.997617721557617, -2.8675990104675293, -2.7375805377960205, -2.6075618267059326, -2.4775431156158447, -2.347524642944336, -2.217505931854248, -2.08748722076416, -1.9574685096740723, -1.827449917793274, -1.6974313259124756, -1.5674126148223877, -1.4373939037322998, -1.3073753118515015, -1.1773567199707031, -1.0473380088806152, -0.9173193573951721, -0.787300705909729, -0.6572820544242859, -0.5272634029388428, -0.39724475145339966, -0.26722609996795654, -0.13720744848251343, -0.0071887969970703125, 0.1228298544883728, 0.2528485059738159, 0.38286715745925903, 0.5128858089447021, 0.6429044604301453, 0.7729231119155884, 0.9029417634010315, 1.0329604148864746, 1.1629791259765625, 1.2929977178573608, 1.4230163097381592, 1.553035020828247, 1.683053731918335, 1.8130723237991333, 1.9430909156799316, 2.0731096267700195, 2.2031283378601074, 2.3331470489501953, 2.463165521621704, 2.593184232711792, 2.72320294380188, 2.8532214164733887, 2.9832401275634766, 3.1132588386535645, 3.2432775497436523, 3.3732962608337402, 3.503314733505249, 3.633333444595337, 3.763352155685425, 3.8933706283569336, 4.0233893394470215, 4.153408050537109]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 6.0, 14.0, 30.0, 30.0, 49.0, 64.0, 110.0, 149.0, 277.0, 436.0, 781.0, 1249.0, 2356.0, 4411.0, 8797.0, 19028.0, 43574.0, 105266.0, 235062.0, 306462.0, 182085.0, 76857.0, 31927.0, 14481.0, 6967.0, 3546.0, 1894.0, 1018.0, 607.0, 365.0, 229.0, 134.0, 79.0, 59.0, 42.0, 16.0, 25.0, 13.0, 15.0, 10.0, 4.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.408203125, -3.295806884765625, -3.18341064453125, -3.071014404296875, -2.9586181640625, -2.846221923828125, -2.73382568359375, -2.621429443359375, -2.509033203125, -2.396636962890625, -2.28424072265625, -2.171844482421875, -2.0594482421875, -1.947052001953125, -1.83465576171875, -1.722259521484375, -1.60986328125, -1.497467041015625, -1.38507080078125, -1.272674560546875, -1.1602783203125, -1.047882080078125, -0.93548583984375, -0.823089599609375, -0.710693359375, -0.598297119140625, -0.48590087890625, -0.373504638671875, -0.2611083984375, -0.148712158203125, -0.03631591796875, 0.076080322265625, 0.1884765625, 0.300872802734375, 0.41326904296875, 0.525665283203125, 0.6380615234375, 0.750457763671875, 0.86285400390625, 0.975250244140625, 1.087646484375, 1.200042724609375, 1.31243896484375, 1.424835205078125, 1.5372314453125, 1.649627685546875, 1.76202392578125, 1.874420166015625, 1.98681640625, 2.099212646484375, 2.21160888671875, 2.324005126953125, 2.4364013671875, 2.548797607421875, 2.66119384765625, 2.773590087890625, 2.885986328125, 2.998382568359375, 3.11077880859375, 3.223175048828125, 3.3355712890625, 3.447967529296875, 3.56036376953125, 3.672760009765625, 3.78515625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 5.0, 6.0, 11.0, 16.0, 24.0, 35.0, 23.0, 31.0, 30.0, 34.0, 37.0, 47.0, 38.0, 50.0, 63.0, 43.0, 59.0, 45.0, 57.0, 50.0, 35.0, 41.0, 22.0, 26.0, 35.0, 19.0, 17.0, 15.0, 12.0, 10.0, 6.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.375, -2.294830322265625, -2.21466064453125, -2.134490966796875, -2.0543212890625, -1.974151611328125, -1.89398193359375, -1.813812255859375, -1.733642578125, -1.653472900390625, -1.57330322265625, -1.493133544921875, -1.4129638671875, -1.332794189453125, -1.25262451171875, -1.172454833984375, -1.09228515625, -1.012115478515625, -0.93194580078125, -0.851776123046875, -0.7716064453125, -0.691436767578125, -0.61126708984375, -0.531097412109375, -0.450927734375, -0.370758056640625, -0.29058837890625, -0.210418701171875, -0.1302490234375, -0.050079345703125, 0.03009033203125, 0.110260009765625, 0.1904296875, 0.270599365234375, 0.35076904296875, 0.430938720703125, 0.5111083984375, 0.591278076171875, 0.67144775390625, 0.751617431640625, 0.831787109375, 0.911956787109375, 0.99212646484375, 1.072296142578125, 1.1524658203125, 1.232635498046875, 1.31280517578125, 1.392974853515625, 1.47314453125, 1.553314208984375, 1.63348388671875, 1.713653564453125, 1.7938232421875, 1.873992919921875, 1.95416259765625, 2.034332275390625, 2.114501953125, 2.194671630859375, 2.27484130859375, 2.355010986328125, 2.4351806640625, 2.515350341796875, 2.59552001953125, 2.675689697265625, 2.755859375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 9.0, 12.0, 18.0, 15.0, 21.0, 53.0, 87.0, 147.0, 317.0, 742.0, 2121.0, 9118.0, 73638.0, 778994.0, 163180.0, 15130.0, 3120.0, 972.0, 432.0, 184.0, 90.0, 54.0, 23.0, 24.0, 6.0, 14.0, 4.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-15.1171875, -14.73583984375, -14.3544921875, -13.97314453125, -13.591796875, -13.21044921875, -12.8291015625, -12.44775390625, -12.06640625, -11.68505859375, -11.3037109375, -10.92236328125, -10.541015625, -10.15966796875, -9.7783203125, -9.39697265625, -9.015625, -8.63427734375, -8.2529296875, -7.87158203125, -7.490234375, -7.10888671875, -6.7275390625, -6.34619140625, -5.96484375, -5.58349609375, -5.2021484375, -4.82080078125, -4.439453125, -4.05810546875, -3.6767578125, -3.29541015625, -2.9140625, -2.53271484375, -2.1513671875, -1.77001953125, -1.388671875, -1.00732421875, -0.6259765625, -0.24462890625, 0.13671875, 0.51806640625, 0.8994140625, 1.28076171875, 1.662109375, 2.04345703125, 2.4248046875, 2.80615234375, 3.1875, 3.56884765625, 3.9501953125, 4.33154296875, 4.712890625, 5.09423828125, 5.4755859375, 5.85693359375, 6.23828125, 6.61962890625, 7.0009765625, 7.38232421875, 7.763671875, 8.14501953125, 8.5263671875, 8.90771484375, 9.2890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 10.0, 6.0, 10.0, 5.0, 10.0, 17.0, 16.0, 26.0, 37.0, 25.0, 40.0, 43.0, 35.0, 39.0, 54.0, 60.0, 56.0, 47.0, 43.0, 57.0, 45.0, 58.0, 36.0, 32.0, 27.0, 19.0, 26.0, 19.0, 22.0, 10.0, 13.0, 9.0, 3.0, 10.0, 5.0, 8.0, 3.0, 2.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.305908203125, -10.89306640625, -10.480224609375, -10.0673828125, -9.654541015625, -9.24169921875, -8.828857421875, -8.416015625, -8.003173828125, -7.59033203125, -7.177490234375, -6.7646484375, -6.351806640625, -5.93896484375, -5.526123046875, -5.11328125, -4.700439453125, -4.28759765625, -3.874755859375, -3.4619140625, -3.049072265625, -2.63623046875, -2.223388671875, -1.810546875, -1.397705078125, -0.98486328125, -0.572021484375, -0.1591796875, 0.253662109375, 0.66650390625, 1.079345703125, 1.4921875, 1.905029296875, 2.31787109375, 2.730712890625, 3.1435546875, 3.556396484375, 3.96923828125, 4.382080078125, 4.794921875, 5.207763671875, 5.62060546875, 6.033447265625, 6.4462890625, 6.859130859375, 7.27197265625, 7.684814453125, 8.09765625, 8.510498046875, 8.92333984375, 9.336181640625, 9.7490234375, 10.161865234375, 10.57470703125, 10.987548828125, 11.400390625, 11.813232421875, 12.22607421875, 12.638916015625, 13.0517578125, 13.464599609375, 13.87744140625, 14.290283203125, 14.703125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 10.0, 4.0, 7.0, 18.0, 20.0, 31.0, 64.0, 136.0, 323.0, 946.0, 6177.0, 310971.0, 717419.0, 10440.0, 1286.0, 371.0, 134.0, 80.0, 44.0, 23.0, 11.0, 13.0, 7.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.30078125, -6.015625, -5.73046875, -5.4453125, -5.16015625, -4.875, -4.58984375, -4.3046875, -4.01953125, -3.734375, -3.44921875, -3.1640625, -2.87890625, -2.59375, -2.30859375, -2.0234375, -1.73828125, -1.453125, -1.16796875, -0.8828125, -0.59765625, -0.3125, -0.02734375, 0.2578125, 0.54296875, 0.828125, 1.11328125, 1.3984375, 1.68359375, 1.96875, 2.25390625, 2.5390625, 2.82421875, 3.109375, 3.39453125, 3.6796875, 3.96484375, 4.25, 4.53515625, 4.8203125, 5.10546875, 5.390625, 5.67578125, 5.9609375, 6.24609375, 6.53125, 6.81640625, 7.1015625, 7.38671875, 7.671875, 7.95703125, 8.2421875, 8.52734375, 8.8125, 9.09765625, 9.3828125, 9.66796875, 9.953125, 10.23828125, 10.5234375, 10.80859375, 11.09375, 11.37890625, 11.6640625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 8.0, 8.0, 6.0, 7.0, 14.0, 24.0, 23.0, 35.0, 51.0, 36.0, 58.0, 65.0, 70.0, 98.0, 85.0, 82.0, 49.0, 58.0, 36.0, 41.0, 29.0, 17.0, 26.0, 13.0, 8.0, 11.0, 3.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0005383491516113281, -0.0005203932523727417, -0.0005024373531341553, -0.00048448145389556885, -0.0004665255546569824, -0.000448569655418396, -0.00043061375617980957, -0.00041265785694122314, -0.0003947019577026367, -0.0003767460584640503, -0.00035879015922546387, -0.00034083425998687744, -0.000322878360748291, -0.0003049224615097046, -0.00028696656227111816, -0.00026901066303253174, -0.0002510547637939453, -0.0002330988645553589, -0.00021514296531677246, -0.00019718706607818604, -0.0001792311668395996, -0.00016127526760101318, -0.00014331936836242676, -0.00012536346912384033, -0.0001074075698852539, -8.945167064666748e-05, -7.149577140808105e-05, -5.353987216949463e-05, -3.55839729309082e-05, -1.7628073692321777e-05, 3.2782554626464844e-07, 1.8283724784851074e-05, 3.62396240234375e-05, 5.4195523262023926e-05, 7.215142250061035e-05, 9.010732173919678e-05, 0.0001080632209777832, 0.00012601912021636963, 0.00014397501945495605, 0.00016193091869354248, 0.0001798868179321289, 0.00019784271717071533, 0.00021579861640930176, 0.00023375451564788818, 0.0002517104148864746, 0.00026966631412506104, 0.00028762221336364746, 0.0003055781126022339, 0.0003235340118408203, 0.00034148991107940674, 0.00035944581031799316, 0.0003774017095565796, 0.000395357608795166, 0.00041331350803375244, 0.00043126940727233887, 0.0004492253065109253, 0.0004671812057495117, 0.00048513710498809814, 0.0005030930042266846, 0.000521048903465271, 0.0005390048027038574, 0.0005569607019424438, 0.0005749166011810303, 0.0005928725004196167, 0.0006108283996582031]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 8.0, 16.0, 16.0, 35.0, 65.0, 100.0, 195.0, 499.0, 1953.0, 19731.0, 860087.0, 158596.0, 5710.0, 874.0, 310.0, 142.0, 85.0, 47.0, 33.0, 14.0, 9.0, 5.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.63818359375, -8.3154296875, -7.99267578125, -7.669921875, -7.34716796875, -7.0244140625, -6.70166015625, -6.37890625, -6.05615234375, -5.7333984375, -5.41064453125, -5.087890625, -4.76513671875, -4.4423828125, -4.11962890625, -3.796875, -3.47412109375, -3.1513671875, -2.82861328125, -2.505859375, -2.18310546875, -1.8603515625, -1.53759765625, -1.21484375, -0.89208984375, -0.5693359375, -0.24658203125, 0.076171875, 0.39892578125, 0.7216796875, 1.04443359375, 1.3671875, 1.68994140625, 2.0126953125, 2.33544921875, 2.658203125, 2.98095703125, 3.3037109375, 3.62646484375, 3.94921875, 4.27197265625, 4.5947265625, 4.91748046875, 5.240234375, 5.56298828125, 5.8857421875, 6.20849609375, 6.53125, 6.85400390625, 7.1767578125, 7.49951171875, 7.822265625, 8.14501953125, 8.4677734375, 8.79052734375, 9.11328125, 9.43603515625, 9.7587890625, 10.08154296875, 10.404296875, 10.72705078125, 11.0498046875, 11.37255859375, 11.6953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 15.0, 21.0, 45.0, 69.0, 72.0, 85.0, 112.0, 146.0, 118.0, 88.0, 74.0, 57.0, 22.0, 19.0, 16.0, 4.0, 3.0, 7.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.38623046875, -5.2294921875, -5.07275390625, -4.916015625, -4.75927734375, -4.6025390625, -4.44580078125, -4.2890625, -4.13232421875, -3.9755859375, -3.81884765625, -3.662109375, -3.50537109375, -3.3486328125, -3.19189453125, -3.03515625, -2.87841796875, -2.7216796875, -2.56494140625, -2.408203125, -2.25146484375, -2.0947265625, -1.93798828125, -1.78125, -1.62451171875, -1.4677734375, -1.31103515625, -1.154296875, -0.99755859375, -0.8408203125, -0.68408203125, -0.52734375, -0.37060546875, -0.2138671875, -0.05712890625, 0.099609375, 0.25634765625, 0.4130859375, 0.56982421875, 0.7265625, 0.88330078125, 1.0400390625, 1.19677734375, 1.353515625, 1.51025390625, 1.6669921875, 1.82373046875, 1.98046875, 2.13720703125, 2.2939453125, 2.45068359375, 2.607421875, 2.76416015625, 2.9208984375, 3.07763671875, 3.234375, 3.39111328125, 3.5478515625, 3.70458984375, 3.861328125, 4.01806640625, 4.1748046875, 4.33154296875, 4.48828125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 15.0, 32.0, 46.0, 95.0, 147.0, 201.0, 180.0, 124.0, 70.0, 36.0, 19.0, 10.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.8558349609375, -60.21604537963867, -57.57625961303711, -54.93647003173828, -52.29668426513672, -49.65689468383789, -47.01710510253906, -44.3773193359375, -41.73752975463867, -39.097740173339844, -36.45795440673828, -33.81816482543945, -31.178377151489258, -28.538589477539062, -25.898799896240234, -23.25901222229004, -20.619224548339844, -17.97943687438965, -15.339648246765137, -12.699859619140625, -10.06007194519043, -7.420284271240234, -4.780495643615723, -2.140707015991211, 0.4990806579589844, 3.138868808746338, 5.778656959533691, 8.418445587158203, 11.058233261108398, 13.698020935058594, 16.337810516357422, 18.977598190307617, 21.617385864257812, 24.257173538208008, 26.896961212158203, 29.53675079345703, 32.176536560058594, 34.81632614135742, 37.45611572265625, 40.09590148925781, 42.73569107055664, 45.37548065185547, 48.01526641845703, 50.65505599975586, 53.29484558105469, 55.93463134765625, 58.57442092895508, 61.214210510253906, 63.85399627685547, 66.49378204345703, 69.13357543945312, 71.77336120605469, 74.41314697265625, 77.05293273925781, 79.6927261352539, 82.33251190185547, 84.97230529785156, 87.61209106445312, 90.25188446044922, 92.89167022705078, 95.53145599365234, 98.17124938964844, 100.81103515625, 103.45082092285156, 106.09060668945312]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 5.0, 6.0, 3.0, 7.0, 12.0, 10.0, 8.0, 16.0, 11.0, 16.0, 30.0, 18.0, 32.0, 38.0, 34.0, 38.0, 60.0, 49.0, 47.0, 58.0, 63.0, 49.0, 58.0, 40.0, 45.0, 35.0, 33.0, 32.0, 24.0, 24.0, 24.0, 13.0, 17.0, 5.0, 4.0, 7.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.33013153076172, -53.39470672607422, -51.45928192138672, -49.52385711669922, -47.58843231201172, -45.65300750732422, -43.71758270263672, -41.78215408325195, -39.84672927856445, -37.91130447387695, -35.97587966918945, -34.04045486450195, -32.10503005981445, -30.16960334777832, -28.23417854309082, -26.298751831054688, -24.36332893371582, -22.42790412902832, -20.49247932434082, -18.557052612304688, -16.621627807617188, -14.686203002929688, -12.750778198242188, -10.815352439880371, -8.879927635192871, -6.944502353668213, -5.009077072143555, -3.0736522674560547, -1.1382269859313965, 0.7971982955932617, 2.7326231002807617, 4.668048858642578, 6.603473663330078, 8.538898468017578, 10.474324226379395, 12.409749031066895, 14.345174789428711, 16.28059959411621, 18.21602439880371, 20.151451110839844, 22.086875915527344, 24.022300720214844, 25.957725524902344, 27.893150329589844, 29.828577041625977, 31.764001846313477, 33.699424743652344, 35.63485336303711, 37.570274353027344, 39.505699157714844, 41.441123962402344, 43.376548767089844, 45.311973571777344, 47.247398376464844, 49.182823181152344, 51.11825180053711, 53.05367660522461, 54.98910140991211, 56.92452621459961, 58.85995101928711, 60.79537582397461, 62.730804443359375, 64.66622924804688, 66.60165405273438, 68.53707885742188]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 16.0, 26.0, 26.0, 37.0, 53.0, 63.0, 85.0, 133.0, 164.0, 402.0, 779.0, 2025.0, 6631.0, 36221.0, 4037939.0, 93226.0, 11167.0, 3038.0, 1076.0, 437.0, 224.0, 132.0, 82.0, 58.0, 55.0, 47.0, 22.0, 26.0, 15.0, 11.0, 10.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.1640625, -8.9141845703125, -8.664306640625, -8.4144287109375, -8.16455078125, -7.9146728515625, -7.664794921875, -7.4149169921875, -7.1650390625, -6.9151611328125, -6.665283203125, -6.4154052734375, -6.16552734375, -5.9156494140625, -5.665771484375, -5.4158935546875, -5.166015625, -4.9161376953125, -4.666259765625, -4.4163818359375, -4.16650390625, -3.9166259765625, -3.666748046875, -3.4168701171875, -3.1669921875, -2.9171142578125, -2.667236328125, -2.4173583984375, -2.16748046875, -1.9176025390625, -1.667724609375, -1.4178466796875, -1.16796875, -0.9180908203125, -0.668212890625, -0.4183349609375, -0.16845703125, 0.0814208984375, 0.331298828125, 0.5811767578125, 0.8310546875, 1.0809326171875, 1.330810546875, 1.5806884765625, 1.83056640625, 2.0804443359375, 2.330322265625, 2.5802001953125, 2.830078125, 3.0799560546875, 3.329833984375, 3.5797119140625, 3.82958984375, 4.0794677734375, 4.329345703125, 4.5792236328125, 4.8291015625, 5.0789794921875, 5.328857421875, 5.5787353515625, 5.82861328125, 6.0784912109375, 6.328369140625, 6.5782470703125, 6.828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 12.0, 27.0, 20.0, 21.0, 35.0, 30.0, 43.0, 36.0, 55.0, 60.0, 64.0, 62.0, 59.0, 59.0, 57.0, 48.0, 50.0, 48.0, 43.0, 29.0, 26.0, 22.0, 20.0, 9.0, 13.0, 9.0, 6.0, 0.0, 2.0, 1.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.814453125, -3.714874267578125, -3.61529541015625, -3.515716552734375, -3.4161376953125, -3.316558837890625, -3.21697998046875, -3.117401123046875, -3.017822265625, -2.918243408203125, -2.81866455078125, -2.719085693359375, -2.6195068359375, -2.519927978515625, -2.42034912109375, -2.320770263671875, -2.22119140625, -2.121612548828125, -2.02203369140625, -1.922454833984375, -1.8228759765625, -1.723297119140625, -1.62371826171875, -1.524139404296875, -1.424560546875, -1.324981689453125, -1.22540283203125, -1.125823974609375, -1.0262451171875, -0.926666259765625, -0.82708740234375, -0.727508544921875, -0.6279296875, -0.528350830078125, -0.42877197265625, -0.329193115234375, -0.2296142578125, -0.130035400390625, -0.03045654296875, 0.069122314453125, 0.168701171875, 0.268280029296875, 0.36785888671875, 0.467437744140625, 0.5670166015625, 0.666595458984375, 0.76617431640625, 0.865753173828125, 0.96533203125, 1.064910888671875, 1.16448974609375, 1.264068603515625, 1.3636474609375, 1.463226318359375, 1.56280517578125, 1.662384033203125, 1.761962890625, 1.861541748046875, 1.96112060546875, 2.060699462890625, 2.1602783203125, 2.259857177734375, 2.35943603515625, 2.459014892578125, 2.55859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 4.0, 16.0, 16.0, 21.0, 25.0, 26.0, 35.0, 57.0, 69.0, 85.0, 90.0, 131.0, 155.0, 229.0, 342.0, 768.0, 2631.0, 18486.0, 3988428.0, 171821.0, 7770.0, 1457.0, 498.0, 273.0, 174.0, 148.0, 103.0, 86.0, 89.0, 56.0, 32.0, 25.0, 27.0, 19.0, 17.0, 16.0, 15.0, 8.0, 6.0, 5.0, 5.0, 10.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.260498046875, -11.84912109375, -11.437744140625, -11.0263671875, -10.614990234375, -10.20361328125, -9.792236328125, -9.380859375, -8.969482421875, -8.55810546875, -8.146728515625, -7.7353515625, -7.323974609375, -6.91259765625, -6.501220703125, -6.08984375, -5.678466796875, -5.26708984375, -4.855712890625, -4.4443359375, -4.032958984375, -3.62158203125, -3.210205078125, -2.798828125, -2.387451171875, -1.97607421875, -1.564697265625, -1.1533203125, -0.741943359375, -0.33056640625, 0.080810546875, 0.4921875, 0.903564453125, 1.31494140625, 1.726318359375, 2.1376953125, 2.549072265625, 2.96044921875, 3.371826171875, 3.783203125, 4.194580078125, 4.60595703125, 5.017333984375, 5.4287109375, 5.840087890625, 6.25146484375, 6.662841796875, 7.07421875, 7.485595703125, 7.89697265625, 8.308349609375, 8.7197265625, 9.131103515625, 9.54248046875, 9.953857421875, 10.365234375, 10.776611328125, 11.18798828125, 11.599365234375, 12.0107421875, 12.422119140625, 12.83349609375, 13.244873046875, 13.65625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 13.0, 20.0, 116.0, 3205.0, 586.0, 97.0, 25.0, 9.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.97265625, -3.851715087890625, -3.73077392578125, -3.609832763671875, -3.4888916015625, -3.367950439453125, -3.24700927734375, -3.126068115234375, -3.005126953125, -2.884185791015625, -2.76324462890625, -2.642303466796875, -2.5213623046875, -2.400421142578125, -2.27947998046875, -2.158538818359375, -2.03759765625, -1.916656494140625, -1.79571533203125, -1.674774169921875, -1.5538330078125, -1.432891845703125, -1.31195068359375, -1.191009521484375, -1.070068359375, -0.949127197265625, -0.82818603515625, -0.707244873046875, -0.5863037109375, -0.465362548828125, -0.34442138671875, -0.223480224609375, -0.1025390625, 0.018402099609375, 0.13934326171875, 0.260284423828125, 0.3812255859375, 0.502166748046875, 0.62310791015625, 0.744049072265625, 0.864990234375, 0.985931396484375, 1.10687255859375, 1.227813720703125, 1.3487548828125, 1.469696044921875, 1.59063720703125, 1.711578369140625, 1.83251953125, 1.953460693359375, 2.07440185546875, 2.195343017578125, 2.3162841796875, 2.437225341796875, 2.55816650390625, 2.679107666015625, 2.800048828125, 2.920989990234375, 3.04193115234375, 3.162872314453125, 3.2838134765625, 3.404754638671875, 3.52569580078125, 3.646636962890625, 3.767578125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 5.0, 16.0, 11.0, 24.0, 38.0, 56.0, 78.0, 94.0, 110.0, 111.0, 100.0, 89.0, 64.0, 61.0, 28.0, 28.0, 15.0, 14.0, 11.0, 8.0, 11.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.840864658355713, -4.631157398223877, -4.421449661254883, -4.211742401123047, -4.002034664154053, -3.792327404022217, -3.5826199054718018, -3.3729124069213867, -3.1632049083709717, -2.9534974098205566, -2.7437899112701416, -2.5340824127197266, -2.3243751525878906, -2.1146674156188965, -1.9049601554870605, -1.6952526569366455, -1.4855451583862305, -1.2758376598358154, -1.0661301612854004, -0.8564227819442749, -0.6467152833938599, -0.4370077848434448, -0.22730040550231934, -0.017592906951904297, 0.19211459159851074, 0.4018220603466034, 0.611529529094696, 0.8212369680404663, 1.0309444665908813, 1.2406519651412964, 1.4503593444824219, 1.660066843032837, 1.8697738647460938, 2.079481363296509, 2.289188861846924, 2.4988961219787598, 2.708603858947754, 2.91831111907959, 3.128018617630005, 3.33772611618042, 3.547433614730835, 3.75714111328125, 3.966848611831665, 4.17655611038208, 4.386263370513916, 4.59597110748291, 4.805678367614746, 5.015385627746582, 5.225093364715576, 5.434800624847412, 5.644508361816406, 5.854215621948242, 6.063923358917236, 6.273630619049072, 6.483338356018066, 6.693045616149902, 6.902752876281738, 7.112460136413574, 7.322167873382568, 7.531875133514404, 7.741582870483398, 7.951290130615234, 8.16099739074707, 8.370704650878906, 8.580412864685059]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 7.0, 13.0, 9.0, 8.0, 16.0, 17.0, 25.0, 20.0, 25.0, 26.0, 30.0, 30.0, 32.0, 45.0, 46.0, 43.0, 36.0, 48.0, 47.0, 44.0, 46.0, 47.0, 29.0, 34.0, 31.0, 40.0, 26.0, 32.0, 38.0, 18.0, 14.0, 14.0, 10.0, 14.0, 8.0, 5.0, 2.0, 4.0, 0.0, 3.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0], "bins": [-4.488011360168457, -4.360357284545898, -4.23270320892334, -4.105049133300781, -3.9773948192596436, -3.849740743637085, -3.7220864295959473, -3.5944323539733887, -3.46677827835083, -3.3391242027282715, -3.211470127105713, -3.083815813064575, -2.9561617374420166, -2.828507661819458, -2.7008533477783203, -2.5731992721557617, -2.445545196533203, -2.3178911209106445, -2.190237045288086, -2.0625827312469482, -1.9349286556243896, -1.807274580001831, -1.679620385169983, -1.5519661903381348, -1.4243121147155762, -1.2966580390930176, -1.1690038442611694, -1.0413496494293213, -0.9136955738067627, -0.7860414385795593, -0.658387303352356, -0.5307331681251526, -0.4030790328979492, -0.27542489767074585, -0.14777076244354248, -0.02011662721633911, 0.10753750801086426, 0.23519164323806763, 0.362845778465271, 0.49049991369247437, 0.6181540489196777, 0.7458081841468811, 0.8734623193740845, 1.0011165142059326, 1.1287705898284912, 1.2564246654510498, 1.384078860282898, 1.511733055114746, 1.6393871307373047, 1.7670412063598633, 1.8946954011917114, 2.0223495960235596, 2.150003671646118, 2.2776577472686768, 2.4053120613098145, 2.532966136932373, 2.6606202125549316, 2.7882742881774902, 2.915928363800049, 3.0435826778411865, 3.171236753463745, 3.2988908290863037, 3.4265451431274414, 3.55419921875, 3.6818532943725586]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 5.0, 12.0, 15.0, 18.0, 29.0, 48.0, 54.0, 85.0, 139.0, 200.0, 357.0, 527.0, 1015.0, 1909.0, 3553.0, 6872.0, 14385.0, 31185.0, 69326.0, 151379.0, 273409.0, 252669.0, 130361.0, 59074.0, 26661.0, 12363.0, 6016.0, 3015.0, 1671.0, 836.0, 477.0, 301.0, 185.0, 127.0, 78.0, 62.0, 38.0, 31.0, 18.0, 18.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.015625, -2.91802978515625, -2.8204345703125, -2.72283935546875, -2.625244140625, -2.52764892578125, -2.4300537109375, -2.33245849609375, -2.23486328125, -2.13726806640625, -2.0396728515625, -1.94207763671875, -1.844482421875, -1.74688720703125, -1.6492919921875, -1.55169677734375, -1.4541015625, -1.35650634765625, -1.2589111328125, -1.16131591796875, -1.063720703125, -0.96612548828125, -0.8685302734375, -0.77093505859375, -0.67333984375, -0.57574462890625, -0.4781494140625, -0.38055419921875, -0.282958984375, -0.18536376953125, -0.0877685546875, 0.00982666015625, 0.107421875, 0.20501708984375, 0.3026123046875, 0.40020751953125, 0.497802734375, 0.59539794921875, 0.6929931640625, 0.79058837890625, 0.88818359375, 0.98577880859375, 1.0833740234375, 1.18096923828125, 1.278564453125, 1.37615966796875, 1.4737548828125, 1.57135009765625, 1.6689453125, 1.76654052734375, 1.8641357421875, 1.96173095703125, 2.059326171875, 2.15692138671875, 2.2545166015625, 2.35211181640625, 2.44970703125, 2.54730224609375, 2.6448974609375, 2.74249267578125, 2.840087890625, 2.93768310546875, 3.0352783203125, 3.13287353515625, 3.23046875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 9.0, 7.0, 9.0, 26.0, 22.0, 29.0, 19.0, 38.0, 28.0, 45.0, 61.0, 67.0, 43.0, 61.0, 62.0, 52.0, 57.0, 60.0, 55.0, 44.0, 45.0, 40.0, 31.0, 18.0, 17.0, 9.0, 10.0, 10.0, 10.0, 2.0, 7.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.876953125, -3.768096923828125, -3.65924072265625, -3.550384521484375, -3.4415283203125, -3.332672119140625, -3.22381591796875, -3.114959716796875, -3.006103515625, -2.897247314453125, -2.78839111328125, -2.679534912109375, -2.5706787109375, -2.461822509765625, -2.35296630859375, -2.244110107421875, -2.13525390625, -2.026397705078125, -1.91754150390625, -1.808685302734375, -1.6998291015625, -1.590972900390625, -1.48211669921875, -1.373260498046875, -1.264404296875, -1.155548095703125, -1.04669189453125, -0.937835693359375, -0.8289794921875, -0.720123291015625, -0.61126708984375, -0.502410888671875, -0.3935546875, -0.284698486328125, -0.17584228515625, -0.066986083984375, 0.0418701171875, 0.150726318359375, 0.25958251953125, 0.368438720703125, 0.477294921875, 0.586151123046875, 0.69500732421875, 0.803863525390625, 0.9127197265625, 1.021575927734375, 1.13043212890625, 1.239288330078125, 1.34814453125, 1.457000732421875, 1.56585693359375, 1.674713134765625, 1.7835693359375, 1.892425537109375, 2.00128173828125, 2.110137939453125, 2.218994140625, 2.327850341796875, 2.43670654296875, 2.545562744140625, 2.6544189453125, 2.763275146484375, 2.87213134765625, 2.980987548828125, 3.08984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 5.0, 3.0, 8.0, 26.0, 38.0, 60.0, 148.0, 444.0, 2348.0, 48484.0, 965298.0, 29281.0, 1740.0, 424.0, 98.0, 61.0, 26.0, 9.0, 13.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.59375, -19.917236328125, -19.24072265625, -18.564208984375, -17.8876953125, -17.211181640625, -16.53466796875, -15.858154296875, -15.181640625, -14.505126953125, -13.82861328125, -13.152099609375, -12.4755859375, -11.799072265625, -11.12255859375, -10.446044921875, -9.76953125, -9.093017578125, -8.41650390625, -7.739990234375, -7.0634765625, -6.386962890625, -5.71044921875, -5.033935546875, -4.357421875, -3.680908203125, -3.00439453125, -2.327880859375, -1.6513671875, -0.974853515625, -0.29833984375, 0.378173828125, 1.0546875, 1.731201171875, 2.40771484375, 3.084228515625, 3.7607421875, 4.437255859375, 5.11376953125, 5.790283203125, 6.466796875, 7.143310546875, 7.81982421875, 8.496337890625, 9.1728515625, 9.849365234375, 10.52587890625, 11.202392578125, 11.87890625, 12.555419921875, 13.23193359375, 13.908447265625, 14.5849609375, 15.261474609375, 15.93798828125, 16.614501953125, 17.291015625, 17.967529296875, 18.64404296875, 19.320556640625, 19.9970703125, 20.673583984375, 21.35009765625, 22.026611328125, 22.703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 9.0, 12.0, 17.0, 21.0, 14.0, 29.0, 27.0, 32.0, 33.0, 54.0, 54.0, 54.0, 46.0, 57.0, 52.0, 54.0, 53.0, 58.0, 51.0, 35.0, 40.0, 33.0, 35.0, 28.0, 14.0, 14.0, 15.0, 12.0, 9.0, 9.0, 13.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25, -17.74560546875, -17.2412109375, -16.73681640625, -16.232421875, -15.72802734375, -15.2236328125, -14.71923828125, -14.21484375, -13.71044921875, -13.2060546875, -12.70166015625, -12.197265625, -11.69287109375, -11.1884765625, -10.68408203125, -10.1796875, -9.67529296875, -9.1708984375, -8.66650390625, -8.162109375, -7.65771484375, -7.1533203125, -6.64892578125, -6.14453125, -5.64013671875, -5.1357421875, -4.63134765625, -4.126953125, -3.62255859375, -3.1181640625, -2.61376953125, -2.109375, -1.60498046875, -1.1005859375, -0.59619140625, -0.091796875, 0.41259765625, 0.9169921875, 1.42138671875, 1.92578125, 2.43017578125, 2.9345703125, 3.43896484375, 3.943359375, 4.44775390625, 4.9521484375, 5.45654296875, 5.9609375, 6.46533203125, 6.9697265625, 7.47412109375, 7.978515625, 8.48291015625, 8.9873046875, 9.49169921875, 9.99609375, 10.50048828125, 11.0048828125, 11.50927734375, 12.013671875, 12.51806640625, 13.0224609375, 13.52685546875, 14.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 9.0, 14.0, 28.0, 56.0, 166.0, 520.0, 3366.0, 804195.0, 237333.0, 2233.0, 403.0, 130.0, 52.0, 17.0, 10.0, 10.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.2283935546875, -15.831787109375, -15.4351806640625, -15.03857421875, -14.6419677734375, -14.245361328125, -13.8487548828125, -13.4521484375, -13.0555419921875, -12.658935546875, -12.2623291015625, -11.86572265625, -11.4691162109375, -11.072509765625, -10.6759033203125, -10.279296875, -9.8826904296875, -9.486083984375, -9.0894775390625, -8.69287109375, -8.2962646484375, -7.899658203125, -7.5030517578125, -7.1064453125, -6.7098388671875, -6.313232421875, -5.9166259765625, -5.52001953125, -5.1234130859375, -4.726806640625, -4.3302001953125, -3.93359375, -3.5369873046875, -3.140380859375, -2.7437744140625, -2.34716796875, -1.9505615234375, -1.553955078125, -1.1573486328125, -0.7607421875, -0.3641357421875, 0.032470703125, 0.4290771484375, 0.82568359375, 1.2222900390625, 1.618896484375, 2.0155029296875, 2.412109375, 2.8087158203125, 3.205322265625, 3.6019287109375, 3.99853515625, 4.3951416015625, 4.791748046875, 5.1883544921875, 5.5849609375, 5.9815673828125, 6.378173828125, 6.7747802734375, 7.17138671875, 7.5679931640625, 7.964599609375, 8.3612060546875, 8.7578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 11.0, 9.0, 14.0, 9.0, 16.0, 17.0, 21.0, 27.0, 29.0, 32.0, 52.0, 57.0, 71.0, 80.0, 73.0, 73.0, 59.0, 60.0, 40.0, 39.0, 42.0, 23.0, 30.0, 27.0, 13.0, 11.0, 5.0, 7.0, 6.0, 8.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004513263702392578, -0.0004375167191028595, -0.0004237070679664612, -0.00040989741683006287, -0.00039608776569366455, -0.00038227811455726624, -0.0003684684634208679, -0.0003546588122844696, -0.0003408491611480713, -0.000327039510011673, -0.00031322985887527466, -0.00029942020773887634, -0.00028561055660247803, -0.0002718009054660797, -0.0002579912543296814, -0.0002441816031932831, -0.00023037195205688477, -0.00021656230092048645, -0.00020275264978408813, -0.00018894299864768982, -0.0001751333475112915, -0.0001613236963748932, -0.00014751404523849487, -0.00013370439410209656, -0.00011989474296569824, -0.00010608509182929993, -9.227544069290161e-05, -7.84657895565033e-05, -6.465613842010498e-05, -5.0846487283706665e-05, -3.703683614730835e-05, -2.3227185010910034e-05, -9.417533874511719e-06, 4.392117261886597e-06, 1.8201768398284912e-05, 3.201141953468323e-05, 4.582107067108154e-05, 5.963072180747986e-05, 7.344037294387817e-05, 8.725002408027649e-05, 0.0001010596752166748, 0.00011486932635307312, 0.00012867897748947144, 0.00014248862862586975, 0.00015629827976226807, 0.00017010793089866638, 0.0001839175820350647, 0.000197727233171463, 0.00021153688430786133, 0.00022534653544425964, 0.00023915618658065796, 0.0002529658377170563, 0.0002667754888534546, 0.0002805851399898529, 0.0002943947911262512, 0.00030820444226264954, 0.00032201409339904785, 0.00033582374453544617, 0.0003496333956718445, 0.0003634430468082428, 0.0003772526979446411, 0.00039106234908103943, 0.00040487200021743774, 0.00041868165135383606, 0.0004324913024902344]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 7.0, 13.0, 13.0, 21.0, 34.0, 62.0, 83.0, 148.0, 284.0, 647.0, 1362.0, 3505.0, 11926.0, 67111.0, 629736.0, 289623.0, 32161.0, 7400.0, 2402.0, 983.0, 446.0, 233.0, 128.0, 53.0, 35.0, 36.0, 23.0, 15.0, 11.0, 9.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.046875, -4.916839599609375, -4.78680419921875, -4.656768798828125, -4.5267333984375, -4.396697998046875, -4.26666259765625, -4.136627197265625, -4.006591796875, -3.876556396484375, -3.74652099609375, -3.616485595703125, -3.4864501953125, -3.356414794921875, -3.22637939453125, -3.096343994140625, -2.96630859375, -2.836273193359375, -2.70623779296875, -2.576202392578125, -2.4461669921875, -2.316131591796875, -2.18609619140625, -2.056060791015625, -1.926025390625, -1.795989990234375, -1.66595458984375, -1.535919189453125, -1.4058837890625, -1.275848388671875, -1.14581298828125, -1.015777587890625, -0.8857421875, -0.755706787109375, -0.62567138671875, -0.495635986328125, -0.3656005859375, -0.235565185546875, -0.10552978515625, 0.024505615234375, 0.154541015625, 0.284576416015625, 0.41461181640625, 0.544647216796875, 0.6746826171875, 0.804718017578125, 0.93475341796875, 1.064788818359375, 1.19482421875, 1.324859619140625, 1.45489501953125, 1.584930419921875, 1.7149658203125, 1.845001220703125, 1.97503662109375, 2.105072021484375, 2.235107421875, 2.365142822265625, 2.49517822265625, 2.625213623046875, 2.7552490234375, 2.885284423828125, 3.01531982421875, 3.145355224609375, 3.275390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 12.0, 12.0, 31.0, 54.0, 73.0, 124.0, 132.0, 134.0, 107.0, 95.0, 61.0, 56.0, 32.0, 16.0, 12.0, 9.0, 9.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23046875, -6.05914306640625, -5.8878173828125, -5.71649169921875, -5.545166015625, -5.37384033203125, -5.2025146484375, -5.03118896484375, -4.85986328125, -4.68853759765625, -4.5172119140625, -4.34588623046875, -4.174560546875, -4.00323486328125, -3.8319091796875, -3.66058349609375, -3.4892578125, -3.31793212890625, -3.1466064453125, -2.97528076171875, -2.803955078125, -2.63262939453125, -2.4613037109375, -2.28997802734375, -2.11865234375, -1.94732666015625, -1.7760009765625, -1.60467529296875, -1.433349609375, -1.26202392578125, -1.0906982421875, -0.91937255859375, -0.748046875, -0.57672119140625, -0.4053955078125, -0.23406982421875, -0.062744140625, 0.10858154296875, 0.2799072265625, 0.45123291015625, 0.62255859375, 0.79388427734375, 0.9652099609375, 1.13653564453125, 1.307861328125, 1.47918701171875, 1.6505126953125, 1.82183837890625, 1.9931640625, 2.16448974609375, 2.3358154296875, 2.50714111328125, 2.678466796875, 2.84979248046875, 3.0211181640625, 3.19244384765625, 3.36376953125, 3.53509521484375, 3.7064208984375, 3.87774658203125, 4.049072265625, 4.22039794921875, 4.3917236328125, 4.56304931640625, 4.734375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 15.0, 45.0, 166.0, 342.0, 272.0, 96.0, 40.0, 9.0, 10.0, 9.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.49655151367188, -88.25054931640625, -84.00454711914062, -79.758544921875, -75.5125503540039, -71.26654815673828, -67.02054595947266, -62.77454376220703, -58.52854537963867, -54.28254318237305, -50.03654479980469, -45.79054260253906, -41.54454040527344, -37.29854202270508, -33.05253982543945, -28.80653953552246, -24.56053924560547, -20.314538955688477, -16.068538665771484, -11.82253646850586, -7.576536178588867, -3.330535888671875, 0.91546630859375, 5.161466598510742, 9.407466888427734, 13.653467178344727, 17.89946746826172, 22.145469665527344, 26.391469955444336, 30.637470245361328, 34.88347244262695, 39.12947082519531, 43.37547302246094, 47.62147521972656, 51.86747360229492, 56.11347579956055, 60.359474182128906, 64.60547637939453, 68.85147857666016, 73.09748077392578, 77.34347534179688, 81.5894775390625, 85.83547973632812, 90.08148193359375, 94.32747650146484, 98.57347869873047, 102.8194808959961, 107.06548309326172, 111.31148529052734, 115.55748748779297, 119.8034896850586, 124.04948425292969, 128.2954864501953, 132.54148864746094, 136.78749084472656, 141.0334930419922, 145.2794952392578, 149.52549743652344, 153.77149963378906, 158.0175018310547, 162.2635040283203, 166.50949096679688, 170.7554931640625, 175.00149536132812, 179.24749755859375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 3.0, 6.0, 12.0, 11.0, 9.0, 15.0, 24.0, 25.0, 35.0, 37.0, 44.0, 44.0, 37.0, 39.0, 52.0, 58.0, 53.0, 65.0, 51.0, 40.0, 38.0, 43.0, 44.0, 24.0, 37.0, 24.0, 22.0, 12.0, 25.0, 11.0, 12.0, 9.0, 3.0, 8.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.79041290283203, -62.80526351928711, -60.82011413574219, -58.834964752197266, -56.849815368652344, -54.86466598510742, -52.8795166015625, -50.89436340332031, -48.909217834472656, -46.924068450927734, -44.93891906738281, -42.95376968383789, -40.96862030029297, -38.98347091674805, -36.998321533203125, -35.01316833496094, -33.028018951416016, -31.042869567871094, -29.057720184326172, -27.07257080078125, -25.087421417236328, -23.102272033691406, -21.11712074279785, -19.13197135925293, -17.146821975708008, -15.161672592163086, -13.176523208618164, -11.191372871398926, -9.206223487854004, -7.221074104309082, -5.235923767089844, -3.250774383544922, -1.265625, 0.719524621963501, 2.704674243927002, 4.689824104309082, 6.674973487854004, 8.660122871398926, 10.645273208618164, 12.630422592163086, 14.615571975708008, 16.60072135925293, 18.58587074279785, 20.571022033691406, 22.556171417236328, 24.54132080078125, 26.526470184326172, 28.511619567871094, 30.496768951416016, 32.48191833496094, 34.46706771850586, 36.45221710205078, 38.4373664855957, 40.422515869140625, 42.40766906738281, 44.39281463623047, 46.377967834472656, 48.36311721801758, 50.3482666015625, 52.33341598510742, 54.318565368652344, 56.303714752197266, 58.28886413574219, 60.274017333984375, 62.25916290283203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 7.0, 3.0, 11.0, 16.0, 16.0, 24.0, 31.0, 44.0, 59.0, 90.0, 138.0, 164.0, 289.0, 453.0, 833.0, 1683.0, 3833.0, 12139.0, 66055.0, 3930643.0, 149093.0, 18645.0, 5429.0, 2124.0, 979.0, 527.0, 326.0, 208.0, 129.0, 75.0, 57.0, 41.0, 24.0, 24.0, 20.0, 24.0, 12.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.1077880859375, -5.914794921875, -5.7218017578125, -5.52880859375, -5.3358154296875, -5.142822265625, -4.9498291015625, -4.7568359375, -4.5638427734375, -4.370849609375, -4.1778564453125, -3.98486328125, -3.7918701171875, -3.598876953125, -3.4058837890625, -3.212890625, -3.0198974609375, -2.826904296875, -2.6339111328125, -2.44091796875, -2.2479248046875, -2.054931640625, -1.8619384765625, -1.6689453125, -1.4759521484375, -1.282958984375, -1.0899658203125, -0.89697265625, -0.7039794921875, -0.510986328125, -0.3179931640625, -0.125, 0.0679931640625, 0.260986328125, 0.4539794921875, 0.64697265625, 0.8399658203125, 1.032958984375, 1.2259521484375, 1.4189453125, 1.6119384765625, 1.804931640625, 1.9979248046875, 2.19091796875, 2.3839111328125, 2.576904296875, 2.7698974609375, 2.962890625, 3.1558837890625, 3.348876953125, 3.5418701171875, 3.73486328125, 3.9278564453125, 4.120849609375, 4.3138427734375, 4.5068359375, 4.6998291015625, 4.892822265625, 5.0858154296875, 5.27880859375, 5.4718017578125, 5.664794921875, 5.8577880859375, 6.05078125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 8.0, 12.0, 14.0, 14.0, 20.0, 36.0, 51.0, 56.0, 52.0, 82.0, 76.0, 82.0, 82.0, 76.0, 69.0, 60.0, 55.0, 35.0, 26.0, 25.0, 17.0, 19.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.681640625, -3.545196533203125, -3.40875244140625, -3.272308349609375, -3.1358642578125, -2.999420166015625, -2.86297607421875, -2.726531982421875, -2.590087890625, -2.453643798828125, -2.31719970703125, -2.180755615234375, -2.0443115234375, -1.907867431640625, -1.77142333984375, -1.634979248046875, -1.49853515625, -1.362091064453125, -1.22564697265625, -1.089202880859375, -0.9527587890625, -0.816314697265625, -0.67987060546875, -0.543426513671875, -0.406982421875, -0.270538330078125, -0.13409423828125, 0.002349853515625, 0.1387939453125, 0.275238037109375, 0.41168212890625, 0.548126220703125, 0.6845703125, 0.821014404296875, 0.95745849609375, 1.093902587890625, 1.2303466796875, 1.366790771484375, 1.50323486328125, 1.639678955078125, 1.776123046875, 1.912567138671875, 2.04901123046875, 2.185455322265625, 2.3218994140625, 2.458343505859375, 2.59478759765625, 2.731231689453125, 2.86767578125, 3.004119873046875, 3.14056396484375, 3.277008056640625, 3.4134521484375, 3.549896240234375, 3.68634033203125, 3.822784423828125, 3.959228515625, 4.095672607421875, 4.23211669921875, 4.368560791015625, 4.5050048828125, 4.641448974609375, 4.77789306640625, 4.914337158203125, 5.05078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 5.0, 9.0, 8.0, 8.0, 19.0, 17.0, 34.0, 45.0, 39.0, 59.0, 80.0, 92.0, 143.0, 200.0, 274.0, 398.0, 569.0, 936.0, 1728.0, 3702.0, 10683.0, 54178.0, 3548190.0, 526030.0, 32176.0, 7791.0, 2898.0, 1475.0, 758.0, 482.0, 294.0, 261.0, 184.0, 119.0, 78.0, 79.0, 55.0, 44.0, 32.0, 32.0, 19.0, 19.0, 9.0, 8.0, 6.0, 4.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.453125, -7.2330322265625, -7.012939453125, -6.7928466796875, -6.57275390625, -6.3526611328125, -6.132568359375, -5.9124755859375, -5.6923828125, -5.4722900390625, -5.252197265625, -5.0321044921875, -4.81201171875, -4.5919189453125, -4.371826171875, -4.1517333984375, -3.931640625, -3.7115478515625, -3.491455078125, -3.2713623046875, -3.05126953125, -2.8311767578125, -2.611083984375, -2.3909912109375, -2.1708984375, -1.9508056640625, -1.730712890625, -1.5106201171875, -1.29052734375, -1.0704345703125, -0.850341796875, -0.6302490234375, -0.41015625, -0.1900634765625, 0.030029296875, 0.2501220703125, 0.47021484375, 0.6903076171875, 0.910400390625, 1.1304931640625, 1.3505859375, 1.5706787109375, 1.790771484375, 2.0108642578125, 2.23095703125, 2.4510498046875, 2.671142578125, 2.8912353515625, 3.111328125, 3.3314208984375, 3.551513671875, 3.7716064453125, 3.99169921875, 4.2117919921875, 4.431884765625, 4.6519775390625, 4.8720703125, 5.0921630859375, 5.312255859375, 5.5323486328125, 5.75244140625, 5.9725341796875, 6.192626953125, 6.4127197265625, 6.6328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 10.0, 15.0, 22.0, 52.0, 158.0, 1210.0, 2241.0, 185.0, 87.0, 36.0, 28.0, 13.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-7.1953125, -7.045562744140625, -6.89581298828125, -6.746063232421875, -6.5963134765625, -6.446563720703125, -6.29681396484375, -6.147064208984375, -5.997314453125, -5.847564697265625, -5.69781494140625, -5.548065185546875, -5.3983154296875, -5.248565673828125, -5.09881591796875, -4.949066162109375, -4.79931640625, -4.649566650390625, -4.49981689453125, -4.350067138671875, -4.2003173828125, -4.050567626953125, -3.90081787109375, -3.751068115234375, -3.601318359375, -3.451568603515625, -3.30181884765625, -3.152069091796875, -3.0023193359375, -2.852569580078125, -2.70281982421875, -2.553070068359375, -2.4033203125, -2.253570556640625, -2.10382080078125, -1.954071044921875, -1.8043212890625, -1.654571533203125, -1.50482177734375, -1.355072021484375, -1.205322265625, -1.055572509765625, -0.90582275390625, -0.756072998046875, -0.6063232421875, -0.456573486328125, -0.30682373046875, -0.157073974609375, -0.00732421875, 0.142425537109375, 0.29217529296875, 0.441925048828125, 0.5916748046875, 0.741424560546875, 0.89117431640625, 1.040924072265625, 1.190673828125, 1.340423583984375, 1.49017333984375, 1.639923095703125, 1.7896728515625, 1.939422607421875, 2.08917236328125, 2.238922119140625, 2.388671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 14.0, 22.0, 58.0, 87.0, 153.0, 177.0, 171.0, 132.0, 77.0, 42.0, 25.0, 18.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.120908737182617, -28.448209762573242, -27.775508880615234, -27.10280990600586, -26.430110931396484, -25.757410049438477, -25.0847110748291, -24.412010192871094, -23.73931121826172, -23.066612243652344, -22.393911361694336, -21.72121238708496, -21.048511505126953, -20.375812530517578, -19.703113555908203, -19.030414581298828, -18.35771369934082, -17.685014724731445, -17.012313842773438, -16.339614868164062, -15.666914939880371, -14.99421501159668, -14.321516036987305, -13.648816108703613, -12.976116180419922, -12.30341625213623, -11.630716323852539, -10.958017349243164, -10.285317420959473, -9.612617492675781, -8.939918518066406, -8.267218589782715, -7.594517707824707, -6.921817779541016, -6.249118328094482, -5.576418876647949, -4.903718948364258, -4.231019020080566, -3.558319568634033, -2.8856201171875, -2.2129201889038086, -1.5402204990386963, -0.867520809173584, -0.19482111930847168, 0.4778785705566406, 1.150578260421753, 1.8232779502868652, 2.4959774017333984, 3.16867733001709, 3.841377019882202, 4.5140767097473145, 5.186776161193848, 5.859476089477539, 6.5321760177612305, 7.204875469207764, 7.877574920654297, 8.550274848937988, 9.22297477722168, 9.895673751831055, 10.568373680114746, 11.241073608398438, 11.913773536682129, 12.58647346496582, 13.259172439575195, 13.931872367858887]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 10.0, 10.0, 13.0, 20.0, 21.0, 24.0, 29.0, 29.0, 36.0, 37.0, 44.0, 47.0, 44.0, 53.0, 49.0, 56.0, 49.0, 60.0, 35.0, 59.0, 41.0, 43.0, 29.0, 26.0, 26.0, 24.0, 15.0, 16.0, 13.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.627298355102539, -10.242330551147461, -9.857361793518066, -9.472393035888672, -9.087425231933594, -8.702457427978516, -8.317488670349121, -7.932520389556885, -7.547552108764648, -7.162583827972412, -6.777615547180176, -6.3926472663879395, -6.007678985595703, -5.622710704803467, -5.2377424240112305, -4.852774143218994, -4.467805862426758, -4.0828375816345215, -3.697869300842285, -3.312901020050049, -2.9279327392578125, -2.542964458465576, -2.15799617767334, -1.7730278968811035, -1.3880596160888672, -1.0030913352966309, -0.6181230545043945, -0.2331547737121582, 0.15181350708007812, 0.5367817878723145, 0.9217500686645508, 1.306718349456787, 1.6916875839233398, 2.076655864715576, 2.4616241455078125, 2.846592426300049, 3.231560707092285, 3.6165289878845215, 4.001497268676758, 4.386465549468994, 4.7714338302612305, 5.156402111053467, 5.541370391845703, 5.9263386726379395, 6.311306953430176, 6.696275234222412, 7.081243515014648, 7.466211795806885, 7.851180076599121, 8.236148834228516, 8.621116638183594, 9.006084442138672, 9.391053199768066, 9.776021957397461, 10.160989761352539, 10.545957565307617, 10.930926322937012, 11.315895080566406, 11.700862884521484, 12.085830688476562, 12.470799446105957, 12.855768203735352, 13.24073600769043, 13.625703811645508, 14.010672569274902]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 10.0, 12.0, 32.0, 43.0, 63.0, 66.0, 121.0, 123.0, 245.0, 356.0, 610.0, 900.0, 1476.0, 2625.0, 4877.0, 9426.0, 20008.0, 45557.0, 110126.0, 248601.0, 313026.0, 164386.0, 68403.0, 29014.0, 13282.0, 6550.0, 3443.0, 1983.0, 1156.0, 664.0, 467.0, 268.0, 213.0, 125.0, 72.0, 64.0, 40.0, 31.0, 15.0, 22.0, 16.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.537109375, -3.4273681640625, -3.317626953125, -3.2078857421875, -3.09814453125, -2.9884033203125, -2.878662109375, -2.7689208984375, -2.6591796875, -2.5494384765625, -2.439697265625, -2.3299560546875, -2.22021484375, -2.1104736328125, -2.000732421875, -1.8909912109375, -1.78125, -1.6715087890625, -1.561767578125, -1.4520263671875, -1.34228515625, -1.2325439453125, -1.122802734375, -1.0130615234375, -0.9033203125, -0.7935791015625, -0.683837890625, -0.5740966796875, -0.46435546875, -0.3546142578125, -0.244873046875, -0.1351318359375, -0.025390625, 0.0843505859375, 0.194091796875, 0.3038330078125, 0.41357421875, 0.5233154296875, 0.633056640625, 0.7427978515625, 0.8525390625, 0.9622802734375, 1.072021484375, 1.1817626953125, 1.29150390625, 1.4012451171875, 1.510986328125, 1.6207275390625, 1.73046875, 1.8402099609375, 1.949951171875, 2.0596923828125, 2.16943359375, 2.2791748046875, 2.388916015625, 2.4986572265625, 2.6083984375, 2.7181396484375, 2.827880859375, 2.9376220703125, 3.04736328125, 3.1571044921875, 3.266845703125, 3.3765869140625, 3.486328125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 11.0, 12.0, 17.0, 15.0, 25.0, 23.0, 41.0, 40.0, 45.0, 60.0, 58.0, 61.0, 41.0, 53.0, 56.0, 53.0, 58.0, 39.0, 57.0, 50.0, 25.0, 34.0, 27.0, 28.0, 15.0, 10.0, 5.0, 12.0, 4.0, 0.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.89453125, -2.7861328125, -2.677734375, -2.5693359375, -2.4609375, -2.3525390625, -2.244140625, -2.1357421875, -2.02734375, -1.9189453125, -1.810546875, -1.7021484375, -1.59375, -1.4853515625, -1.376953125, -1.2685546875, -1.16015625, -1.0517578125, -0.943359375, -0.8349609375, -0.7265625, -0.6181640625, -0.509765625, -0.4013671875, -0.29296875, -0.1845703125, -0.076171875, 0.0322265625, 0.140625, 0.2490234375, 0.357421875, 0.4658203125, 0.57421875, 0.6826171875, 0.791015625, 0.8994140625, 1.0078125, 1.1162109375, 1.224609375, 1.3330078125, 1.44140625, 1.5498046875, 1.658203125, 1.7666015625, 1.875, 1.9833984375, 2.091796875, 2.2001953125, 2.30859375, 2.4169921875, 2.525390625, 2.6337890625, 2.7421875, 2.8505859375, 2.958984375, 3.0673828125, 3.17578125, 3.2841796875, 3.392578125, 3.5009765625, 3.609375, 3.7177734375, 3.826171875, 3.9345703125, 4.04296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 14.0, 14.0, 13.0, 22.0, 51.0, 106.0, 267.0, 954.0, 7371.0, 825222.0, 209952.0, 3542.0, 593.0, 201.0, 93.0, 43.0, 27.0, 13.0, 9.0, 7.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.671875, -19.929931640625, -19.18798828125, -18.446044921875, -17.7041015625, -16.962158203125, -16.22021484375, -15.478271484375, -14.736328125, -13.994384765625, -13.25244140625, -12.510498046875, -11.7685546875, -11.026611328125, -10.28466796875, -9.542724609375, -8.80078125, -8.058837890625, -7.31689453125, -6.574951171875, -5.8330078125, -5.091064453125, -4.34912109375, -3.607177734375, -2.865234375, -2.123291015625, -1.38134765625, -0.639404296875, 0.1025390625, 0.844482421875, 1.58642578125, 2.328369140625, 3.0703125, 3.812255859375, 4.55419921875, 5.296142578125, 6.0380859375, 6.780029296875, 7.52197265625, 8.263916015625, 9.005859375, 9.747802734375, 10.48974609375, 11.231689453125, 11.9736328125, 12.715576171875, 13.45751953125, 14.199462890625, 14.94140625, 15.683349609375, 16.42529296875, 17.167236328125, 17.9091796875, 18.651123046875, 19.39306640625, 20.135009765625, 20.876953125, 21.618896484375, 22.36083984375, 23.102783203125, 23.8447265625, 24.586669921875, 25.32861328125, 26.070556640625, 26.8125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 10.0, 3.0, 8.0, 13.0, 20.0, 21.0, 25.0, 22.0, 31.0, 43.0, 46.0, 48.0, 53.0, 59.0, 56.0, 62.0, 43.0, 45.0, 50.0, 47.0, 50.0, 45.0, 39.0, 26.0, 23.0, 20.0, 22.0, 12.0, 15.0, 4.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0234375, -11.5777587890625, -11.132080078125, -10.6864013671875, -10.24072265625, -9.7950439453125, -9.349365234375, -8.9036865234375, -8.4580078125, -8.0123291015625, -7.566650390625, -7.1209716796875, -6.67529296875, -6.2296142578125, -5.783935546875, -5.3382568359375, -4.892578125, -4.4468994140625, -4.001220703125, -3.5555419921875, -3.10986328125, -2.6641845703125, -2.218505859375, -1.7728271484375, -1.3271484375, -0.8814697265625, -0.435791015625, 0.0098876953125, 0.45556640625, 0.9012451171875, 1.346923828125, 1.7926025390625, 2.23828125, 2.6839599609375, 3.129638671875, 3.5753173828125, 4.02099609375, 4.4666748046875, 4.912353515625, 5.3580322265625, 5.8037109375, 6.2493896484375, 6.695068359375, 7.1407470703125, 7.58642578125, 8.0321044921875, 8.477783203125, 8.9234619140625, 9.369140625, 9.8148193359375, 10.260498046875, 10.7061767578125, 11.15185546875, 11.5975341796875, 12.043212890625, 12.4888916015625, 12.9345703125, 13.3802490234375, 13.825927734375, 14.2716064453125, 14.71728515625, 15.1629638671875, 15.608642578125, 16.0543212890625, 16.5]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 6.0, 5.0, 14.0, 19.0, 35.0, 53.0, 90.0, 195.0, 482.0, 1431.0, 7385.0, 115161.0, 870622.0, 46931.0, 4371.0, 1037.0, 345.0, 168.0, 85.0, 42.0, 32.0, 17.0, 14.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.1640625, -6.015045166015625, -5.86602783203125, -5.717010498046875, -5.5679931640625, -5.418975830078125, -5.26995849609375, -5.120941162109375, -4.971923828125, -4.822906494140625, -4.67388916015625, -4.524871826171875, -4.3758544921875, -4.226837158203125, -4.07781982421875, -3.928802490234375, -3.77978515625, -3.630767822265625, -3.48175048828125, -3.332733154296875, -3.1837158203125, -3.034698486328125, -2.88568115234375, -2.736663818359375, -2.587646484375, -2.438629150390625, -2.28961181640625, -2.140594482421875, -1.9915771484375, -1.842559814453125, -1.69354248046875, -1.544525146484375, -1.3955078125, -1.246490478515625, -1.09747314453125, -0.948455810546875, -0.7994384765625, -0.650421142578125, -0.50140380859375, -0.352386474609375, -0.203369140625, -0.054351806640625, 0.09466552734375, 0.243682861328125, 0.3927001953125, 0.541717529296875, 0.69073486328125, 0.839752197265625, 0.98876953125, 1.137786865234375, 1.28680419921875, 1.435821533203125, 1.5848388671875, 1.733856201171875, 1.88287353515625, 2.031890869140625, 2.180908203125, 2.329925537109375, 2.47894287109375, 2.627960205078125, 2.7769775390625, 2.925994873046875, 3.07501220703125, 3.224029541015625, 3.373046875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 9.0, 9.0, 9.0, 9.0, 17.0, 9.0, 13.0, 19.0, 33.0, 16.0, 43.0, 46.0, 58.0, 85.0, 88.0, 106.0, 97.0, 59.0, 55.0, 43.0, 33.0, 28.0, 24.0, 16.0, 14.0, 12.0, 8.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.000522613525390625, -0.000506862998008728, -0.0004911124706268311, -0.0004753619432449341, -0.0004596114158630371, -0.00044386088848114014, -0.00042811036109924316, -0.0004123598337173462, -0.0003966093063354492, -0.00038085877895355225, -0.0003651082515716553, -0.0003493577241897583, -0.00033360719680786133, -0.00031785666942596436, -0.0003021061420440674, -0.0002863556146621704, -0.00027060508728027344, -0.00025485455989837646, -0.0002391040325164795, -0.00022335350513458252, -0.00020760297775268555, -0.00019185245037078857, -0.0001761019229888916, -0.00016035139560699463, -0.00014460086822509766, -0.00012885034084320068, -0.00011309981346130371, -9.734928607940674e-05, -8.159875869750977e-05, -6.584823131561279e-05, -5.009770393371582e-05, -3.434717655181885e-05, -1.8596649169921875e-05, -2.8461217880249023e-06, 1.290440559387207e-05, 2.8654932975769043e-05, 4.4405460357666016e-05, 6.015598773956299e-05, 7.590651512145996e-05, 9.165704250335693e-05, 0.0001074075698852539, 0.00012315809726715088, 0.00013890862464904785, 0.00015465915203094482, 0.0001704096794128418, 0.00018616020679473877, 0.00020191073417663574, 0.00021766126155853271, 0.0002334117889404297, 0.00024916231632232666, 0.00026491284370422363, 0.0002806633710861206, 0.0002964138984680176, 0.00031216442584991455, 0.0003279149532318115, 0.0003436654806137085, 0.00035941600799560547, 0.00037516653537750244, 0.0003909170627593994, 0.0004066675901412964, 0.00042241811752319336, 0.00043816864490509033, 0.0004539191722869873, 0.0004696696996688843, 0.00048542022705078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 5.0, 7.0, 13.0, 25.0, 35.0, 56.0, 84.0, 112.0, 198.0, 343.0, 691.0, 1358.0, 3302.0, 10173.0, 55520.0, 596620.0, 333614.0, 33997.0, 7245.0, 2576.0, 1211.0, 548.0, 325.0, 197.0, 102.0, 64.0, 46.0, 20.0, 21.0, 14.0, 7.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4921875, -3.37530517578125, -3.2584228515625, -3.14154052734375, -3.024658203125, -2.90777587890625, -2.7908935546875, -2.67401123046875, -2.55712890625, -2.44024658203125, -2.3233642578125, -2.20648193359375, -2.089599609375, -1.97271728515625, -1.8558349609375, -1.73895263671875, -1.6220703125, -1.50518798828125, -1.3883056640625, -1.27142333984375, -1.154541015625, -1.03765869140625, -0.9207763671875, -0.80389404296875, -0.68701171875, -0.57012939453125, -0.4532470703125, -0.33636474609375, -0.219482421875, -0.10260009765625, 0.0142822265625, 0.13116455078125, 0.248046875, 0.36492919921875, 0.4818115234375, 0.59869384765625, 0.715576171875, 0.83245849609375, 0.9493408203125, 1.06622314453125, 1.18310546875, 1.29998779296875, 1.4168701171875, 1.53375244140625, 1.650634765625, 1.76751708984375, 1.8843994140625, 2.00128173828125, 2.1181640625, 2.23504638671875, 2.3519287109375, 2.46881103515625, 2.585693359375, 2.70257568359375, 2.8194580078125, 2.93634033203125, 3.05322265625, 3.17010498046875, 3.2869873046875, 3.40386962890625, 3.520751953125, 3.63763427734375, 3.7545166015625, 3.87139892578125, 3.98828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 7.0, 15.0, 19.0, 40.0, 32.0, 45.0, 85.0, 114.0, 122.0, 161.0, 101.0, 83.0, 54.0, 32.0, 22.0, 18.0, 11.0, 7.0, 10.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.896484375, -2.752166748046875, -2.60784912109375, -2.463531494140625, -2.3192138671875, -2.174896240234375, -2.03057861328125, -1.886260986328125, -1.741943359375, -1.597625732421875, -1.45330810546875, -1.308990478515625, -1.1646728515625, -1.020355224609375, -0.87603759765625, -0.731719970703125, -0.58740234375, -0.443084716796875, -0.29876708984375, -0.154449462890625, -0.0101318359375, 0.134185791015625, 0.27850341796875, 0.422821044921875, 0.567138671875, 0.711456298828125, 0.85577392578125, 1.000091552734375, 1.1444091796875, 1.288726806640625, 1.43304443359375, 1.577362060546875, 1.7216796875, 1.865997314453125, 2.01031494140625, 2.154632568359375, 2.2989501953125, 2.443267822265625, 2.58758544921875, 2.731903076171875, 2.876220703125, 3.020538330078125, 3.16485595703125, 3.309173583984375, 3.4534912109375, 3.597808837890625, 3.74212646484375, 3.886444091796875, 4.03076171875, 4.175079345703125, 4.31939697265625, 4.463714599609375, 4.6080322265625, 4.752349853515625, 4.89666748046875, 5.040985107421875, 5.185302734375, 5.329620361328125, 5.47393798828125, 5.618255615234375, 5.7625732421875, 5.906890869140625, 6.05120849609375, 6.195526123046875, 6.33984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 11.0, 5.0, 20.0, 55.0, 124.0, 288.0, 268.0, 144.0, 56.0, 20.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.18428039550781, -90.46527099609375, -86.74626159667969, -83.02725219726562, -79.30824279785156, -75.5892333984375, -71.87022399902344, -68.1512222290039, -64.43221282958984, -60.71320343017578, -56.99419403076172, -53.275184631347656, -49.55617904663086, -45.8371696472168, -42.118160247802734, -38.39915466308594, -34.68014144897461, -30.961132049560547, -27.242124557495117, -23.523115158081055, -19.804107666015625, -16.085098266601562, -12.3660888671875, -8.64708137512207, -4.928071975708008, -1.2090632915496826, 2.5099453926086426, 6.228954315185547, 9.947962760925293, 13.666971206665039, 17.3859806060791, 21.10498809814453, 24.823997497558594, 28.543006896972656, 32.26201629638672, 35.98102569580078, 39.70003128051758, 43.41904067993164, 47.1380500793457, 50.8570556640625, 54.57606506347656, 58.295074462890625, 62.01408386230469, 65.73309326171875, 69.45210266113281, 73.17111206054688, 76.89012145996094, 80.60912322998047, 84.32814025878906, 88.04714965820312, 91.76615905761719, 95.48516845703125, 99.20417785644531, 102.92318725585938, 106.64219665527344, 110.36119842529297, 114.08020782470703, 117.7992172241211, 121.51822662353516, 125.23723602294922, 128.95623779296875, 132.6752471923828, 136.39425659179688, 140.11326599121094, 143.832275390625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 5.0, 3.0, 8.0, 8.0, 8.0, 14.0, 12.0, 13.0, 17.0, 22.0, 29.0, 24.0, 40.0, 38.0, 36.0, 45.0, 48.0, 49.0, 42.0, 55.0, 72.0, 46.0, 44.0, 46.0, 35.0, 54.0, 30.0, 20.0, 23.0, 30.0, 16.0, 15.0, 12.0, 11.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-59.87232971191406, -57.96710205078125, -56.06187057495117, -54.15664291381836, -52.25141143798828, -50.34618377685547, -48.440956115722656, -46.53572463989258, -44.6304931640625, -42.72526550292969, -40.82003402709961, -38.9148063659668, -37.00957489013672, -35.104347229003906, -33.199119567871094, -31.293888092041016, -29.388660430908203, -27.483430862426758, -25.578201293945312, -23.6729736328125, -21.767742156982422, -19.86251449584961, -17.957284927368164, -16.05205535888672, -14.146825790405273, -12.241596221923828, -10.336366653442383, -8.431138038635254, -6.525908470153809, -4.620678901672363, -2.7154502868652344, -0.8102207183837891, 1.0950088500976562, 3.0002381801605225, 4.905467510223389, 6.810696601867676, 8.715926170349121, 10.621155738830566, 12.526384353637695, 14.43161392211914, 16.336843490600586, 18.24207305908203, 20.147302627563477, 22.052532196044922, 23.957759857177734, 25.862991333007812, 27.768218994140625, 29.67344856262207, 31.578678131103516, 33.48390579223633, 35.389137268066406, 37.29436492919922, 39.1995964050293, 41.10482406616211, 43.01005554199219, 44.915283203125, 46.82051086425781, 48.725738525390625, 50.6309700012207, 52.536197662353516, 54.441429138183594, 56.346656799316406, 58.25188446044922, 60.1571159362793, 62.062347412109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 6.0, 5.0, 8.0, 7.0, 14.0, 27.0, 31.0, 49.0, 75.0, 105.0, 209.0, 342.0, 645.0, 1332.0, 2721.0, 6356.0, 17585.0, 93469.0, 1760315.0, 2169372.0, 110130.0, 19234.0, 6652.0, 2899.0, 1293.0, 625.0, 313.0, 191.0, 111.0, 71.0, 26.0, 23.0, 16.0, 11.0, 7.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.9375, -4.79241943359375, -4.6473388671875, -4.50225830078125, -4.357177734375, -4.21209716796875, -4.0670166015625, -3.92193603515625, -3.77685546875, -3.63177490234375, -3.4866943359375, -3.34161376953125, -3.196533203125, -3.05145263671875, -2.9063720703125, -2.76129150390625, -2.6162109375, -2.47113037109375, -2.3260498046875, -2.18096923828125, -2.035888671875, -1.89080810546875, -1.7457275390625, -1.60064697265625, -1.45556640625, -1.31048583984375, -1.1654052734375, -1.02032470703125, -0.875244140625, -0.73016357421875, -0.5850830078125, -0.44000244140625, -0.294921875, -0.14984130859375, -0.0047607421875, 0.14031982421875, 0.285400390625, 0.43048095703125, 0.5755615234375, 0.72064208984375, 0.86572265625, 1.01080322265625, 1.1558837890625, 1.30096435546875, 1.446044921875, 1.59112548828125, 1.7362060546875, 1.88128662109375, 2.0263671875, 2.17144775390625, 2.3165283203125, 2.46160888671875, 2.606689453125, 2.75177001953125, 2.8968505859375, 3.04193115234375, 3.18701171875, 3.33209228515625, 3.4771728515625, 3.62225341796875, 3.767333984375, 3.91241455078125, 4.0574951171875, 4.20257568359375, 4.34765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 7.0, 12.0, 13.0, 12.0, 12.0, 18.0, 17.0, 36.0, 36.0, 30.0, 36.0, 41.0, 53.0, 37.0, 41.0, 52.0, 46.0, 46.0, 35.0, 48.0, 40.0, 42.0, 29.0, 37.0, 36.0, 33.0, 28.0, 14.0, 11.0, 16.0, 13.0, 14.0, 15.0, 8.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.515625, -2.439483642578125, -2.36334228515625, -2.287200927734375, -2.2110595703125, -2.134918212890625, -2.05877685546875, -1.982635498046875, -1.906494140625, -1.830352783203125, -1.75421142578125, -1.678070068359375, -1.6019287109375, -1.525787353515625, -1.44964599609375, -1.373504638671875, -1.29736328125, -1.221221923828125, -1.14508056640625, -1.068939208984375, -0.9927978515625, -0.916656494140625, -0.84051513671875, -0.764373779296875, -0.688232421875, -0.612091064453125, -0.53594970703125, -0.459808349609375, -0.3836669921875, -0.307525634765625, -0.23138427734375, -0.155242919921875, -0.0791015625, -0.002960205078125, 0.07318115234375, 0.149322509765625, 0.2254638671875, 0.301605224609375, 0.37774658203125, 0.453887939453125, 0.530029296875, 0.606170654296875, 0.68231201171875, 0.758453369140625, 0.8345947265625, 0.910736083984375, 0.98687744140625, 1.063018798828125, 1.13916015625, 1.215301513671875, 1.29144287109375, 1.367584228515625, 1.4437255859375, 1.519866943359375, 1.59600830078125, 1.672149658203125, 1.748291015625, 1.824432373046875, 1.90057373046875, 1.976715087890625, 2.0528564453125, 2.128997802734375, 2.20513916015625, 2.281280517578125, 2.357421875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 5.0, 10.0, 12.0, 18.0, 33.0, 92.0, 225.0, 744.0, 3497.0, 33839.0, 4030083.0, 117260.0, 6653.0, 1244.0, 312.0, 136.0, 55.0, 22.0, 13.0, 5.0, 7.0, 3.0, 1.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8046875, -15.2718505859375, -14.739013671875, -14.2061767578125, -13.67333984375, -13.1405029296875, -12.607666015625, -12.0748291015625, -11.5419921875, -11.0091552734375, -10.476318359375, -9.9434814453125, -9.41064453125, -8.8778076171875, -8.344970703125, -7.8121337890625, -7.279296875, -6.7464599609375, -6.213623046875, -5.6807861328125, -5.14794921875, -4.6151123046875, -4.082275390625, -3.5494384765625, -3.0166015625, -2.4837646484375, -1.950927734375, -1.4180908203125, -0.88525390625, -0.3524169921875, 0.180419921875, 0.7132568359375, 1.24609375, 1.7789306640625, 2.311767578125, 2.8446044921875, 3.37744140625, 3.9102783203125, 4.443115234375, 4.9759521484375, 5.5087890625, 6.0416259765625, 6.574462890625, 7.1072998046875, 7.64013671875, 8.1729736328125, 8.705810546875, 9.2386474609375, 9.771484375, 10.3043212890625, 10.837158203125, 11.3699951171875, 11.90283203125, 12.4356689453125, 12.968505859375, 13.5013427734375, 14.0341796875, 14.5670166015625, 15.099853515625, 15.6326904296875, 16.16552734375, 16.6983642578125, 17.231201171875, 17.7640380859375, 18.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 20.0, 32.0, 53.0, 125.0, 301.0, 970.0, 1425.0, 667.0, 208.0, 84.0, 53.0, 27.0, 22.0, 8.0, 5.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.5899658203125, -10.289306640625, -9.9886474609375, -9.68798828125, -9.3873291015625, -9.086669921875, -8.7860107421875, -8.4853515625, -8.1846923828125, -7.884033203125, -7.5833740234375, -7.28271484375, -6.9820556640625, -6.681396484375, -6.3807373046875, -6.080078125, -5.7794189453125, -5.478759765625, -5.1781005859375, -4.87744140625, -4.5767822265625, -4.276123046875, -3.9754638671875, -3.6748046875, -3.3741455078125, -3.073486328125, -2.7728271484375, -2.47216796875, -2.1715087890625, -1.870849609375, -1.5701904296875, -1.26953125, -0.9688720703125, -0.668212890625, -0.3675537109375, -0.06689453125, 0.2337646484375, 0.534423828125, 0.8350830078125, 1.1357421875, 1.4364013671875, 1.737060546875, 2.0377197265625, 2.33837890625, 2.6390380859375, 2.939697265625, 3.2403564453125, 3.541015625, 3.8416748046875, 4.142333984375, 4.4429931640625, 4.74365234375, 5.0443115234375, 5.344970703125, 5.6456298828125, 5.9462890625, 6.2469482421875, 6.547607421875, 6.8482666015625, 7.14892578125, 7.4495849609375, 7.750244140625, 8.0509033203125, 8.3515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 7.0, 13.0, 43.0, 110.0, 203.0, 250.0, 211.0, 97.0, 33.0, 11.0, 5.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.177978515625, -61.159942626953125, -58.14190673828125, -55.123870849609375, -52.1058349609375, -49.087799072265625, -46.06976318359375, -43.051727294921875, -40.03369140625, -37.015655517578125, -33.99761962890625, -30.979583740234375, -27.9615478515625, -24.943511962890625, -21.925477981567383, -18.907442092895508, -15.889408111572266, -12.87137222290039, -9.853336334228516, -6.835301399230957, -3.817265510559082, -0.799229621887207, 2.2188053131103516, 5.236841201782227, 8.254877090454102, 11.272912979125977, 14.290948867797852, 17.308982849121094, 20.32701873779297, 23.345054626464844, 26.36309051513672, 29.381126403808594, 32.39916229248047, 35.417198181152344, 38.43523406982422, 41.453269958496094, 44.47130584716797, 47.489341735839844, 50.50737762451172, 53.525413513183594, 56.54344940185547, 59.561485290527344, 62.57952117919922, 65.5975570678711, 68.61559295654297, 71.63362884521484, 74.65166473388672, 77.6697006225586, 80.68772888183594, 83.70576477050781, 86.72380065917969, 89.74183654785156, 92.75987243652344, 95.77790832519531, 98.79594421386719, 101.81398010253906, 104.83201599121094, 107.85005187988281, 110.86808776855469, 113.88612365722656, 116.90415954589844, 119.92219543457031, 122.94023132324219, 125.95826721191406, 128.97630310058594]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 12.0, 17.0, 13.0, 24.0, 19.0, 30.0, 31.0, 39.0, 39.0, 55.0, 43.0, 53.0, 59.0, 48.0, 61.0, 51.0, 61.0, 47.0, 36.0, 31.0, 47.0, 28.0, 37.0, 35.0, 28.0, 17.0, 11.0, 9.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.70733642578125, -29.606185913085938, -28.505033493041992, -27.403881072998047, -26.302730560302734, -25.201580047607422, -24.100427627563477, -22.99927520751953, -21.89812469482422, -20.796974182128906, -19.69582176208496, -18.594669342041016, -17.493518829345703, -16.39236831665039, -15.291215896606445, -14.190064430236816, -13.088912963867188, -11.987761497497559, -10.88661003112793, -9.7854585647583, -8.684307098388672, -7.583155632019043, -6.482004165649414, -5.380852699279785, -4.279701232910156, -3.1785497665405273, -2.0773983001708984, -0.9762468338012695, 0.12490463256835938, 1.2260560989379883, 2.327207565307617, 3.428359031677246, 4.529510498046875, 5.630661964416504, 6.731813430786133, 7.832964897155762, 8.93411636352539, 10.03526782989502, 11.136419296264648, 12.237570762634277, 13.338722229003906, 14.439873695373535, 15.541025161743164, 16.64217758178711, 17.743328094482422, 18.844478607177734, 19.94563102722168, 21.046783447265625, 22.147933959960938, 23.24908447265625, 24.350236892700195, 25.45138931274414, 26.552539825439453, 27.653690338134766, 28.75484275817871, 29.855995178222656, 30.95714569091797, 32.05829620361328, 33.159446716308594, 34.26060104370117, 35.361751556396484, 36.4629020690918, 37.564056396484375, 38.66520690917969, 39.766357421875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 0.0, 6.0, 10.0, 13.0, 24.0, 29.0, 44.0, 85.0, 113.0, 178.0, 257.0, 436.0, 631.0, 1048.0, 1778.0, 3028.0, 5223.0, 9822.0, 18871.0, 38149.0, 81750.0, 174172.0, 287456.0, 218569.0, 105710.0, 49675.0, 23900.0, 12070.0, 6402.0, 3657.0, 2094.0, 1302.0, 747.0, 464.0, 267.0, 169.0, 119.0, 102.0, 50.0, 38.0, 31.0, 19.0, 11.0, 17.0, 3.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.916015625, -2.82940673828125, -2.7427978515625, -2.65618896484375, -2.569580078125, -2.48297119140625, -2.3963623046875, -2.30975341796875, -2.22314453125, -2.13653564453125, -2.0499267578125, -1.96331787109375, -1.876708984375, -1.79010009765625, -1.7034912109375, -1.61688232421875, -1.5302734375, -1.44366455078125, -1.3570556640625, -1.27044677734375, -1.183837890625, -1.09722900390625, -1.0106201171875, -0.92401123046875, -0.83740234375, -0.75079345703125, -0.6641845703125, -0.57757568359375, -0.490966796875, -0.40435791015625, -0.3177490234375, -0.23114013671875, -0.14453125, -0.05792236328125, 0.0286865234375, 0.11529541015625, 0.201904296875, 0.28851318359375, 0.3751220703125, 0.46173095703125, 0.54833984375, 0.63494873046875, 0.7215576171875, 0.80816650390625, 0.894775390625, 0.98138427734375, 1.0679931640625, 1.15460205078125, 1.2412109375, 1.32781982421875, 1.4144287109375, 1.50103759765625, 1.587646484375, 1.67425537109375, 1.7608642578125, 1.84747314453125, 1.93408203125, 2.02069091796875, 2.1072998046875, 2.19390869140625, 2.280517578125, 2.36712646484375, 2.4537353515625, 2.54034423828125, 2.626953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 13.0, 12.0, 19.0, 15.0, 32.0, 21.0, 29.0, 39.0, 28.0, 37.0, 43.0, 48.0, 47.0, 44.0, 61.0, 42.0, 40.0, 54.0, 49.0, 33.0, 36.0, 39.0, 25.0, 29.0, 24.0, 26.0, 17.0, 20.0, 13.0, 12.0, 13.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.3360595703125, -2.256103515625, -2.1761474609375, -2.09619140625, -2.0162353515625, -1.936279296875, -1.8563232421875, -1.7763671875, -1.6964111328125, -1.616455078125, -1.5364990234375, -1.45654296875, -1.3765869140625, -1.296630859375, -1.2166748046875, -1.13671875, -1.0567626953125, -0.976806640625, -0.8968505859375, -0.81689453125, -0.7369384765625, -0.656982421875, -0.5770263671875, -0.4970703125, -0.4171142578125, -0.337158203125, -0.2572021484375, -0.17724609375, -0.0972900390625, -0.017333984375, 0.0626220703125, 0.142578125, 0.2225341796875, 0.302490234375, 0.3824462890625, 0.46240234375, 0.5423583984375, 0.622314453125, 0.7022705078125, 0.7822265625, 0.8621826171875, 0.942138671875, 1.0220947265625, 1.10205078125, 1.1820068359375, 1.261962890625, 1.3419189453125, 1.421875, 1.5018310546875, 1.581787109375, 1.6617431640625, 1.74169921875, 1.8216552734375, 1.901611328125, 1.9815673828125, 2.0615234375, 2.1414794921875, 2.221435546875, 2.3013916015625, 2.38134765625, 2.4613037109375, 2.541259765625, 2.6212158203125, 2.701171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 11.0, 11.0, 13.0, 15.0, 20.0, 22.0, 39.0, 48.0, 81.0, 113.0, 176.0, 350.0, 577.0, 1270.0, 4230.0, 37071.0, 850793.0, 141695.0, 8099.0, 2004.0, 835.0, 390.0, 204.0, 137.0, 103.0, 53.0, 35.0, 31.0, 26.0, 21.0, 13.0, 15.0, 12.0, 3.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.84375, -12.450927734375, -12.05810546875, -11.665283203125, -11.2724609375, -10.879638671875, -10.48681640625, -10.093994140625, -9.701171875, -9.308349609375, -8.91552734375, -8.522705078125, -8.1298828125, -7.737060546875, -7.34423828125, -6.951416015625, -6.55859375, -6.165771484375, -5.77294921875, -5.380126953125, -4.9873046875, -4.594482421875, -4.20166015625, -3.808837890625, -3.416015625, -3.023193359375, -2.63037109375, -2.237548828125, -1.8447265625, -1.451904296875, -1.05908203125, -0.666259765625, -0.2734375, 0.119384765625, 0.51220703125, 0.905029296875, 1.2978515625, 1.690673828125, 2.08349609375, 2.476318359375, 2.869140625, 3.261962890625, 3.65478515625, 4.047607421875, 4.4404296875, 4.833251953125, 5.22607421875, 5.618896484375, 6.01171875, 6.404541015625, 6.79736328125, 7.190185546875, 7.5830078125, 7.975830078125, 8.36865234375, 8.761474609375, 9.154296875, 9.547119140625, 9.93994140625, 10.332763671875, 10.7255859375, 11.118408203125, 11.51123046875, 11.904052734375, 12.296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 9.0, 14.0, 18.0, 17.0, 22.0, 31.0, 31.0, 41.0, 40.0, 39.0, 38.0, 53.0, 41.0, 56.0, 59.0, 60.0, 52.0, 52.0, 45.0, 47.0, 37.0, 29.0, 21.0, 17.0, 19.0, 21.0, 12.0, 15.0, 12.0, 8.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.3828125, -12.9964599609375, -12.610107421875, -12.2237548828125, -11.83740234375, -11.4510498046875, -11.064697265625, -10.6783447265625, -10.2919921875, -9.9056396484375, -9.519287109375, -9.1329345703125, -8.74658203125, -8.3602294921875, -7.973876953125, -7.5875244140625, -7.201171875, -6.8148193359375, -6.428466796875, -6.0421142578125, -5.65576171875, -5.2694091796875, -4.883056640625, -4.4967041015625, -4.1103515625, -3.7239990234375, -3.337646484375, -2.9512939453125, -2.56494140625, -2.1785888671875, -1.792236328125, -1.4058837890625, -1.01953125, -0.6331787109375, -0.246826171875, 0.1395263671875, 0.52587890625, 0.9122314453125, 1.298583984375, 1.6849365234375, 2.0712890625, 2.4576416015625, 2.843994140625, 3.2303466796875, 3.61669921875, 4.0030517578125, 4.389404296875, 4.7757568359375, 5.162109375, 5.5484619140625, 5.934814453125, 6.3211669921875, 6.70751953125, 7.0938720703125, 7.480224609375, 7.8665771484375, 8.2529296875, 8.6392822265625, 9.025634765625, 9.4119873046875, 9.79833984375, 10.1846923828125, 10.571044921875, 10.9573974609375, 11.34375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 2.0, 7.0, 7.0, 12.0, 17.0, 33.0, 25.0, 34.0, 48.0, 104.0, 174.0, 342.0, 681.0, 1716.0, 6746.0, 52008.0, 822502.0, 146623.0, 12841.0, 2743.0, 918.0, 390.0, 188.0, 130.0, 73.0, 44.0, 42.0, 24.0, 22.0, 15.0, 7.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.50390625, -3.36749267578125, -3.2310791015625, -3.09466552734375, -2.958251953125, -2.82183837890625, -2.6854248046875, -2.54901123046875, -2.41259765625, -2.27618408203125, -2.1397705078125, -2.00335693359375, -1.866943359375, -1.73052978515625, -1.5941162109375, -1.45770263671875, -1.3212890625, -1.18487548828125, -1.0484619140625, -0.91204833984375, -0.775634765625, -0.63922119140625, -0.5028076171875, -0.36639404296875, -0.22998046875, -0.09356689453125, 0.0428466796875, 0.17926025390625, 0.315673828125, 0.45208740234375, 0.5885009765625, 0.72491455078125, 0.861328125, 0.99774169921875, 1.1341552734375, 1.27056884765625, 1.406982421875, 1.54339599609375, 1.6798095703125, 1.81622314453125, 1.95263671875, 2.08905029296875, 2.2254638671875, 2.36187744140625, 2.498291015625, 2.63470458984375, 2.7711181640625, 2.90753173828125, 3.0439453125, 3.18035888671875, 3.3167724609375, 3.45318603515625, 3.589599609375, 3.72601318359375, 3.8624267578125, 3.99884033203125, 4.13525390625, 4.27166748046875, 4.4080810546875, 4.54449462890625, 4.680908203125, 4.81732177734375, 4.9537353515625, 5.09014892578125, 5.2265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 8.0, 5.0, 7.0, 7.0, 10.0, 12.0, 16.0, 24.0, 23.0, 28.0, 38.0, 35.0, 56.0, 104.0, 123.0, 116.0, 98.0, 63.0, 53.0, 42.0, 22.0, 25.0, 15.0, 12.0, 14.0, 9.0, 5.0, 1.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007185935974121094, -0.0006991401314735413, -0.0006796866655349731, -0.000660233199596405, -0.0006407797336578369, -0.0006213262677192688, -0.0006018728017807007, -0.0005824193358421326, -0.0005629658699035645, -0.0005435124039649963, -0.0005240589380264282, -0.0005046054720878601, -0.000485152006149292, -0.0004656985402107239, -0.00044624507427215576, -0.00042679160833358765, -0.00040733814239501953, -0.0003878846764564514, -0.0003684312105178833, -0.0003489777445793152, -0.00032952427864074707, -0.00031007081270217896, -0.00029061734676361084, -0.0002711638808250427, -0.0002517104148864746, -0.0002322569489479065, -0.00021280348300933838, -0.00019335001707077026, -0.00017389655113220215, -0.00015444308519363403, -0.00013498961925506592, -0.0001155361533164978, -9.608268737792969e-05, -7.662922143936157e-05, -5.717575550079346e-05, -3.772228956222534e-05, -1.8268823623657227e-05, 1.1846423149108887e-06, 2.0638108253479004e-05, 4.009157419204712e-05, 5.9545040130615234e-05, 7.899850606918335e-05, 9.845197200775146e-05, 0.00011790543794631958, 0.0001373589038848877, 0.0001568123698234558, 0.00017626583576202393, 0.00019571930170059204, 0.00021517276763916016, 0.00023462623357772827, 0.0002540796995162964, 0.0002735331654548645, 0.0002929866313934326, 0.00031244009733200073, 0.00033189356327056885, 0.00035134702920913696, 0.0003708004951477051, 0.0003902539610862732, 0.0004097074270248413, 0.0004291608929634094, 0.00044861435890197754, 0.00046806782484054565, 0.00048752129077911377, 0.0005069747567176819, 0.00052642822265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 8.0, 21.0, 28.0, 46.0, 74.0, 125.0, 251.0, 520.0, 1210.0, 3520.0, 15642.0, 163639.0, 798147.0, 53779.0, 7744.0, 2151.0, 814.0, 355.0, 202.0, 87.0, 72.0, 37.0, 27.0, 19.0, 12.0, 5.0, 3.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.37109375, -5.20477294921875, -5.0384521484375, -4.87213134765625, -4.705810546875, -4.53948974609375, -4.3731689453125, -4.20684814453125, -4.04052734375, -3.87420654296875, -3.7078857421875, -3.54156494140625, -3.375244140625, -3.20892333984375, -3.0426025390625, -2.87628173828125, -2.7099609375, -2.54364013671875, -2.3773193359375, -2.21099853515625, -2.044677734375, -1.87835693359375, -1.7120361328125, -1.54571533203125, -1.37939453125, -1.21307373046875, -1.0467529296875, -0.88043212890625, -0.714111328125, -0.54779052734375, -0.3814697265625, -0.21514892578125, -0.048828125, 0.11749267578125, 0.2838134765625, 0.45013427734375, 0.616455078125, 0.78277587890625, 0.9490966796875, 1.11541748046875, 1.28173828125, 1.44805908203125, 1.6143798828125, 1.78070068359375, 1.947021484375, 2.11334228515625, 2.2796630859375, 2.44598388671875, 2.6123046875, 2.77862548828125, 2.9449462890625, 3.11126708984375, 3.277587890625, 3.44390869140625, 3.6102294921875, 3.77655029296875, 3.94287109375, 4.10919189453125, 4.2755126953125, 4.44183349609375, 4.608154296875, 4.77447509765625, 4.9407958984375, 5.10711669921875, 5.2734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 22.0, 23.0, 19.0, 35.0, 51.0, 74.0, 87.0, 123.0, 128.0, 120.0, 63.0, 64.0, 46.0, 23.0, 28.0, 16.0, 13.0, 16.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.89453125, -5.758209228515625, -5.62188720703125, -5.485565185546875, -5.3492431640625, -5.212921142578125, -5.07659912109375, -4.940277099609375, -4.803955078125, -4.667633056640625, -4.53131103515625, -4.394989013671875, -4.2586669921875, -4.122344970703125, -3.98602294921875, -3.849700927734375, -3.71337890625, -3.577056884765625, -3.44073486328125, -3.304412841796875, -3.1680908203125, -3.031768798828125, -2.89544677734375, -2.759124755859375, -2.622802734375, -2.486480712890625, -2.35015869140625, -2.213836669921875, -2.0775146484375, -1.941192626953125, -1.80487060546875, -1.668548583984375, -1.5322265625, -1.395904541015625, -1.25958251953125, -1.123260498046875, -0.9869384765625, -0.850616455078125, -0.71429443359375, -0.577972412109375, -0.441650390625, -0.305328369140625, -0.16900634765625, -0.032684326171875, 0.1036376953125, 0.239959716796875, 0.37628173828125, 0.512603759765625, 0.64892578125, 0.785247802734375, 0.92156982421875, 1.057891845703125, 1.1942138671875, 1.330535888671875, 1.46685791015625, 1.603179931640625, 1.739501953125, 1.875823974609375, 2.01214599609375, 2.148468017578125, 2.2847900390625, 2.421112060546875, 2.55743408203125, 2.693756103515625, 2.830078125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 9.0, 16.0, 34.0, 125.0, 430.0, 266.0, 86.0, 21.0, 7.0, 6.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.71713256835938, -159.603271484375, -155.48939514160156, -151.3755340576172, -147.26165771484375, -143.14779663085938, -139.033935546875, -134.92005920410156, -130.8061981201172, -126.69232940673828, -122.57846069335938, -118.464599609375, -114.3507308959961, -110.23686218261719, -106.12299346923828, -102.00912475585938, -97.89525604248047, -93.78138732910156, -89.66751861572266, -85.55364990234375, -81.43978881835938, -77.32592010498047, -73.21205139160156, -69.09818267822266, -64.98431396484375, -60.870445251464844, -56.7565803527832, -52.6427116394043, -48.528846740722656, -44.41497802734375, -40.301109313964844, -36.18724060058594, -32.07337951660156, -27.95951271057129, -23.845645904541016, -19.73177719116211, -15.617910385131836, -11.504043579101562, -7.390174865722656, -3.276308059692383, 0.8375587463378906, 4.951426029205322, 9.065293312072754, 13.179161071777344, 17.293027877807617, 21.40689468383789, 25.520763397216797, 29.63463020324707, 33.748497009277344, 37.86236572265625, 41.97623062133789, 46.0900993347168, 50.20396423339844, 54.317832946777344, 58.43170166015625, 62.545570373535156, 66.65943908691406, 70.77330780029297, 74.88717651367188, 79.00103759765625, 83.11490631103516, 87.22877502441406, 91.34264373779297, 95.45651245117188, 99.57037353515625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 4.0, 10.0, 8.0, 15.0, 14.0, 14.0, 23.0, 20.0, 18.0, 33.0, 29.0, 33.0, 35.0, 40.0, 47.0, 60.0, 52.0, 50.0, 71.0, 55.0, 40.0, 42.0, 34.0, 24.0, 33.0, 33.0, 37.0, 21.0, 18.0, 10.0, 12.0, 11.0, 13.0, 11.0, 5.0, 8.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-53.7112922668457, -52.2326774597168, -50.754058837890625, -49.27544403076172, -47.79682922363281, -46.318214416503906, -44.839595794677734, -43.36098098754883, -41.882362365722656, -40.40374755859375, -38.92512893676758, -37.44651412963867, -35.967899322509766, -34.489280700683594, -33.01066589355469, -31.53205108642578, -30.053436279296875, -28.574819564819336, -27.09620475769043, -25.61758804321289, -24.138973236083984, -22.660356521606445, -21.181739807128906, -19.703125, -18.22450828552246, -16.745891571044922, -15.267276763916016, -13.788660049438477, -12.310044288635254, -10.831428527832031, -9.352811813354492, -7.8741960525512695, -6.3955841064453125, -4.91696834564209, -3.438352108001709, -1.9597358703613281, -0.48112010955810547, 0.9974956512451172, 2.4761123657226562, 3.954728126525879, 5.433343887329102, 6.911959648132324, 8.390575408935547, 9.869192123413086, 11.347807884216309, 12.826423645019531, 14.30504035949707, 15.783656120300293, 17.262271881103516, 18.740888595581055, 20.21950340270996, 21.6981201171875, 23.176734924316406, 24.655351638793945, 26.133968353271484, 27.61258316040039, 29.09119987487793, 30.56981658935547, 32.048431396484375, 33.52704620361328, 35.00566482543945, 36.48427963256836, 37.96289825439453, 39.44151306152344, 40.920127868652344]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 10.0, 10.0, 16.0, 14.0, 26.0, 33.0, 59.0, 77.0, 125.0, 179.0, 345.0, 6812.0, 4184434.0, 1352.0, 313.0, 157.0, 105.0, 71.0, 41.0, 23.0, 24.0, 13.0, 16.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.6875, -52.25, -50.8125, -49.375, -47.9375, -46.5, -45.0625, -43.625, -42.1875, -40.75, -39.3125, -37.875, -36.4375, -35.0, -33.5625, -32.125, -30.6875, -29.25, -27.8125, -26.375, -24.9375, -23.5, -22.0625, -20.625, -19.1875, -17.75, -16.3125, -14.875, -13.4375, -12.0, -10.5625, -9.125, -7.6875, -6.25, -4.8125, -3.375, -1.9375, -0.5, 0.9375, 2.375, 3.8125, 5.25, 6.6875, 8.125, 9.5625, 11.0, 12.4375, 13.875, 15.3125, 16.75, 18.1875, 19.625, 21.0625, 22.5, 23.9375, 25.375, 26.8125, 28.25, 29.6875, 31.125, 32.5625, 34.0, 35.4375, 36.875, 38.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 9.0, 13.0, 6.0, 16.0, 18.0, 22.0, 25.0, 23.0, 30.0, 36.0, 47.0, 48.0, 42.0, 44.0, 59.0, 58.0, 54.0, 46.0, 38.0, 42.0, 45.0, 44.0, 29.0, 44.0, 34.0, 24.0, 18.0, 21.0, 9.0, 10.0, 11.0, 9.0, 9.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.615234375, -2.53076171875, -2.4462890625, -2.36181640625, -2.27734375, -2.19287109375, -2.1083984375, -2.02392578125, -1.939453125, -1.85498046875, -1.7705078125, -1.68603515625, -1.6015625, -1.51708984375, -1.4326171875, -1.34814453125, -1.263671875, -1.17919921875, -1.0947265625, -1.01025390625, -0.92578125, -0.84130859375, -0.7568359375, -0.67236328125, -0.587890625, -0.50341796875, -0.4189453125, -0.33447265625, -0.25, -0.16552734375, -0.0810546875, 0.00341796875, 0.087890625, 0.17236328125, 0.2568359375, 0.34130859375, 0.42578125, 0.51025390625, 0.5947265625, 0.67919921875, 0.763671875, 0.84814453125, 0.9326171875, 1.01708984375, 1.1015625, 1.18603515625, 1.2705078125, 1.35498046875, 1.439453125, 1.52392578125, 1.6083984375, 1.69287109375, 1.77734375, 1.86181640625, 1.9462890625, 2.03076171875, 2.115234375, 2.19970703125, 2.2841796875, 2.36865234375, 2.453125, 2.53759765625, 2.6220703125, 2.70654296875, 2.791015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 13.0, 15.0, 21.0, 38.0, 56.0, 112.0, 190.0, 391.0, 835.0, 2101.0, 5517.0, 17864.0, 96261.0, 3035581.0, 966931.0, 49508.0, 11909.0, 4057.0, 1510.0, 647.0, 268.0, 165.0, 97.0, 56.0, 36.0, 30.0, 14.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.66461181640625, -7.4620361328125, -7.25946044921875, -7.056884765625, -6.85430908203125, -6.6517333984375, -6.44915771484375, -6.24658203125, -6.04400634765625, -5.8414306640625, -5.63885498046875, -5.436279296875, -5.23370361328125, -5.0311279296875, -4.82855224609375, -4.6259765625, -4.42340087890625, -4.2208251953125, -4.01824951171875, -3.815673828125, -3.61309814453125, -3.4105224609375, -3.20794677734375, -3.00537109375, -2.80279541015625, -2.6002197265625, -2.39764404296875, -2.195068359375, -1.99249267578125, -1.7899169921875, -1.58734130859375, -1.384765625, -1.18218994140625, -0.9796142578125, -0.77703857421875, -0.574462890625, -0.37188720703125, -0.1693115234375, 0.03326416015625, 0.23583984375, 0.43841552734375, 0.6409912109375, 0.84356689453125, 1.046142578125, 1.24871826171875, 1.4512939453125, 1.65386962890625, 1.8564453125, 2.05902099609375, 2.2615966796875, 2.46417236328125, 2.666748046875, 2.86932373046875, 3.0718994140625, 3.27447509765625, 3.47705078125, 3.67962646484375, 3.8822021484375, 4.08477783203125, 4.287353515625, 4.48992919921875, 4.6925048828125, 4.89508056640625, 5.09765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 1.0, 2.0, 6.0, 8.0, 6.0, 13.0, 21.0, 20.0, 37.0, 80.0, 112.0, 192.0, 456.0, 821.0, 1020.0, 592.0, 310.0, 140.0, 75.0, 48.0, 22.0, 21.0, 11.0, 10.0, 14.0, 6.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.921875, -4.74737548828125, -4.5728759765625, -4.39837646484375, -4.223876953125, -4.04937744140625, -3.8748779296875, -3.70037841796875, -3.52587890625, -3.35137939453125, -3.1768798828125, -3.00238037109375, -2.827880859375, -2.65338134765625, -2.4788818359375, -2.30438232421875, -2.1298828125, -1.95538330078125, -1.7808837890625, -1.60638427734375, -1.431884765625, -1.25738525390625, -1.0828857421875, -0.90838623046875, -0.73388671875, -0.55938720703125, -0.3848876953125, -0.21038818359375, -0.035888671875, 0.13861083984375, 0.3131103515625, 0.48760986328125, 0.662109375, 0.83660888671875, 1.0111083984375, 1.18560791015625, 1.360107421875, 1.53460693359375, 1.7091064453125, 1.88360595703125, 2.05810546875, 2.23260498046875, 2.4071044921875, 2.58160400390625, 2.756103515625, 2.93060302734375, 3.1051025390625, 3.27960205078125, 3.4541015625, 3.62860107421875, 3.8031005859375, 3.97760009765625, 4.152099609375, 4.32659912109375, 4.5010986328125, 4.67559814453125, 4.85009765625, 5.02459716796875, 5.1990966796875, 5.37359619140625, 5.548095703125, 5.72259521484375, 5.8970947265625, 6.07159423828125, 6.24609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 13.0, 44.0, 130.0, 225.0, 286.0, 143.0, 87.0, 32.0, 15.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.2436637878418, -32.90420913696289, -30.564754486083984, -28.225299835205078, -25.885845184326172, -23.546390533447266, -21.206933975219727, -18.86747932434082, -16.528024673461914, -14.188570022583008, -11.849115371704102, -9.509659767150879, -7.170205116271973, -4.830750465393066, -2.4912948608398438, -0.1518402099609375, 2.1876144409179688, 4.527069091796875, 6.8665242195129395, 9.205979347229004, 11.54543399810791, 13.884888648986816, 16.22434425354004, 18.563798904418945, 20.90325355529785, 23.242708206176758, 25.582162857055664, 27.921619415283203, 30.26107406616211, 32.600528717041016, 34.93998336791992, 37.27943801879883, 39.618896484375, 41.958351135253906, 44.29780578613281, 46.63726043701172, 48.976715087890625, 51.31616973876953, 53.65562438964844, 55.995079040527344, 58.33453369140625, 60.673988342285156, 63.01344299316406, 65.35289764404297, 67.69235229492188, 70.03180694580078, 72.37126159667969, 74.7107162475586, 77.0501708984375, 79.3896255493164, 81.72908020019531, 84.06853485107422, 86.40798950195312, 88.74744415283203, 91.08689880371094, 93.42635345458984, 95.76581573486328, 98.10527038574219, 100.4447250366211, 102.7841796875, 105.1236343383789, 107.46308898925781, 109.80254364013672, 112.14199829101562, 114.48145294189453]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 1.0, 8.0, 6.0, 9.0, 9.0, 12.0, 12.0, 13.0, 26.0, 31.0, 59.0, 40.0, 39.0, 55.0, 43.0, 48.0, 57.0, 52.0, 58.0, 54.0, 49.0, 37.0, 43.0, 34.0, 35.0, 26.0, 27.0, 17.0, 26.0, 21.0, 9.0, 13.0, 7.0, 5.0, 7.0, 8.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-24.977367401123047, -24.25897216796875, -23.540576934814453, -22.822181701660156, -22.10378646850586, -21.385393142700195, -20.6669979095459, -19.9486026763916, -19.230207443237305, -18.511812210083008, -17.79341697692871, -17.075021743774414, -16.35662841796875, -15.638232231140137, -14.919837951660156, -14.20144271850586, -13.483047485351562, -12.764652252197266, -12.046257019042969, -11.327862739562988, -10.609467506408691, -9.891072273254395, -9.172677993774414, -8.454282760620117, -7.73588752746582, -7.017492294311523, -6.299097537994385, -5.580702781677246, -4.862307548522949, -4.143912315368652, -3.4255175590515137, -2.707122802734375, -1.988729476928711, -1.2703344821929932, -0.5519394874572754, 0.16645550727844238, 0.8848505020141602, 1.603245496749878, 2.3216404914855957, 3.0400352478027344, 3.7584304809570312, 4.476825714111328, 5.195220470428467, 5.9136152267456055, 6.632010459899902, 7.350405693054199, 8.06879997253418, 8.787195205688477, 9.505590438842773, 10.22398567199707, 10.942380905151367, 11.660775184631348, 12.379170417785645, 13.097565650939941, 13.815959930419922, 14.534355163574219, 15.252750396728516, 15.971145629882812, 16.68954086303711, 17.407936096191406, 18.126331329345703, 18.844724655151367, 19.563119888305664, 20.28151512145996, 20.999910354614258]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 8.0, 8.0, 17.0, 23.0, 25.0, 57.0, 78.0, 156.0, 294.0, 481.0, 1090.0, 2575.0, 6275.0, 17068.0, 50231.0, 161874.0, 412124.0, 269055.0, 83432.0, 26944.0, 9864.0, 3870.0, 1568.0, 645.0, 333.0, 178.0, 105.0, 62.0, 31.0, 21.0, 23.0, 13.0, 4.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.857421875, -3.727630615234375, -3.59783935546875, -3.468048095703125, -3.3382568359375, -3.208465576171875, -3.07867431640625, -2.948883056640625, -2.819091796875, -2.689300537109375, -2.55950927734375, -2.429718017578125, -2.2999267578125, -2.170135498046875, -2.04034423828125, -1.910552978515625, -1.78076171875, -1.650970458984375, -1.52117919921875, -1.391387939453125, -1.2615966796875, -1.131805419921875, -1.00201416015625, -0.872222900390625, -0.742431640625, -0.612640380859375, -0.48284912109375, -0.353057861328125, -0.2232666015625, -0.093475341796875, 0.03631591796875, 0.166107177734375, 0.2958984375, 0.425689697265625, 0.55548095703125, 0.685272216796875, 0.8150634765625, 0.944854736328125, 1.07464599609375, 1.204437255859375, 1.334228515625, 1.464019775390625, 1.59381103515625, 1.723602294921875, 1.8533935546875, 1.983184814453125, 2.11297607421875, 2.242767333984375, 2.37255859375, 2.502349853515625, 2.63214111328125, 2.761932373046875, 2.8917236328125, 3.021514892578125, 3.15130615234375, 3.281097412109375, 3.410888671875, 3.540679931640625, 3.67047119140625, 3.800262451171875, 3.9300537109375, 4.059844970703125, 4.18963623046875, 4.319427490234375, 4.44921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 9.0, 10.0, 11.0, 16.0, 11.0, 22.0, 24.0, 30.0, 24.0, 33.0, 34.0, 44.0, 69.0, 45.0, 57.0, 46.0, 49.0, 57.0, 50.0, 50.0, 39.0, 35.0, 33.0, 41.0, 43.0, 29.0, 19.0, 15.0, 8.0, 12.0, 10.0, 12.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-3.353515625, -3.266448974609375, -3.17938232421875, -3.092315673828125, -3.0052490234375, -2.918182373046875, -2.83111572265625, -2.744049072265625, -2.656982421875, -2.569915771484375, -2.48284912109375, -2.395782470703125, -2.3087158203125, -2.221649169921875, -2.13458251953125, -2.047515869140625, -1.96044921875, -1.873382568359375, -1.78631591796875, -1.699249267578125, -1.6121826171875, -1.525115966796875, -1.43804931640625, -1.350982666015625, -1.263916015625, -1.176849365234375, -1.08978271484375, -1.002716064453125, -0.9156494140625, -0.828582763671875, -0.74151611328125, -0.654449462890625, -0.5673828125, -0.480316162109375, -0.39324951171875, -0.306182861328125, -0.2191162109375, -0.132049560546875, -0.04498291015625, 0.042083740234375, 0.129150390625, 0.216217041015625, 0.30328369140625, 0.390350341796875, 0.4774169921875, 0.564483642578125, 0.65155029296875, 0.738616943359375, 0.82568359375, 0.912750244140625, 0.99981689453125, 1.086883544921875, 1.1739501953125, 1.261016845703125, 1.34808349609375, 1.435150146484375, 1.522216796875, 1.609283447265625, 1.69635009765625, 1.783416748046875, 1.8704833984375, 1.957550048828125, 2.04461669921875, 2.131683349609375, 2.21875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 6.0, 2.0, 13.0, 13.0, 22.0, 18.0, 35.0, 53.0, 71.0, 100.0, 174.0, 247.0, 467.0, 979.0, 2483.0, 8440.0, 44083.0, 430017.0, 500953.0, 46721.0, 8812.0, 2574.0, 983.0, 491.0, 273.0, 158.0, 123.0, 73.0, 41.0, 29.0, 19.0, 17.0, 11.0, 7.0, 11.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.81640625, -7.572265625, -7.328125, -7.083984375, -6.83984375, -6.595703125, -6.3515625, -6.107421875, -5.86328125, -5.619140625, -5.375, -5.130859375, -4.88671875, -4.642578125, -4.3984375, -4.154296875, -3.91015625, -3.666015625, -3.421875, -3.177734375, -2.93359375, -2.689453125, -2.4453125, -2.201171875, -1.95703125, -1.712890625, -1.46875, -1.224609375, -0.98046875, -0.736328125, -0.4921875, -0.248046875, -0.00390625, 0.240234375, 0.484375, 0.728515625, 0.97265625, 1.216796875, 1.4609375, 1.705078125, 1.94921875, 2.193359375, 2.4375, 2.681640625, 2.92578125, 3.169921875, 3.4140625, 3.658203125, 3.90234375, 4.146484375, 4.390625, 4.634765625, 4.87890625, 5.123046875, 5.3671875, 5.611328125, 5.85546875, 6.099609375, 6.34375, 6.587890625, 6.83203125, 7.076171875, 7.3203125, 7.564453125, 7.80859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 4.0, 5.0, 9.0, 12.0, 7.0, 15.0, 10.0, 16.0, 16.0, 16.0, 22.0, 22.0, 33.0, 29.0, 30.0, 38.0, 34.0, 45.0, 37.0, 47.0, 39.0, 54.0, 39.0, 37.0, 38.0, 31.0, 42.0, 37.0, 37.0, 32.0, 24.0, 18.0, 22.0, 16.0, 15.0, 18.0, 4.0, 8.0, 8.0, 3.0, 9.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.21875, -7.9493408203125, -7.679931640625, -7.4105224609375, -7.14111328125, -6.8717041015625, -6.602294921875, -6.3328857421875, -6.0634765625, -5.7940673828125, -5.524658203125, -5.2552490234375, -4.98583984375, -4.7164306640625, -4.447021484375, -4.1776123046875, -3.908203125, -3.6387939453125, -3.369384765625, -3.0999755859375, -2.83056640625, -2.5611572265625, -2.291748046875, -2.0223388671875, -1.7529296875, -1.4835205078125, -1.214111328125, -0.9447021484375, -0.67529296875, -0.4058837890625, -0.136474609375, 0.1329345703125, 0.40234375, 0.6717529296875, 0.941162109375, 1.2105712890625, 1.47998046875, 1.7493896484375, 2.018798828125, 2.2882080078125, 2.5576171875, 2.8270263671875, 3.096435546875, 3.3658447265625, 3.63525390625, 3.9046630859375, 4.174072265625, 4.4434814453125, 4.712890625, 4.9822998046875, 5.251708984375, 5.5211181640625, 5.79052734375, 6.0599365234375, 6.329345703125, 6.5987548828125, 6.8681640625, 7.1375732421875, 7.406982421875, 7.6763916015625, 7.94580078125, 8.2152099609375, 8.484619140625, 8.7540283203125, 9.0234375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 5.0, 16.0, 31.0, 48.0, 98.0, 166.0, 388.0, 1406.0, 7587.0, 109759.0, 880399.0, 42788.0, 4335.0, 957.0, 264.0, 134.0, 68.0, 29.0, 25.0, 15.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.4566650390625, -6.257080078125, -6.0574951171875, -5.85791015625, -5.6583251953125, -5.458740234375, -5.2591552734375, -5.0595703125, -4.8599853515625, -4.660400390625, -4.4608154296875, -4.26123046875, -4.0616455078125, -3.862060546875, -3.6624755859375, -3.462890625, -3.2633056640625, -3.063720703125, -2.8641357421875, -2.66455078125, -2.4649658203125, -2.265380859375, -2.0657958984375, -1.8662109375, -1.6666259765625, -1.467041015625, -1.2674560546875, -1.06787109375, -0.8682861328125, -0.668701171875, -0.4691162109375, -0.26953125, -0.0699462890625, 0.129638671875, 0.3292236328125, 0.52880859375, 0.7283935546875, 0.927978515625, 1.1275634765625, 1.3271484375, 1.5267333984375, 1.726318359375, 1.9259033203125, 2.12548828125, 2.3250732421875, 2.524658203125, 2.7242431640625, 2.923828125, 3.1234130859375, 3.322998046875, 3.5225830078125, 3.72216796875, 3.9217529296875, 4.121337890625, 4.3209228515625, 4.5205078125, 4.7200927734375, 4.919677734375, 5.1192626953125, 5.31884765625, 5.5184326171875, 5.718017578125, 5.9176025390625, 6.1171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 0.0, 6.0, 1.0, 6.0, 7.0, 11.0, 6.0, 13.0, 15.0, 22.0, 30.0, 40.0, 55.0, 101.0, 128.0, 132.0, 104.0, 95.0, 48.0, 40.0, 27.0, 25.0, 21.0, 9.0, 7.0, 6.0, 6.0, 9.0, 6.0, 6.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.0009112358093261719, -0.0008887350559234619, -0.000866234302520752, -0.000843733549118042, -0.000821232795715332, -0.0007987320423126221, -0.0007762312889099121, -0.0007537305355072021, -0.0007312297821044922, -0.0007087290287017822, -0.0006862282752990723, -0.0006637275218963623, -0.0006412267684936523, -0.0006187260150909424, -0.0005962252616882324, -0.0005737245082855225, -0.0005512237548828125, -0.0005287230014801025, -0.0005062222480773926, -0.0004837214946746826, -0.00046122074127197266, -0.0004387199878692627, -0.00041621923446655273, -0.0003937184810638428, -0.0003712177276611328, -0.00034871697425842285, -0.0003262162208557129, -0.00030371546745300293, -0.00028121471405029297, -0.000258713960647583, -0.00023621320724487305, -0.00021371245384216309, -0.00019121170043945312, -0.00016871094703674316, -0.0001462101936340332, -0.00012370944023132324, -0.00010120868682861328, -7.870793342590332e-05, -5.620718002319336e-05, -3.37064266204834e-05, -1.1205673217773438e-05, 1.1295080184936523e-05, 3.3795833587646484e-05, 5.6296586990356445e-05, 7.87973403930664e-05, 0.00010129809379577637, 0.00012379884719848633, 0.0001462996006011963, 0.00016880035400390625, 0.0001913011074066162, 0.00021380186080932617, 0.00023630261421203613, 0.0002588033676147461, 0.00028130412101745605, 0.000303804874420166, 0.000326305627822876, 0.00034880638122558594, 0.0003713071346282959, 0.00039380788803100586, 0.0004163086414337158, 0.0004388093948364258, 0.00046131014823913574, 0.0004838109016418457, 0.0005063116550445557, 0.0005288124084472656]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 7.0, 16.0, 21.0, 53.0, 83.0, 156.0, 340.0, 892.0, 2181.0, 8556.0, 57094.0, 739717.0, 212423.0, 20523.0, 4160.0, 1316.0, 496.0, 247.0, 115.0, 54.0, 26.0, 24.0, 20.0, 11.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.104248046875, -5.95068359375, -5.797119140625, -5.6435546875, -5.489990234375, -5.33642578125, -5.182861328125, -5.029296875, -4.875732421875, -4.72216796875, -4.568603515625, -4.4150390625, -4.261474609375, -4.10791015625, -3.954345703125, -3.80078125, -3.647216796875, -3.49365234375, -3.340087890625, -3.1865234375, -3.032958984375, -2.87939453125, -2.725830078125, -2.572265625, -2.418701171875, -2.26513671875, -2.111572265625, -1.9580078125, -1.804443359375, -1.65087890625, -1.497314453125, -1.34375, -1.190185546875, -1.03662109375, -0.883056640625, -0.7294921875, -0.575927734375, -0.42236328125, -0.268798828125, -0.115234375, 0.038330078125, 0.19189453125, 0.345458984375, 0.4990234375, 0.652587890625, 0.80615234375, 0.959716796875, 1.11328125, 1.266845703125, 1.42041015625, 1.573974609375, 1.7275390625, 1.881103515625, 2.03466796875, 2.188232421875, 2.341796875, 2.495361328125, 2.64892578125, 2.802490234375, 2.9560546875, 3.109619140625, 3.26318359375, 3.416748046875, 3.5703125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 8.0, 12.0, 14.0, 13.0, 33.0, 47.0, 67.0, 101.0, 121.0, 126.0, 131.0, 106.0, 65.0, 45.0, 27.0, 18.0, 12.0, 10.0, 7.0, 3.0, 6.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.07305908203125, -2.9429931640625, -2.81292724609375, -2.682861328125, -2.55279541015625, -2.4227294921875, -2.29266357421875, -2.16259765625, -2.03253173828125, -1.9024658203125, -1.77239990234375, -1.642333984375, -1.51226806640625, -1.3822021484375, -1.25213623046875, -1.1220703125, -0.99200439453125, -0.8619384765625, -0.73187255859375, -0.601806640625, -0.47174072265625, -0.3416748046875, -0.21160888671875, -0.08154296875, 0.04852294921875, 0.1785888671875, 0.30865478515625, 0.438720703125, 0.56878662109375, 0.6988525390625, 0.82891845703125, 0.958984375, 1.08905029296875, 1.2191162109375, 1.34918212890625, 1.479248046875, 1.60931396484375, 1.7393798828125, 1.86944580078125, 1.99951171875, 2.12957763671875, 2.2596435546875, 2.38970947265625, 2.519775390625, 2.64984130859375, 2.7799072265625, 2.90997314453125, 3.0400390625, 3.17010498046875, 3.3001708984375, 3.43023681640625, 3.560302734375, 3.69036865234375, 3.8204345703125, 3.95050048828125, 4.08056640625, 4.21063232421875, 4.3406982421875, 4.47076416015625, 4.600830078125, 4.73089599609375, 4.8609619140625, 4.99102783203125, 5.12109375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 12.0, 22.0, 56.0, 226.0, 413.0, 201.0, 42.0, 12.0, 9.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.74073028564453, -106.98514556884766, -103.22956085205078, -99.4739761352539, -95.71839904785156, -91.96281433105469, -88.20722961425781, -84.45164489746094, -80.69606018066406, -76.94047546386719, -73.18489074707031, -69.42930603027344, -65.67372131347656, -61.91814041137695, -58.162559509277344, -54.40697479248047, -50.651390075683594, -46.89580535888672, -43.140220642089844, -39.384639739990234, -35.62905502319336, -31.873470306396484, -28.117887496948242, -24.3623046875, -20.606719970703125, -16.85113525390625, -13.095552444458008, -9.33996868133545, -5.584384918212891, -1.8288002014160156, 1.9267826080322266, 5.682365417480469, 9.437942504882812, 13.193526268005371, 16.94911003112793, 20.704692840576172, 24.460277557373047, 28.215862274169922, 31.971445083618164, 35.727027893066406, 39.48261260986328, 43.238197326660156, 46.99378204345703, 50.74936294555664, 54.504947662353516, 58.26053237915039, 62.01611328125, 65.77169799804688, 69.52728271484375, 73.28286743164062, 77.0384521484375, 80.79403686523438, 84.54962158203125, 88.30520629882812, 92.06078338623047, 95.81636810302734, 99.57195281982422, 103.3275375366211, 107.08312225341797, 110.83870697021484, 114.59428405761719, 118.34986877441406, 122.10545349121094, 125.86103820800781, 129.6166229248047]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 10.0, 14.0, 10.0, 19.0, 30.0, 18.0, 28.0, 26.0, 40.0, 42.0, 62.0, 52.0, 57.0, 91.0, 67.0, 67.0, 59.0, 47.0, 37.0, 39.0, 36.0, 22.0, 27.0, 13.0, 20.0, 14.0, 13.0, 7.0, 7.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.8134651184082, -55.364013671875, -53.9145622253418, -52.465110778808594, -51.015655517578125, -49.56620407104492, -48.11675262451172, -46.667301177978516, -45.21784973144531, -43.76839828491211, -42.318946838378906, -40.86949157714844, -39.420040130615234, -37.97058868408203, -36.52113723754883, -35.071685791015625, -33.622230529785156, -32.17277908325195, -30.723325729370117, -29.273874282836914, -27.824420928955078, -26.374969482421875, -24.925518035888672, -23.47606658935547, -22.026613235473633, -20.57716178894043, -19.127708435058594, -17.67825698852539, -16.228805541992188, -14.779352188110352, -13.329900741577148, -11.880448341369629, -10.430999755859375, -8.981547355651855, -7.532095432281494, -6.082643508911133, -4.633191108703613, -3.1837387084960938, -1.7342872619628906, -0.2848348617553711, 1.1646175384521484, 2.614069700241089, 4.063521862030029, 5.512973785400391, 6.96242618560791, 8.41187858581543, 9.861330032348633, 11.310782432556152, 12.760234832763672, 14.209687232971191, 15.659139633178711, 17.108591079711914, 18.55804443359375, 20.007495880126953, 21.456947326660156, 22.90639877319336, 24.355852127075195, 25.8053035736084, 27.254756927490234, 28.704208374023438, 30.15365982055664, 31.603113174438477, 33.05256652832031, 34.502017974853516, 35.95146942138672]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 8.0, 14.0, 26.0, 22.0, 26.0, 53.0, 76.0, 107.0, 154.0, 269.0, 408.0, 693.0, 1174.0, 2205.0, 4672.0, 11194.0, 33259.0, 197803.0, 2508319.0, 1292911.0, 101416.0, 23142.0, 8322.0, 3659.0, 1776.0, 996.0, 571.0, 323.0, 195.0, 138.0, 108.0, 82.0, 49.0, 30.0, 28.0, 17.0, 5.0, 9.0, 6.0, 3.0, 3.0, 7.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.52734375, -3.390869140625, -3.25439453125, -3.117919921875, -2.9814453125, -2.844970703125, -2.70849609375, -2.572021484375, -2.435546875, -2.299072265625, -2.16259765625, -2.026123046875, -1.8896484375, -1.753173828125, -1.61669921875, -1.480224609375, -1.34375, -1.207275390625, -1.07080078125, -0.934326171875, -0.7978515625, -0.661376953125, -0.52490234375, -0.388427734375, -0.251953125, -0.115478515625, 0.02099609375, 0.157470703125, 0.2939453125, 0.430419921875, 0.56689453125, 0.703369140625, 0.83984375, 0.976318359375, 1.11279296875, 1.249267578125, 1.3857421875, 1.522216796875, 1.65869140625, 1.795166015625, 1.931640625, 2.068115234375, 2.20458984375, 2.341064453125, 2.4775390625, 2.614013671875, 2.75048828125, 2.886962890625, 3.0234375, 3.159912109375, 3.29638671875, 3.432861328125, 3.5693359375, 3.705810546875, 3.84228515625, 3.978759765625, 4.115234375, 4.251708984375, 4.38818359375, 4.524658203125, 4.6611328125, 4.797607421875, 4.93408203125, 5.070556640625, 5.20703125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 18.0, 13.0, 11.0, 19.0, 28.0, 35.0, 46.0, 48.0, 33.0, 44.0, 41.0, 58.0, 43.0, 51.0, 58.0, 54.0, 54.0, 46.0, 37.0, 44.0, 33.0, 28.0, 24.0, 18.0, 15.0, 15.0, 14.0, 9.0, 10.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.603515625, -2.525848388671875, -2.44818115234375, -2.370513916015625, -2.2928466796875, -2.215179443359375, -2.13751220703125, -2.059844970703125, -1.982177734375, -1.904510498046875, -1.82684326171875, -1.749176025390625, -1.6715087890625, -1.593841552734375, -1.51617431640625, -1.438507080078125, -1.36083984375, -1.283172607421875, -1.20550537109375, -1.127838134765625, -1.0501708984375, -0.972503662109375, -0.89483642578125, -0.817169189453125, -0.739501953125, -0.661834716796875, -0.58416748046875, -0.506500244140625, -0.4288330078125, -0.351165771484375, -0.27349853515625, -0.195831298828125, -0.1181640625, -0.040496826171875, 0.03717041015625, 0.114837646484375, 0.1925048828125, 0.270172119140625, 0.34783935546875, 0.425506591796875, 0.503173828125, 0.580841064453125, 0.65850830078125, 0.736175537109375, 0.8138427734375, 0.891510009765625, 0.96917724609375, 1.046844482421875, 1.12451171875, 1.202178955078125, 1.27984619140625, 1.357513427734375, 1.4351806640625, 1.512847900390625, 1.59051513671875, 1.668182373046875, 1.745849609375, 1.823516845703125, 1.90118408203125, 1.978851318359375, 2.0565185546875, 2.134185791015625, 2.21185302734375, 2.289520263671875, 2.3671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 3.0, 11.0, 12.0, 9.0, 15.0, 17.0, 30.0, 32.0, 48.0, 82.0, 128.0, 179.0, 353.0, 659.0, 1151.0, 2744.0, 7011.0, 19329.0, 65251.0, 513275.0, 3239207.0, 273162.0, 47123.0, 14607.0, 5497.0, 2161.0, 998.0, 463.0, 271.0, 150.0, 102.0, 67.0, 44.0, 27.0, 20.0, 11.0, 7.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.421875, -5.2491455078125, -5.076416015625, -4.9036865234375, -4.73095703125, -4.5582275390625, -4.385498046875, -4.2127685546875, -4.0400390625, -3.8673095703125, -3.694580078125, -3.5218505859375, -3.34912109375, -3.1763916015625, -3.003662109375, -2.8309326171875, -2.658203125, -2.4854736328125, -2.312744140625, -2.1400146484375, -1.96728515625, -1.7945556640625, -1.621826171875, -1.4490966796875, -1.2763671875, -1.1036376953125, -0.930908203125, -0.7581787109375, -0.58544921875, -0.4127197265625, -0.239990234375, -0.0672607421875, 0.10546875, 0.2781982421875, 0.450927734375, 0.6236572265625, 0.79638671875, 0.9691162109375, 1.141845703125, 1.3145751953125, 1.4873046875, 1.6600341796875, 1.832763671875, 2.0054931640625, 2.17822265625, 2.3509521484375, 2.523681640625, 2.6964111328125, 2.869140625, 3.0418701171875, 3.214599609375, 3.3873291015625, 3.56005859375, 3.7327880859375, 3.905517578125, 4.0782470703125, 4.2509765625, 4.4237060546875, 4.596435546875, 4.7691650390625, 4.94189453125, 5.1146240234375, 5.287353515625, 5.4600830078125, 5.6328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 8.0, 6.0, 9.0, 12.0, 19.0, 36.0, 34.0, 64.0, 100.0, 162.0, 313.0, 609.0, 954.0, 821.0, 395.0, 198.0, 117.0, 63.0, 39.0, 32.0, 11.0, 16.0, 12.0, 9.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.8828125, -9.65118408203125, -9.4195556640625, -9.18792724609375, -8.956298828125, -8.72467041015625, -8.4930419921875, -8.26141357421875, -8.02978515625, -7.79815673828125, -7.5665283203125, -7.33489990234375, -7.103271484375, -6.87164306640625, -6.6400146484375, -6.40838623046875, -6.1767578125, -5.94512939453125, -5.7135009765625, -5.48187255859375, -5.250244140625, -5.01861572265625, -4.7869873046875, -4.55535888671875, -4.32373046875, -4.09210205078125, -3.8604736328125, -3.62884521484375, -3.397216796875, -3.16558837890625, -2.9339599609375, -2.70233154296875, -2.470703125, -2.23907470703125, -2.0074462890625, -1.77581787109375, -1.544189453125, -1.31256103515625, -1.0809326171875, -0.84930419921875, -0.61767578125, -0.38604736328125, -0.1544189453125, 0.07720947265625, 0.308837890625, 0.54046630859375, 0.7720947265625, 1.00372314453125, 1.2353515625, 1.46697998046875, 1.6986083984375, 1.93023681640625, 2.161865234375, 2.39349365234375, 2.6251220703125, 2.85675048828125, 3.08837890625, 3.32000732421875, 3.5516357421875, 3.78326416015625, 4.014892578125, 4.24652099609375, 4.4781494140625, 4.70977783203125, 4.94140625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 11.0, 14.0, 24.0, 56.0, 104.0, 137.0, 178.0, 141.0, 108.0, 78.0, 58.0, 30.0, 19.0, 11.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-35.2314453125, -33.53607940673828, -31.840709686279297, -30.145343780517578, -28.449975967407227, -26.754608154296875, -25.059240341186523, -23.363872528076172, -21.668506622314453, -19.9731388092041, -18.27777099609375, -16.58240509033203, -14.88703727722168, -13.191669464111328, -11.496301651000977, -9.800934791564941, -8.105566024780273, -6.41019868850708, -4.714831352233887, -3.019463539123535, -1.3240962028503418, 0.37127113342285156, 2.066638946533203, 3.7620058059692383, 5.45737361907959, 7.152740955352783, 8.848108291625977, 10.543476104736328, 12.23884391784668, 13.934210777282715, 15.629578590393066, 17.3249454498291, 19.020313262939453, 20.715681076049805, 22.411048889160156, 24.106414794921875, 25.801782608032227, 27.497150421142578, 29.19251823425293, 30.88788604736328, 32.583251953125, 34.27861785888672, 35.9739875793457, 37.66935348510742, 39.364723205566406, 41.060089111328125, 42.755455017089844, 44.45082473754883, 46.14619445800781, 47.84156036376953, 49.536930084228516, 51.232295989990234, 52.92766571044922, 54.62303161621094, 56.318397521972656, 58.01376724243164, 59.70913314819336, 61.40449905395508, 63.09986877441406, 64.79523468017578, 66.4906005859375, 68.18597412109375, 69.88134002685547, 71.57670593261719, 73.2720718383789]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 11.0, 13.0, 17.0, 14.0, 17.0, 15.0, 27.0, 26.0, 23.0, 34.0, 41.0, 32.0, 36.0, 46.0, 52.0, 47.0, 47.0, 49.0, 46.0, 24.0, 40.0, 44.0, 31.0, 26.0, 30.0, 32.0, 14.0, 27.0, 20.0, 15.0, 18.0, 9.0, 15.0, 6.0, 6.0, 6.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.16159439086914, -25.33700942993164, -24.51242446899414, -23.68783950805664, -22.86325454711914, -22.03866958618164, -21.21408462524414, -20.38949966430664, -19.56491470336914, -18.74032974243164, -17.91574478149414, -17.09115982055664, -16.26657485961914, -15.44198989868164, -14.617405891418457, -13.792820930480957, -12.968236923217773, -12.143651962280273, -11.319067001342773, -10.494482040405273, -9.669897079467773, -8.845312118530273, -8.02072811126709, -7.19614315032959, -6.37155818939209, -5.54697322845459, -4.72238826751709, -3.897803783416748, -3.073218822479248, -2.248633861541748, -1.4240493774414062, -0.5994644165039062, 0.22512054443359375, 1.0497053861618042, 1.8742902278900146, 2.6988749504089355, 3.5234599113464355, 4.3480448722839355, 5.172629356384277, 5.997214317321777, 6.821799278259277, 7.646384239196777, 8.470969200134277, 9.295553207397461, 10.120138168334961, 10.944723129272461, 11.769308090209961, 12.593893051147461, 13.418478012084961, 14.243062973022461, 15.067647933959961, 15.892232894897461, 16.71681785583496, 17.54140281677246, 18.365985870361328, 19.190570831298828, 20.015155792236328, 20.839740753173828, 21.664325714111328, 22.488910675048828, 23.313495635986328, 24.138080596923828, 24.962665557861328, 25.787250518798828, 26.611835479736328]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 5.0, 10.0, 26.0, 42.0, 52.0, 71.0, 163.0, 295.0, 565.0, 1298.0, 3198.0, 8523.0, 26031.0, 91668.0, 325635.0, 408963.0, 128146.0, 35529.0, 11219.0, 3985.0, 1628.0, 717.0, 354.0, 160.0, 83.0, 74.0, 39.0, 23.0, 11.0, 13.0, 7.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.7459716796875, -4.593505859375, -4.4410400390625, -4.28857421875, -4.1361083984375, -3.983642578125, -3.8311767578125, -3.6787109375, -3.5262451171875, -3.373779296875, -3.2213134765625, -3.06884765625, -2.9163818359375, -2.763916015625, -2.6114501953125, -2.458984375, -2.3065185546875, -2.154052734375, -2.0015869140625, -1.84912109375, -1.6966552734375, -1.544189453125, -1.3917236328125, -1.2392578125, -1.0867919921875, -0.934326171875, -0.7818603515625, -0.62939453125, -0.4769287109375, -0.324462890625, -0.1719970703125, -0.01953125, 0.1329345703125, 0.285400390625, 0.4378662109375, 0.59033203125, 0.7427978515625, 0.895263671875, 1.0477294921875, 1.2001953125, 1.3526611328125, 1.505126953125, 1.6575927734375, 1.81005859375, 1.9625244140625, 2.114990234375, 2.2674560546875, 2.419921875, 2.5723876953125, 2.724853515625, 2.8773193359375, 3.02978515625, 3.1822509765625, 3.334716796875, 3.4871826171875, 3.6396484375, 3.7921142578125, 3.944580078125, 4.0970458984375, 4.24951171875, 4.4019775390625, 4.554443359375, 4.7069091796875, 4.859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 1.0, 11.0, 9.0, 12.0, 11.0, 9.0, 16.0, 13.0, 21.0, 27.0, 28.0, 46.0, 41.0, 42.0, 52.0, 40.0, 44.0, 60.0, 48.0, 56.0, 51.0, 36.0, 34.0, 53.0, 40.0, 27.0, 31.0, 27.0, 22.0, 14.0, 16.0, 9.0, 9.0, 11.0, 6.0, 5.0, 5.0, 3.0, 3.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.39453125, -2.32275390625, -2.2509765625, -2.17919921875, -2.107421875, -2.03564453125, -1.9638671875, -1.89208984375, -1.8203125, -1.74853515625, -1.6767578125, -1.60498046875, -1.533203125, -1.46142578125, -1.3896484375, -1.31787109375, -1.24609375, -1.17431640625, -1.1025390625, -1.03076171875, -0.958984375, -0.88720703125, -0.8154296875, -0.74365234375, -0.671875, -0.60009765625, -0.5283203125, -0.45654296875, -0.384765625, -0.31298828125, -0.2412109375, -0.16943359375, -0.09765625, -0.02587890625, 0.0458984375, 0.11767578125, 0.189453125, 0.26123046875, 0.3330078125, 0.40478515625, 0.4765625, 0.54833984375, 0.6201171875, 0.69189453125, 0.763671875, 0.83544921875, 0.9072265625, 0.97900390625, 1.05078125, 1.12255859375, 1.1943359375, 1.26611328125, 1.337890625, 1.40966796875, 1.4814453125, 1.55322265625, 1.625, 1.69677734375, 1.7685546875, 1.84033203125, 1.912109375, 1.98388671875, 2.0556640625, 2.12744140625, 2.19921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 35.0, 53.0, 79.0, 131.0, 209.0, 420.0, 914.0, 2100.0, 7230.0, 63386.0, 860239.0, 100150.0, 9124.0, 2421.0, 1012.0, 443.0, 253.0, 119.0, 95.0, 35.0, 28.0, 19.0, 16.0, 12.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.375, -12.9990234375, -12.623046875, -12.2470703125, -11.87109375, -11.4951171875, -11.119140625, -10.7431640625, -10.3671875, -9.9912109375, -9.615234375, -9.2392578125, -8.86328125, -8.4873046875, -8.111328125, -7.7353515625, -7.359375, -6.9833984375, -6.607421875, -6.2314453125, -5.85546875, -5.4794921875, -5.103515625, -4.7275390625, -4.3515625, -3.9755859375, -3.599609375, -3.2236328125, -2.84765625, -2.4716796875, -2.095703125, -1.7197265625, -1.34375, -0.9677734375, -0.591796875, -0.2158203125, 0.16015625, 0.5361328125, 0.912109375, 1.2880859375, 1.6640625, 2.0400390625, 2.416015625, 2.7919921875, 3.16796875, 3.5439453125, 3.919921875, 4.2958984375, 4.671875, 5.0478515625, 5.423828125, 5.7998046875, 6.17578125, 6.5517578125, 6.927734375, 7.3037109375, 7.6796875, 8.0556640625, 8.431640625, 8.8076171875, 9.18359375, 9.5595703125, 9.935546875, 10.3115234375, 10.6875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 19.0, 15.0, 14.0, 21.0, 34.0, 29.0, 34.0, 27.0, 46.0, 39.0, 41.0, 51.0, 58.0, 66.0, 60.0, 51.0, 53.0, 60.0, 43.0, 37.0, 34.0, 31.0, 27.0, 14.0, 16.0, 11.0, 12.0, 8.0, 13.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.125, -10.7811279296875, -10.437255859375, -10.0933837890625, -9.74951171875, -9.4056396484375, -9.061767578125, -8.7178955078125, -8.3740234375, -8.0301513671875, -7.686279296875, -7.3424072265625, -6.99853515625, -6.6546630859375, -6.310791015625, -5.9669189453125, -5.623046875, -5.2791748046875, -4.935302734375, -4.5914306640625, -4.24755859375, -3.9036865234375, -3.559814453125, -3.2159423828125, -2.8720703125, -2.5281982421875, -2.184326171875, -1.8404541015625, -1.49658203125, -1.1527099609375, -0.808837890625, -0.4649658203125, -0.12109375, 0.2227783203125, 0.566650390625, 0.9105224609375, 1.25439453125, 1.5982666015625, 1.942138671875, 2.2860107421875, 2.6298828125, 2.9737548828125, 3.317626953125, 3.6614990234375, 4.00537109375, 4.3492431640625, 4.693115234375, 5.0369873046875, 5.380859375, 5.7247314453125, 6.068603515625, 6.4124755859375, 6.75634765625, 7.1002197265625, 7.444091796875, 7.7879638671875, 8.1318359375, 8.4757080078125, 8.819580078125, 9.1634521484375, 9.50732421875, 9.8511962890625, 10.195068359375, 10.5389404296875, 10.8828125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 5.0, 10.0, 19.0, 18.0, 30.0, 50.0, 62.0, 81.0, 112.0, 229.0, 288.0, 629.0, 1257.0, 3246.0, 10783.0, 53748.0, 567155.0, 350893.0, 45009.0, 9401.0, 2915.0, 1190.0, 569.0, 298.0, 162.0, 123.0, 78.0, 55.0, 41.0, 28.0, 19.0, 14.0, 8.0, 11.0, 8.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -3.148773193359375, -3.04364013671875, -2.938507080078125, -2.8333740234375, -2.728240966796875, -2.62310791015625, -2.517974853515625, -2.412841796875, -2.307708740234375, -2.20257568359375, -2.097442626953125, -1.9923095703125, -1.887176513671875, -1.78204345703125, -1.676910400390625, -1.57177734375, -1.466644287109375, -1.36151123046875, -1.256378173828125, -1.1512451171875, -1.046112060546875, -0.94097900390625, -0.835845947265625, -0.730712890625, -0.625579833984375, -0.52044677734375, -0.415313720703125, -0.3101806640625, -0.205047607421875, -0.09991455078125, 0.005218505859375, 0.1103515625, 0.215484619140625, 0.32061767578125, 0.425750732421875, 0.5308837890625, 0.636016845703125, 0.74114990234375, 0.846282958984375, 0.951416015625, 1.056549072265625, 1.16168212890625, 1.266815185546875, 1.3719482421875, 1.477081298828125, 1.58221435546875, 1.687347412109375, 1.79248046875, 1.897613525390625, 2.00274658203125, 2.107879638671875, 2.2130126953125, 2.318145751953125, 2.42327880859375, 2.528411865234375, 2.633544921875, 2.738677978515625, 2.84381103515625, 2.948944091796875, 3.0540771484375, 3.159210205078125, 3.26434326171875, 3.369476318359375, 3.474609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 14.0, 17.0, 7.0, 15.0, 16.0, 19.0, 33.0, 40.0, 40.0, 55.0, 62.0, 77.0, 113.0, 96.0, 70.0, 57.0, 39.0, 39.0, 26.0, 29.0, 26.0, 15.0, 25.0, 12.0, 9.0, 13.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006761550903320312, -0.0006541907787322998, -0.0006322264671325684, -0.0006102621555328369, -0.0005882978439331055, -0.000566333532333374, -0.0005443692207336426, -0.0005224049091339111, -0.0005004405975341797, -0.00047847628593444824, -0.0004565119743347168, -0.00043454766273498535, -0.0004125833511352539, -0.00039061903953552246, -0.000368654727935791, -0.00034669041633605957, -0.0003247261047363281, -0.0003027617931365967, -0.00028079748153686523, -0.0002588331699371338, -0.00023686885833740234, -0.0002149045467376709, -0.00019294023513793945, -0.000170975923538208, -0.00014901161193847656, -0.00012704730033874512, -0.00010508298873901367, -8.311867713928223e-05, -6.115436553955078e-05, -3.9190053939819336e-05, -1.722574234008789e-05, 4.738569259643555e-06, 2.6702880859375e-05, 4.8667192459106445e-05, 7.063150405883789e-05, 9.259581565856934e-05, 0.00011456012725830078, 0.00013652443885803223, 0.00015848875045776367, 0.00018045306205749512, 0.00020241737365722656, 0.000224381685256958, 0.00024634599685668945, 0.0002683103084564209, 0.00029027462005615234, 0.0003122389316558838, 0.00033420324325561523, 0.0003561675548553467, 0.0003781318664550781, 0.00040009617805480957, 0.000422060489654541, 0.00044402480125427246, 0.0004659891128540039, 0.00048795342445373535, 0.0005099177360534668, 0.0005318820476531982, 0.0005538463592529297, 0.0005758106708526611, 0.0005977749824523926, 0.000619739294052124, 0.0006417036056518555, 0.0006636679172515869, 0.0006856322288513184, 0.0007075965404510498, 0.0007295608520507812]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 17.0, 19.0, 23.0, 38.0, 45.0, 64.0, 121.0, 188.0, 331.0, 634.0, 1321.0, 3157.0, 8755.0, 36321.0, 387565.0, 554338.0, 39840.0, 9512.0, 3387.0, 1315.0, 670.0, 331.0, 206.0, 108.0, 71.0, 45.0, 33.0, 18.0, 14.0, 15.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.20751953125, -4.0673828125, -3.92724609375, -3.787109375, -3.64697265625, -3.5068359375, -3.36669921875, -3.2265625, -3.08642578125, -2.9462890625, -2.80615234375, -2.666015625, -2.52587890625, -2.3857421875, -2.24560546875, -2.10546875, -1.96533203125, -1.8251953125, -1.68505859375, -1.544921875, -1.40478515625, -1.2646484375, -1.12451171875, -0.984375, -0.84423828125, -0.7041015625, -0.56396484375, -0.423828125, -0.28369140625, -0.1435546875, -0.00341796875, 0.13671875, 0.27685546875, 0.4169921875, 0.55712890625, 0.697265625, 0.83740234375, 0.9775390625, 1.11767578125, 1.2578125, 1.39794921875, 1.5380859375, 1.67822265625, 1.818359375, 1.95849609375, 2.0986328125, 2.23876953125, 2.37890625, 2.51904296875, 2.6591796875, 2.79931640625, 2.939453125, 3.07958984375, 3.2197265625, 3.35986328125, 3.5, 3.64013671875, 3.7802734375, 3.92041015625, 4.060546875, 4.20068359375, 4.3408203125, 4.48095703125, 4.62109375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 3.0, 0.0, 8.0, 9.0, 11.0, 21.0, 39.0, 35.0, 44.0, 79.0, 132.0, 150.0, 123.0, 108.0, 88.0, 41.0, 35.0, 24.0, 12.0, 5.0, 3.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.187591552734375, -5.04315185546875, -4.898712158203125, -4.7542724609375, -4.609832763671875, -4.46539306640625, -4.320953369140625, -4.176513671875, -4.032073974609375, -3.88763427734375, -3.743194580078125, -3.5987548828125, -3.454315185546875, -3.30987548828125, -3.165435791015625, -3.02099609375, -2.876556396484375, -2.73211669921875, -2.587677001953125, -2.4432373046875, -2.298797607421875, -2.15435791015625, -2.009918212890625, -1.865478515625, -1.721038818359375, -1.57659912109375, -1.432159423828125, -1.2877197265625, -1.143280029296875, -0.99884033203125, -0.854400634765625, -0.7099609375, -0.565521240234375, -0.42108154296875, -0.276641845703125, -0.1322021484375, 0.012237548828125, 0.15667724609375, 0.301116943359375, 0.445556640625, 0.589996337890625, 0.73443603515625, 0.878875732421875, 1.0233154296875, 1.167755126953125, 1.31219482421875, 1.456634521484375, 1.60107421875, 1.745513916015625, 1.88995361328125, 2.034393310546875, 2.1788330078125, 2.323272705078125, 2.46771240234375, 2.612152099609375, 2.756591796875, 2.901031494140625, 3.04547119140625, 3.189910888671875, 3.3343505859375, 3.478790283203125, 3.62322998046875, 3.767669677734375, 3.912109375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 39.0, 50.0, 129.0, 251.0, 249.0, 132.0, 59.0, 32.0, 8.0, 6.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.35801696777344, -82.98989868164062, -80.62177276611328, -78.25365447998047, -75.88552856445312, -73.51741027832031, -71.14928436279297, -68.78116607666016, -66.41304016113281, -64.044921875, -61.676795959472656, -59.30867385864258, -56.9405517578125, -54.57243347167969, -52.20431137084961, -49.83618927001953, -47.46807098388672, -45.09994888305664, -42.73182678222656, -40.363704681396484, -37.995582580566406, -35.627464294433594, -33.259342193603516, -30.891220092773438, -28.52309799194336, -26.15497589111328, -23.786853790283203, -21.418733596801758, -19.05061149597168, -16.6824893951416, -14.31436824798584, -11.946247100830078, -9.578125, -7.21000337600708, -4.84188175201416, -2.4737601280212402, -0.10563850402832031, 2.262483596801758, 4.6306047439575195, 6.998725891113281, 9.36684799194336, 11.734970092773438, 14.1030912399292, 16.47121238708496, 18.83933448791504, 21.207456588745117, 23.575576782226562, 25.94369888305664, 28.31182098388672, 30.679943084716797, 33.048065185546875, 35.41618728637695, 37.78430938720703, 40.152427673339844, 42.52054977416992, 44.888671875, 47.25679397583008, 49.624916076660156, 51.993038177490234, 54.36116027832031, 56.729278564453125, 59.09740447998047, 61.46552276611328, 63.83364486694336, 66.20176696777344]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 6.0, 7.0, 12.0, 13.0, 13.0, 16.0, 12.0, 18.0, 26.0, 20.0, 26.0, 33.0, 39.0, 48.0, 51.0, 60.0, 66.0, 57.0, 58.0, 47.0, 43.0, 49.0, 32.0, 20.0, 35.0, 34.0, 22.0, 15.0, 21.0, 12.0, 24.0, 11.0, 14.0, 7.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.749351501464844, -34.60606384277344, -33.46277618408203, -32.31949234008789, -31.176204681396484, -30.032917022705078, -28.889629364013672, -27.746341705322266, -26.603055953979492, -25.459768295288086, -24.316482543945312, -23.173194885253906, -22.0299072265625, -20.886621475219727, -19.74333381652832, -18.600048065185547, -17.45676040649414, -16.313472747802734, -15.170186996459961, -14.026899337768555, -12.883612632751465, -11.740325927734375, -10.597038269042969, -9.453751564025879, -8.310464859008789, -7.167178153991699, -6.023890972137451, -4.880603790283203, -3.7373170852661133, -2.5940303802490234, -1.4507431983947754, -0.30745601654052734, 0.8358345031738281, 1.979121446609497, 3.122408390045166, 4.265695571899414, 5.408982276916504, 6.552268981933594, 7.695556163787842, 8.83884334564209, 9.98213005065918, 11.12541675567627, 12.26870346069336, 13.411991119384766, 14.555277824401855, 15.698564529418945, 16.84185218811035, 17.985137939453125, 19.12842559814453, 20.271713256835938, 21.41499900817871, 22.558286666870117, 23.70157241821289, 24.844860076904297, 25.988147735595703, 27.13143539428711, 28.274721145629883, 29.41800880432129, 30.561294555664062, 31.70458221435547, 32.847869873046875, 33.99115753173828, 35.13444137573242, 36.27772903442383, 37.421016693115234]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 6.0, 7.0, 9.0, 20.0, 35.0, 59.0, 108.0, 181.0, 363.0, 755.0, 1948.0, 6658.0, 32200.0, 517978.0, 3429758.0, 179414.0, 17972.0, 4158.0, 1382.0, 539.0, 252.0, 172.0, 105.0, 58.0, 34.0, 33.0, 23.0, 10.0, 8.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.09765625, -4.8966064453125, -4.695556640625, -4.4945068359375, -4.29345703125, -4.0924072265625, -3.891357421875, -3.6903076171875, -3.4892578125, -3.2882080078125, -3.087158203125, -2.8861083984375, -2.68505859375, -2.4840087890625, -2.282958984375, -2.0819091796875, -1.880859375, -1.6798095703125, -1.478759765625, -1.2777099609375, -1.07666015625, -0.8756103515625, -0.674560546875, -0.4735107421875, -0.2724609375, -0.0714111328125, 0.129638671875, 0.3306884765625, 0.53173828125, 0.7327880859375, 0.933837890625, 1.1348876953125, 1.3359375, 1.5369873046875, 1.738037109375, 1.9390869140625, 2.14013671875, 2.3411865234375, 2.542236328125, 2.7432861328125, 2.9443359375, 3.1453857421875, 3.346435546875, 3.5474853515625, 3.74853515625, 3.9495849609375, 4.150634765625, 4.3516845703125, 4.552734375, 4.7537841796875, 4.954833984375, 5.1558837890625, 5.35693359375, 5.5579833984375, 5.759033203125, 5.9600830078125, 6.1611328125, 6.3621826171875, 6.563232421875, 6.7642822265625, 6.96533203125, 7.1663818359375, 7.367431640625, 7.5684814453125, 7.76953125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 13.0, 6.0, 12.0, 23.0, 32.0, 24.0, 29.0, 32.0, 44.0, 42.0, 47.0, 43.0, 45.0, 58.0, 58.0, 46.0, 60.0, 42.0, 64.0, 52.0, 45.0, 26.0, 32.0, 28.0, 23.0, 16.0, 11.0, 7.0, 8.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205078125, -2.125732421875, -2.04638671875, -1.967041015625, -1.8876953125, -1.808349609375, -1.72900390625, -1.649658203125, -1.5703125, -1.490966796875, -1.41162109375, -1.332275390625, -1.2529296875, -1.173583984375, -1.09423828125, -1.014892578125, -0.935546875, -0.856201171875, -0.77685546875, -0.697509765625, -0.6181640625, -0.538818359375, -0.45947265625, -0.380126953125, -0.30078125, -0.221435546875, -0.14208984375, -0.062744140625, 0.0166015625, 0.095947265625, 0.17529296875, 0.254638671875, 0.333984375, 0.413330078125, 0.49267578125, 0.572021484375, 0.6513671875, 0.730712890625, 0.81005859375, 0.889404296875, 0.96875, 1.048095703125, 1.12744140625, 1.206787109375, 1.2861328125, 1.365478515625, 1.44482421875, 1.524169921875, 1.603515625, 1.682861328125, 1.76220703125, 1.841552734375, 1.9208984375, 2.000244140625, 2.07958984375, 2.158935546875, 2.23828125, 2.317626953125, 2.39697265625, 2.476318359375, 2.5556640625, 2.635009765625, 2.71435546875, 2.793701171875, 2.873046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 14.0, 18.0, 40.0, 73.0, 143.0, 230.0, 475.0, 1186.0, 3343.0, 12148.0, 67914.0, 1902800.0, 2118445.0, 70510.0, 11921.0, 2910.0, 1020.0, 426.0, 244.0, 152.0, 60.0, 55.0, 50.0, 35.0, 28.0, 13.0, 11.0, 7.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.83984375, -5.60638427734375, -5.3729248046875, -5.13946533203125, -4.906005859375, -4.67254638671875, -4.4390869140625, -4.20562744140625, -3.97216796875, -3.73870849609375, -3.5052490234375, -3.27178955078125, -3.038330078125, -2.80487060546875, -2.5714111328125, -2.33795166015625, -2.1044921875, -1.87103271484375, -1.6375732421875, -1.40411376953125, -1.170654296875, -0.93719482421875, -0.7037353515625, -0.47027587890625, -0.23681640625, -0.00335693359375, 0.2301025390625, 0.46356201171875, 0.697021484375, 0.93048095703125, 1.1639404296875, 1.39739990234375, 1.630859375, 1.86431884765625, 2.0977783203125, 2.33123779296875, 2.564697265625, 2.79815673828125, 3.0316162109375, 3.26507568359375, 3.49853515625, 3.73199462890625, 3.9654541015625, 4.19891357421875, 4.432373046875, 4.66583251953125, 4.8992919921875, 5.13275146484375, 5.3662109375, 5.59967041015625, 5.8331298828125, 6.06658935546875, 6.300048828125, 6.53350830078125, 6.7669677734375, 7.00042724609375, 7.23388671875, 7.46734619140625, 7.7008056640625, 7.93426513671875, 8.167724609375, 8.40118408203125, 8.6346435546875, 8.86810302734375, 9.1015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 5.0, 10.0, 29.0, 31.0, 50.0, 103.0, 284.0, 809.0, 1385.0, 816.0, 312.0, 124.0, 57.0, 24.0, 19.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.355712890625, -8.00048828125, -7.645263671875, -7.2900390625, -6.934814453125, -6.57958984375, -6.224365234375, -5.869140625, -5.513916015625, -5.15869140625, -4.803466796875, -4.4482421875, -4.093017578125, -3.73779296875, -3.382568359375, -3.02734375, -2.672119140625, -2.31689453125, -1.961669921875, -1.6064453125, -1.251220703125, -0.89599609375, -0.540771484375, -0.185546875, 0.169677734375, 0.52490234375, 0.880126953125, 1.2353515625, 1.590576171875, 1.94580078125, 2.301025390625, 2.65625, 3.011474609375, 3.36669921875, 3.721923828125, 4.0771484375, 4.432373046875, 4.78759765625, 5.142822265625, 5.498046875, 5.853271484375, 6.20849609375, 6.563720703125, 6.9189453125, 7.274169921875, 7.62939453125, 7.984619140625, 8.33984375, 8.695068359375, 9.05029296875, 9.405517578125, 9.7607421875, 10.115966796875, 10.47119140625, 10.826416015625, 11.181640625, 11.536865234375, 11.89208984375, 12.247314453125, 12.6025390625, 12.957763671875, 13.31298828125, 13.668212890625, 14.0234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 0.0, 4.0, 3.0, 18.0, 49.0, 172.0, 340.0, 273.0, 95.0, 23.0, 12.0, 9.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.05658721923828, -96.5664291381836, -93.07626342773438, -89.58610534667969, -86.095947265625, -82.60578918457031, -79.1156234741211, -75.6254653930664, -72.13529968261719, -68.6451416015625, -65.15497589111328, -61.664817810058594, -58.174659729003906, -54.68449783325195, -51.1943359375, -47.70417785644531, -44.214019775390625, -40.72385787963867, -37.233699798583984, -33.74353790283203, -30.25337791442871, -26.76321792602539, -23.273056030273438, -19.782896041870117, -16.292736053466797, -12.802576065063477, -9.31241512298584, -5.822254180908203, -2.332094192504883, 1.1580657958984375, 4.648227691650391, 8.138387680053711, 11.628547668457031, 15.118707656860352, 18.608867645263672, 22.099029541015625, 25.589189529418945, 29.079349517822266, 32.56951141357422, 36.059669494628906, 39.54983139038086, 43.03999328613281, 46.5301513671875, 50.02031326293945, 53.510475158691406, 57.000633239746094, 60.49079513549805, 63.98095703125, 67.47111511230469, 70.96127319335938, 74.4514389038086, 77.94159698486328, 81.43175506591797, 84.92192077636719, 88.41207885742188, 91.90223693847656, 95.39239501953125, 98.88255310058594, 102.37271881103516, 105.86287689208984, 109.35303497314453, 112.84320068359375, 116.33335876464844, 119.82351684570312, 123.31368255615234]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 7.0, 5.0, 11.0, 8.0, 5.0, 10.0, 19.0, 23.0, 29.0, 34.0, 36.0, 37.0, 47.0, 39.0, 38.0, 63.0, 72.0, 67.0, 56.0, 54.0, 45.0, 45.0, 44.0, 37.0, 34.0, 25.0, 25.0, 25.0, 15.0, 15.0, 8.0, 5.0, 8.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-37.10551834106445, -36.16584014892578, -35.22616195678711, -34.28648376464844, -33.346805572509766, -32.407127380371094, -31.467449188232422, -30.527769088745117, -29.588090896606445, -28.648412704467773, -27.7087345123291, -26.76905632019043, -25.829378128051758, -24.889698028564453, -23.95001983642578, -23.01034164428711, -22.070663452148438, -21.130985260009766, -20.191307067871094, -19.251628875732422, -18.31195068359375, -17.372272491455078, -16.432594299316406, -15.492914199829102, -14.553237915039062, -13.61355972290039, -12.673881530761719, -11.734203338623047, -10.794524192810059, -9.854846000671387, -8.915167808532715, -7.975489139556885, -7.035810470581055, -6.096132278442383, -5.156453609466553, -4.216775417327881, -3.27709698677063, -2.337418556213379, -1.397740364074707, -0.45806169509887695, 0.4816164970397949, 1.421294927597046, 2.360973358154297, 3.3006515502929688, 4.240329742431641, 5.180008411407471, 6.119686603546143, 7.059365272521973, 7.9990434646606445, 8.938721656799316, 9.878399848937988, 10.818078994750977, 11.757757186889648, 12.69743537902832, 13.637113571166992, 14.576791763305664, 15.516469955444336, 16.456148147583008, 17.39582633972168, 18.33550453186035, 19.275182723999023, 20.214862823486328, 21.154541015625, 22.094219207763672, 23.033897399902344]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 8.0, 7.0, 9.0, 21.0, 39.0, 53.0, 82.0, 169.0, 347.0, 782.0, 2059.0, 6844.0, 27571.0, 142552.0, 555866.0, 250684.0, 45916.0, 10536.0, 3003.0, 1032.0, 441.0, 195.0, 145.0, 63.0, 46.0, 38.0, 12.0, 7.0, 8.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.796875, -4.575439453125, -4.35400390625, -4.132568359375, -3.9111328125, -3.689697265625, -3.46826171875, -3.246826171875, -3.025390625, -2.803955078125, -2.58251953125, -2.361083984375, -2.1396484375, -1.918212890625, -1.69677734375, -1.475341796875, -1.25390625, -1.032470703125, -0.81103515625, -0.589599609375, -0.3681640625, -0.146728515625, 0.07470703125, 0.296142578125, 0.517578125, 0.739013671875, 0.96044921875, 1.181884765625, 1.4033203125, 1.624755859375, 1.84619140625, 2.067626953125, 2.2890625, 2.510498046875, 2.73193359375, 2.953369140625, 3.1748046875, 3.396240234375, 3.61767578125, 3.839111328125, 4.060546875, 4.281982421875, 4.50341796875, 4.724853515625, 4.9462890625, 5.167724609375, 5.38916015625, 5.610595703125, 5.83203125, 6.053466796875, 6.27490234375, 6.496337890625, 6.7177734375, 6.939208984375, 7.16064453125, 7.382080078125, 7.603515625, 7.824951171875, 8.04638671875, 8.267822265625, 8.4892578125, 8.710693359375, 8.93212890625, 9.153564453125, 9.375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 4.0, 14.0, 16.0, 12.0, 12.0, 20.0, 33.0, 33.0, 36.0, 37.0, 37.0, 35.0, 59.0, 46.0, 50.0, 55.0, 53.0, 42.0, 49.0, 32.0, 41.0, 32.0, 39.0, 36.0, 25.0, 16.0, 20.0, 16.0, 16.0, 12.0, 5.0, 14.0, 8.0, 7.0, 3.0, 3.0, 10.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.271484375, -2.202056884765625, -2.13262939453125, -2.063201904296875, -1.9937744140625, -1.924346923828125, -1.85491943359375, -1.785491943359375, -1.716064453125, -1.646636962890625, -1.57720947265625, -1.507781982421875, -1.4383544921875, -1.368927001953125, -1.29949951171875, -1.230072021484375, -1.16064453125, -1.091217041015625, -1.02178955078125, -0.952362060546875, -0.8829345703125, -0.813507080078125, -0.74407958984375, -0.674652099609375, -0.605224609375, -0.535797119140625, -0.46636962890625, -0.396942138671875, -0.3275146484375, -0.258087158203125, -0.18865966796875, -0.119232177734375, -0.0498046875, 0.019622802734375, 0.08905029296875, 0.158477783203125, 0.2279052734375, 0.297332763671875, 0.36676025390625, 0.436187744140625, 0.505615234375, 0.575042724609375, 0.64447021484375, 0.713897705078125, 0.7833251953125, 0.852752685546875, 0.92218017578125, 0.991607666015625, 1.06103515625, 1.130462646484375, 1.19989013671875, 1.269317626953125, 1.3387451171875, 1.408172607421875, 1.47760009765625, 1.547027587890625, 1.616455078125, 1.685882568359375, 1.75531005859375, 1.824737548828125, 1.8941650390625, 1.963592529296875, 2.03302001953125, 2.102447509765625, 2.171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 13.0, 8.0, 9.0, 14.0, 32.0, 21.0, 37.0, 47.0, 61.0, 90.0, 167.0, 226.0, 332.0, 553.0, 1089.0, 2370.0, 6775.0, 27911.0, 222321.0, 697805.0, 68699.0, 12490.0, 3846.0, 1558.0, 753.0, 430.0, 268.0, 178.0, 119.0, 104.0, 59.0, 44.0, 33.0, 28.0, 18.0, 15.0, 12.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-9.9140625, -9.6405029296875, -9.366943359375, -9.0933837890625, -8.81982421875, -8.5462646484375, -8.272705078125, -7.9991455078125, -7.7255859375, -7.4520263671875, -7.178466796875, -6.9049072265625, -6.63134765625, -6.3577880859375, -6.084228515625, -5.8106689453125, -5.537109375, -5.2635498046875, -4.989990234375, -4.7164306640625, -4.44287109375, -4.1693115234375, -3.895751953125, -3.6221923828125, -3.3486328125, -3.0750732421875, -2.801513671875, -2.5279541015625, -2.25439453125, -1.9808349609375, -1.707275390625, -1.4337158203125, -1.16015625, -0.8865966796875, -0.613037109375, -0.3394775390625, -0.06591796875, 0.2076416015625, 0.481201171875, 0.7547607421875, 1.0283203125, 1.3018798828125, 1.575439453125, 1.8489990234375, 2.12255859375, 2.3961181640625, 2.669677734375, 2.9432373046875, 3.216796875, 3.4903564453125, 3.763916015625, 4.0374755859375, 4.31103515625, 4.5845947265625, 4.858154296875, 5.1317138671875, 5.4052734375, 5.6788330078125, 5.952392578125, 6.2259521484375, 6.49951171875, 6.7730712890625, 7.046630859375, 7.3201904296875, 7.59375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 2.0, 8.0, 8.0, 10.0, 21.0, 15.0, 20.0, 21.0, 26.0, 35.0, 39.0, 40.0, 53.0, 53.0, 61.0, 67.0, 68.0, 61.0, 54.0, 51.0, 47.0, 40.0, 31.0, 37.0, 24.0, 21.0, 18.0, 16.0, 12.0, 14.0, 7.0, 7.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -11.0770263671875, -10.763427734375, -10.4498291015625, -10.13623046875, -9.8226318359375, -9.509033203125, -9.1954345703125, -8.8818359375, -8.5682373046875, -8.254638671875, -7.9410400390625, -7.62744140625, -7.3138427734375, -7.000244140625, -6.6866455078125, -6.373046875, -6.0594482421875, -5.745849609375, -5.4322509765625, -5.11865234375, -4.8050537109375, -4.491455078125, -4.1778564453125, -3.8642578125, -3.5506591796875, -3.237060546875, -2.9234619140625, -2.60986328125, -2.2962646484375, -1.982666015625, -1.6690673828125, -1.35546875, -1.0418701171875, -0.728271484375, -0.4146728515625, -0.10107421875, 0.2125244140625, 0.526123046875, 0.8397216796875, 1.1533203125, 1.4669189453125, 1.780517578125, 2.0941162109375, 2.40771484375, 2.7213134765625, 3.034912109375, 3.3485107421875, 3.662109375, 3.9757080078125, 4.289306640625, 4.6029052734375, 4.91650390625, 5.2301025390625, 5.543701171875, 5.8572998046875, 6.1708984375, 6.4844970703125, 6.798095703125, 7.1116943359375, 7.42529296875, 7.7388916015625, 8.052490234375, 8.3660888671875, 8.6796875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 10.0, 20.0, 16.0, 38.0, 64.0, 120.0, 211.0, 492.0, 1209.0, 4444.0, 26859.0, 738037.0, 256961.0, 15370.0, 2946.0, 939.0, 388.0, 181.0, 96.0, 51.0, 31.0, 22.0, 17.0, 12.0, 4.0, 3.0, 1.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.56988525390625, -5.3546142578125, -5.13934326171875, -4.924072265625, -4.70880126953125, -4.4935302734375, -4.27825927734375, -4.06298828125, -3.84771728515625, -3.6324462890625, -3.41717529296875, -3.201904296875, -2.98663330078125, -2.7713623046875, -2.55609130859375, -2.3408203125, -2.12554931640625, -1.9102783203125, -1.69500732421875, -1.479736328125, -1.26446533203125, -1.0491943359375, -0.83392333984375, -0.61865234375, -0.40338134765625, -0.1881103515625, 0.02716064453125, 0.242431640625, 0.45770263671875, 0.6729736328125, 0.88824462890625, 1.103515625, 1.31878662109375, 1.5340576171875, 1.74932861328125, 1.964599609375, 2.17987060546875, 2.3951416015625, 2.61041259765625, 2.82568359375, 3.04095458984375, 3.2562255859375, 3.47149658203125, 3.686767578125, 3.90203857421875, 4.1173095703125, 4.33258056640625, 4.5478515625, 4.76312255859375, 4.9783935546875, 5.19366455078125, 5.408935546875, 5.62420654296875, 5.8394775390625, 6.05474853515625, 6.27001953125, 6.48529052734375, 6.7005615234375, 6.91583251953125, 7.131103515625, 7.34637451171875, 7.5616455078125, 7.77691650390625, 7.9921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 12.0, 11.0, 25.0, 35.0, 37.0, 62.0, 110.0, 167.0, 204.0, 106.0, 68.0, 44.0, 30.0, 21.0, 11.0, 15.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012311935424804688, -0.0011837929487228394, -0.00113639235496521, -0.0010889917612075806, -0.0010415911674499512, -0.0009941905736923218, -0.0009467899799346924, -0.000899389386177063, -0.0008519887924194336, -0.0008045881986618042, -0.0007571876049041748, -0.0007097870111465454, -0.000662386417388916, -0.0006149858236312866, -0.0005675852298736572, -0.0005201846361160278, -0.00047278404235839844, -0.00042538344860076904, -0.00037798285484313965, -0.00033058226108551025, -0.00028318166732788086, -0.00023578107357025146, -0.00018838047981262207, -0.00014097988605499268, -9.357929229736328e-05, -4.617869853973389e-05, 1.2218952178955078e-06, 4.86224889755249e-05, 9.60230827331543e-05, 0.0001434236764907837, 0.00019082427024841309, 0.00023822486400604248, 0.0002856254577636719, 0.00033302605152130127, 0.00038042664527893066, 0.00042782723903656006, 0.00047522783279418945, 0.0005226284265518188, 0.0005700290203094482, 0.0006174296140670776, 0.000664830207824707, 0.0007122308015823364, 0.0007596313953399658, 0.0008070319890975952, 0.0008544325828552246, 0.000901833176612854, 0.0009492337703704834, 0.0009966343641281128, 0.0010440349578857422, 0.0010914355516433716, 0.001138836145401001, 0.0011862367391586304, 0.0012336373329162598, 0.0012810379266738892, 0.0013284385204315186, 0.001375839114189148, 0.0014232397079467773, 0.0014706403017044067, 0.0015180408954620361, 0.0015654414892196655, 0.001612842082977295, 0.0016602426767349243, 0.0017076432704925537, 0.001755043864250183, 0.0018024444580078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 18.0, 32.0, 42.0, 82.0, 110.0, 184.0, 359.0, 613.0, 1237.0, 2795.0, 9016.0, 41817.0, 325954.0, 594211.0, 54486.0, 11216.0, 3424.0, 1408.0, 660.0, 334.0, 206.0, 114.0, 75.0, 43.0, 26.0, 18.0, 17.0, 7.0, 3.0, 7.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.376373291015625, -3.24688720703125, -3.117401123046875, -2.9879150390625, -2.858428955078125, -2.72894287109375, -2.599456787109375, -2.469970703125, -2.340484619140625, -2.21099853515625, -2.081512451171875, -1.9520263671875, -1.822540283203125, -1.69305419921875, -1.563568115234375, -1.43408203125, -1.304595947265625, -1.17510986328125, -1.045623779296875, -0.9161376953125, -0.786651611328125, -0.65716552734375, -0.527679443359375, -0.398193359375, -0.268707275390625, -0.13922119140625, -0.009735107421875, 0.1197509765625, 0.249237060546875, 0.37872314453125, 0.508209228515625, 0.6376953125, 0.767181396484375, 0.89666748046875, 1.026153564453125, 1.1556396484375, 1.285125732421875, 1.41461181640625, 1.544097900390625, 1.673583984375, 1.803070068359375, 1.93255615234375, 2.062042236328125, 2.1915283203125, 2.321014404296875, 2.45050048828125, 2.579986572265625, 2.70947265625, 2.838958740234375, 2.96844482421875, 3.097930908203125, 3.2274169921875, 3.356903076171875, 3.48638916015625, 3.615875244140625, 3.745361328125, 3.874847412109375, 4.00433349609375, 4.133819580078125, 4.2633056640625, 4.392791748046875, 4.52227783203125, 4.651763916015625, 4.78125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 14.0, 9.0, 14.0, 20.0, 26.0, 37.0, 48.0, 52.0, 59.0, 69.0, 91.0, 82.0, 83.0, 67.0, 56.0, 56.0, 29.0, 32.0, 21.0, 22.0, 12.0, 13.0, 5.0, 14.0, 5.0, 8.0, 6.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.528839111328125, -2.44244384765625, -2.356048583984375, -2.2696533203125, -2.183258056640625, -2.09686279296875, -2.010467529296875, -1.924072265625, -1.837677001953125, -1.75128173828125, -1.664886474609375, -1.5784912109375, -1.492095947265625, -1.40570068359375, -1.319305419921875, -1.23291015625, -1.146514892578125, -1.06011962890625, -0.973724365234375, -0.8873291015625, -0.800933837890625, -0.71453857421875, -0.628143310546875, -0.541748046875, -0.455352783203125, -0.36895751953125, -0.282562255859375, -0.1961669921875, -0.109771728515625, -0.02337646484375, 0.063018798828125, 0.1494140625, 0.235809326171875, 0.32220458984375, 0.408599853515625, 0.4949951171875, 0.581390380859375, 0.66778564453125, 0.754180908203125, 0.840576171875, 0.926971435546875, 1.01336669921875, 1.099761962890625, 1.1861572265625, 1.272552490234375, 1.35894775390625, 1.445343017578125, 1.53173828125, 1.618133544921875, 1.70452880859375, 1.790924072265625, 1.8773193359375, 1.963714599609375, 2.05010986328125, 2.136505126953125, 2.222900390625, 2.309295654296875, 2.39569091796875, 2.482086181640625, 2.5684814453125, 2.654876708984375, 2.74127197265625, 2.827667236328125, 2.9140625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 7.0, 13.0, 42.0, 59.0, 140.0, 278.0, 235.0, 110.0, 45.0, 27.0, 18.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.07476806640625, -83.46434783935547, -80.85391998291016, -78.24349975585938, -75.6330795288086, -73.02265167236328, -70.4122314453125, -67.80180358886719, -65.1913833618164, -62.58095932006836, -59.97053909301758, -57.36011505126953, -54.749691009521484, -52.13926696777344, -49.528846740722656, -46.91842269897461, -44.30800247192383, -41.69757843017578, -39.087158203125, -36.47673416137695, -33.866310119628906, -31.255887985229492, -28.645465850830078, -26.03504180908203, -23.424619674682617, -20.814197540283203, -18.203773498535156, -15.593351364135742, -12.982928276062012, -10.372505187988281, -7.762083053588867, -5.15165901184082, -2.5412368774414062, 0.06918597221374512, 2.6796088218688965, 5.290031433105469, 7.900454521179199, 10.51087760925293, 13.121299743652344, 15.73172378540039, 18.342145919799805, 20.95256805419922, 23.562992095947266, 26.17341423034668, 28.783836364746094, 31.39426040649414, 34.00468444824219, 36.61510467529297, 39.225528717041016, 41.83595275878906, 44.446372985839844, 47.05679702758789, 49.66722106933594, 52.27764129638672, 54.888065338134766, 57.49848937988281, 60.108909606933594, 62.71933364868164, 65.32975769042969, 67.94017791748047, 70.55059814453125, 73.16102600097656, 75.77144622802734, 78.38186645507812, 80.99229431152344]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 5.0, 4.0, 6.0, 8.0, 4.0, 12.0, 11.0, 16.0, 18.0, 22.0, 32.0, 32.0, 26.0, 33.0, 46.0, 45.0, 59.0, 77.0, 86.0, 61.0, 56.0, 44.0, 40.0, 37.0, 33.0, 29.0, 26.0, 21.0, 26.0, 11.0, 12.0, 10.0, 13.0, 16.0, 7.0, 7.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.19622802734375, -32.07718276977539, -30.958139419555664, -29.839094161987305, -28.720050811767578, -27.60100555419922, -26.48196029663086, -25.3629150390625, -24.243871688842773, -23.124826431274414, -22.005783081054688, -20.886737823486328, -19.76769256591797, -18.648649215698242, -17.529603958129883, -16.410560607910156, -15.291515350341797, -14.172471046447754, -13.053426742553711, -11.934381484985352, -10.815337181091309, -9.696292877197266, -8.577247619628906, -7.458203315734863, -6.33915901184082, -5.220114707946777, -4.101069927215576, -2.982025384902954, -1.862980842590332, -0.7439365386962891, 0.3751082420349121, 1.4941530227661133, 2.6131973266601562, 3.7322418689727783, 4.8512864112854, 5.970331192016602, 7.0893754959106445, 8.208419799804688, 9.327465057373047, 10.44650936126709, 11.565553665161133, 12.684597969055176, 13.803642272949219, 14.922687530517578, 16.041732788085938, 17.160776138305664, 18.279821395874023, 19.39886474609375, 20.51791000366211, 21.63695526123047, 22.755998611450195, 23.875043869018555, 24.99408721923828, 26.11313247680664, 27.232177734375, 28.35122299194336, 29.470266342163086, 30.589311599731445, 31.708354949951172, 32.82740020751953, 33.94644546508789, 35.06549072265625, 36.184532165527344, 37.3035774230957, 38.42262268066406]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 13.0, 9.0, 13.0, 21.0, 32.0, 41.0, 78.0, 137.0, 254.0, 599.0, 1680.0, 8611.0, 307442.0, 3834348.0, 35220.0, 3897.0, 1040.0, 356.0, 196.0, 105.0, 55.0, 46.0, 39.0, 18.0, 18.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.15625, -17.74609375, -17.3359375, -16.92578125, -16.515625, -16.10546875, -15.6953125, -15.28515625, -14.875, -14.46484375, -14.0546875, -13.64453125, -13.234375, -12.82421875, -12.4140625, -12.00390625, -11.59375, -11.18359375, -10.7734375, -10.36328125, -9.953125, -9.54296875, -9.1328125, -8.72265625, -8.3125, -7.90234375, -7.4921875, -7.08203125, -6.671875, -6.26171875, -5.8515625, -5.44140625, -5.03125, -4.62109375, -4.2109375, -3.80078125, -3.390625, -2.98046875, -2.5703125, -2.16015625, -1.75, -1.33984375, -0.9296875, -0.51953125, -0.109375, 0.30078125, 0.7109375, 1.12109375, 1.53125, 1.94140625, 2.3515625, 2.76171875, 3.171875, 3.58203125, 3.9921875, 4.40234375, 4.8125, 5.22265625, 5.6328125, 6.04296875, 6.453125, 6.86328125, 7.2734375, 7.68359375, 8.09375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 6.0, 7.0, 12.0, 14.0, 10.0, 24.0, 25.0, 24.0, 35.0, 49.0, 51.0, 61.0, 54.0, 59.0, 58.0, 59.0, 60.0, 45.0, 72.0, 47.0, 52.0, 32.0, 31.0, 31.0, 20.0, 14.0, 11.0, 8.0, 8.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.171905517578125, -3.08404541015625, -2.996185302734375, -2.9083251953125, -2.820465087890625, -2.73260498046875, -2.644744873046875, -2.556884765625, -2.469024658203125, -2.38116455078125, -2.293304443359375, -2.2054443359375, -2.117584228515625, -2.02972412109375, -1.941864013671875, -1.85400390625, -1.766143798828125, -1.67828369140625, -1.590423583984375, -1.5025634765625, -1.414703369140625, -1.32684326171875, -1.238983154296875, -1.151123046875, -1.063262939453125, -0.97540283203125, -0.887542724609375, -0.7996826171875, -0.711822509765625, -0.62396240234375, -0.536102294921875, -0.4482421875, -0.360382080078125, -0.27252197265625, -0.184661865234375, -0.0968017578125, -0.008941650390625, 0.07891845703125, 0.166778564453125, 0.254638671875, 0.342498779296875, 0.43035888671875, 0.518218994140625, 0.6060791015625, 0.693939208984375, 0.78179931640625, 0.869659423828125, 0.95751953125, 1.045379638671875, 1.13323974609375, 1.221099853515625, 1.3089599609375, 1.396820068359375, 1.48468017578125, 1.572540283203125, 1.660400390625, 1.748260498046875, 1.83612060546875, 1.923980712890625, 2.0118408203125, 2.099700927734375, 2.18756103515625, 2.275421142578125, 2.36328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 8.0, 12.0, 19.0, 19.0, 40.0, 48.0, 66.0, 76.0, 148.0, 252.0, 406.0, 763.0, 1702.0, 4545.0, 15033.0, 96119.0, 3075705.0, 941503.0, 43355.0, 8861.0, 2866.0, 1140.0, 616.0, 367.0, 188.0, 150.0, 84.0, 53.0, 35.0, 24.0, 16.0, 12.0, 11.0, 6.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.53125, -7.29461669921875, -7.0579833984375, -6.82135009765625, -6.584716796875, -6.34808349609375, -6.1114501953125, -5.87481689453125, -5.63818359375, -5.40155029296875, -5.1649169921875, -4.92828369140625, -4.691650390625, -4.45501708984375, -4.2183837890625, -3.98175048828125, -3.7451171875, -3.50848388671875, -3.2718505859375, -3.03521728515625, -2.798583984375, -2.56195068359375, -2.3253173828125, -2.08868408203125, -1.85205078125, -1.61541748046875, -1.3787841796875, -1.14215087890625, -0.905517578125, -0.66888427734375, -0.4322509765625, -0.19561767578125, 0.041015625, 0.27764892578125, 0.5142822265625, 0.75091552734375, 0.987548828125, 1.22418212890625, 1.4608154296875, 1.69744873046875, 1.93408203125, 2.17071533203125, 2.4073486328125, 2.64398193359375, 2.880615234375, 3.11724853515625, 3.3538818359375, 3.59051513671875, 3.8271484375, 4.06378173828125, 4.3004150390625, 4.53704833984375, 4.773681640625, 5.01031494140625, 5.2469482421875, 5.48358154296875, 5.72021484375, 5.95684814453125, 6.1934814453125, 6.43011474609375, 6.666748046875, 6.90338134765625, 7.1400146484375, 7.37664794921875, 7.61328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 2.0, 6.0, 8.0, 7.0, 5.0, 22.0, 24.0, 33.0, 51.0, 64.0, 112.0, 230.0, 415.0, 619.0, 789.0, 679.0, 416.0, 219.0, 151.0, 58.0, 62.0, 22.0, 29.0, 14.0, 9.0, 1.0, 8.0, 4.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4296875, -5.23284912109375, -5.0360107421875, -4.83917236328125, -4.642333984375, -4.44549560546875, -4.2486572265625, -4.05181884765625, -3.85498046875, -3.65814208984375, -3.4613037109375, -3.26446533203125, -3.067626953125, -2.87078857421875, -2.6739501953125, -2.47711181640625, -2.2802734375, -2.08343505859375, -1.8865966796875, -1.68975830078125, -1.492919921875, -1.29608154296875, -1.0992431640625, -0.90240478515625, -0.70556640625, -0.50872802734375, -0.3118896484375, -0.11505126953125, 0.081787109375, 0.27862548828125, 0.4754638671875, 0.67230224609375, 0.869140625, 1.06597900390625, 1.2628173828125, 1.45965576171875, 1.656494140625, 1.85333251953125, 2.0501708984375, 2.24700927734375, 2.44384765625, 2.64068603515625, 2.8375244140625, 3.03436279296875, 3.231201171875, 3.42803955078125, 3.6248779296875, 3.82171630859375, 4.0185546875, 4.21539306640625, 4.4122314453125, 4.60906982421875, 4.805908203125, 5.00274658203125, 5.1995849609375, 5.39642333984375, 5.59326171875, 5.79010009765625, 5.9869384765625, 6.18377685546875, 6.380615234375, 6.57745361328125, 6.7742919921875, 6.97113037109375, 7.16796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 14.0, 31.0, 135.0, 357.0, 307.0, 100.0, 29.0, 14.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.19317626953125, -187.91604614257812, -183.638916015625, -179.36178588867188, -175.08465576171875, -170.80752563476562, -166.5303955078125, -162.25326538085938, -157.97613525390625, -153.69900512695312, -149.421875, -145.14474487304688, -140.86761474609375, -136.59048461914062, -132.3133544921875, -128.03622436523438, -123.75908660888672, -119.4819564819336, -115.20482635498047, -110.92769622802734, -106.65056610107422, -102.3734359741211, -98.09629821777344, -93.81916809082031, -89.54203796386719, -85.26490783691406, -80.98777770996094, -76.71064758300781, -72.43351745605469, -68.15638732910156, -63.87925338745117, -59.60212326049805, -55.32500457763672, -51.047874450683594, -46.77074432373047, -42.493614196777344, -38.21648406982422, -33.939353942871094, -29.662220001220703, -25.385089874267578, -21.107959747314453, -16.830829620361328, -12.553698539733887, -8.276567459106445, -3.9994373321533203, 0.2776927947998047, 4.5548248291015625, 8.831954956054688, 13.109085083007812, 17.386215209960938, 21.663345336914062, 25.94047737121582, 30.217607498168945, 34.49473571777344, 38.77186965942383, 43.04899978637695, 47.32612991333008, 51.6032600402832, 55.88039016723633, 60.15752410888672, 64.43465423583984, 68.71178436279297, 72.9889144897461, 77.26604461669922, 81.54317474365234]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 10.0, 5.0, 6.0, 9.0, 12.0, 12.0, 22.0, 28.0, 32.0, 29.0, 42.0, 39.0, 40.0, 50.0, 45.0, 48.0, 39.0, 51.0, 52.0, 57.0, 54.0, 47.0, 46.0, 40.0, 32.0, 35.0, 29.0, 21.0, 16.0, 11.0, 12.0, 9.0, 4.0, 8.0, 4.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.124876022338867, -27.280773162841797, -26.436670303344727, -25.592567443847656, -24.748462677001953, -23.904361724853516, -23.060256958007812, -22.216154098510742, -21.372051239013672, -20.5279483795166, -19.68384552001953, -18.83974266052246, -17.99563980102539, -17.151535034179688, -16.307432174682617, -15.463329315185547, -14.619226455688477, -13.775123596191406, -12.931020736694336, -12.08691692352295, -11.242814064025879, -10.398711204528809, -9.554607391357422, -8.710504531860352, -7.866401672363281, -7.022298812866211, -6.178195476531982, -5.334092140197754, -4.489989280700684, -3.6458864212036133, -2.8017830848693848, -1.9576797485351562, -1.1135749816894531, -0.2694718837738037, 0.5746312141418457, 1.4187343120574951, 2.2628374099731445, 3.106940269470215, 3.9510436058044434, 4.795146942138672, 5.639249801635742, 6.4833526611328125, 7.327455997467041, 8.17155933380127, 9.01566219329834, 9.85976505279541, 10.703868865966797, 11.547971725463867, 12.392074584960938, 13.236177444458008, 14.080280303955078, 14.924384117126465, 15.768486976623535, 16.612590789794922, 17.456693649291992, 18.300796508789062, 19.144899368286133, 19.989002227783203, 20.833105087280273, 21.677207946777344, 22.521312713623047, 23.365413665771484, 24.209518432617188, 25.053621292114258, 25.897724151611328]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 12.0, 12.0, 23.0, 27.0, 41.0, 68.0, 129.0, 268.0, 718.0, 2153.0, 9606.0, 60556.0, 486136.0, 426526.0, 50682.0, 8390.0, 1995.0, 624.0, 253.0, 142.0, 68.0, 51.0, 16.0, 15.0, 7.0, 7.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.072509765625, -6.83642578125, -6.600341796875, -6.3642578125, -6.128173828125, -5.89208984375, -5.656005859375, -5.419921875, -5.183837890625, -4.94775390625, -4.711669921875, -4.4755859375, -4.239501953125, -4.00341796875, -3.767333984375, -3.53125, -3.295166015625, -3.05908203125, -2.822998046875, -2.5869140625, -2.350830078125, -2.11474609375, -1.878662109375, -1.642578125, -1.406494140625, -1.17041015625, -0.934326171875, -0.6982421875, -0.462158203125, -0.22607421875, 0.010009765625, 0.24609375, 0.482177734375, 0.71826171875, 0.954345703125, 1.1904296875, 1.426513671875, 1.66259765625, 1.898681640625, 2.134765625, 2.370849609375, 2.60693359375, 2.843017578125, 3.0791015625, 3.315185546875, 3.55126953125, 3.787353515625, 4.0234375, 4.259521484375, 4.49560546875, 4.731689453125, 4.9677734375, 5.203857421875, 5.43994140625, 5.676025390625, 5.912109375, 6.148193359375, 6.38427734375, 6.620361328125, 6.8564453125, 7.092529296875, 7.32861328125, 7.564697265625, 7.80078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 13.0, 2.0, 10.0, 17.0, 19.0, 19.0, 22.0, 22.0, 35.0, 24.0, 40.0, 42.0, 46.0, 60.0, 50.0, 58.0, 55.0, 48.0, 48.0, 47.0, 68.0, 43.0, 34.0, 32.0, 24.0, 13.0, 29.0, 20.0, 18.0, 14.0, 11.0, 4.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.1640625, -3.081024169921875, -2.99798583984375, -2.914947509765625, -2.8319091796875, -2.748870849609375, -2.66583251953125, -2.582794189453125, -2.499755859375, -2.416717529296875, -2.33367919921875, -2.250640869140625, -2.1676025390625, -2.084564208984375, -2.00152587890625, -1.918487548828125, -1.83544921875, -1.752410888671875, -1.66937255859375, -1.586334228515625, -1.5032958984375, -1.420257568359375, -1.33721923828125, -1.254180908203125, -1.171142578125, -1.088104248046875, -1.00506591796875, -0.922027587890625, -0.8389892578125, -0.755950927734375, -0.67291259765625, -0.589874267578125, -0.5068359375, -0.423797607421875, -0.34075927734375, -0.257720947265625, -0.1746826171875, -0.091644287109375, -0.00860595703125, 0.074432373046875, 0.157470703125, 0.240509033203125, 0.32354736328125, 0.406585693359375, 0.4896240234375, 0.572662353515625, 0.65570068359375, 0.738739013671875, 0.82177734375, 0.904815673828125, 0.98785400390625, 1.070892333984375, 1.1539306640625, 1.236968994140625, 1.32000732421875, 1.403045654296875, 1.486083984375, 1.569122314453125, 1.65216064453125, 1.735198974609375, 1.8182373046875, 1.901275634765625, 1.98431396484375, 2.067352294921875, 2.150390625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 15.0, 13.0, 13.0, 25.0, 30.0, 34.0, 41.0, 67.0, 89.0, 155.0, 256.0, 486.0, 1098.0, 3115.0, 12514.0, 71911.0, 602690.0, 299884.0, 43391.0, 8411.0, 2335.0, 883.0, 425.0, 226.0, 137.0, 87.0, 61.0, 41.0, 28.0, 27.0, 10.0, 10.0, 10.0, 7.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.3060302734375, -6.108154296875, -5.9102783203125, -5.71240234375, -5.5145263671875, -5.316650390625, -5.1187744140625, -4.9208984375, -4.7230224609375, -4.525146484375, -4.3272705078125, -4.12939453125, -3.9315185546875, -3.733642578125, -3.5357666015625, -3.337890625, -3.1400146484375, -2.942138671875, -2.7442626953125, -2.54638671875, -2.3485107421875, -2.150634765625, -1.9527587890625, -1.7548828125, -1.5570068359375, -1.359130859375, -1.1612548828125, -0.96337890625, -0.7655029296875, -0.567626953125, -0.3697509765625, -0.171875, 0.0260009765625, 0.223876953125, 0.4217529296875, 0.61962890625, 0.8175048828125, 1.015380859375, 1.2132568359375, 1.4111328125, 1.6090087890625, 1.806884765625, 2.0047607421875, 2.20263671875, 2.4005126953125, 2.598388671875, 2.7962646484375, 2.994140625, 3.1920166015625, 3.389892578125, 3.5877685546875, 3.78564453125, 3.9835205078125, 4.181396484375, 4.3792724609375, 4.5771484375, 4.7750244140625, 4.972900390625, 5.1707763671875, 5.36865234375, 5.5665283203125, 5.764404296875, 5.9622802734375, 6.16015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 7.0, 8.0, 14.0, 19.0, 14.0, 19.0, 25.0, 16.0, 30.0, 35.0, 28.0, 28.0, 34.0, 35.0, 49.0, 44.0, 49.0, 34.0, 38.0, 59.0, 37.0, 33.0, 37.0, 35.0, 38.0, 40.0, 27.0, 26.0, 17.0, 23.0, 22.0, 19.0, 13.0, 9.0, 9.0, 2.0, 7.0, 3.0, 5.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.4921875, -7.25677490234375, -7.0213623046875, -6.78594970703125, -6.550537109375, -6.31512451171875, -6.0797119140625, -5.84429931640625, -5.60888671875, -5.37347412109375, -5.1380615234375, -4.90264892578125, -4.667236328125, -4.43182373046875, -4.1964111328125, -3.96099853515625, -3.7255859375, -3.49017333984375, -3.2547607421875, -3.01934814453125, -2.783935546875, -2.54852294921875, -2.3131103515625, -2.07769775390625, -1.84228515625, -1.60687255859375, -1.3714599609375, -1.13604736328125, -0.900634765625, -0.66522216796875, -0.4298095703125, -0.19439697265625, 0.041015625, 0.27642822265625, 0.5118408203125, 0.74725341796875, 0.982666015625, 1.21807861328125, 1.4534912109375, 1.68890380859375, 1.92431640625, 2.15972900390625, 2.3951416015625, 2.63055419921875, 2.865966796875, 3.10137939453125, 3.3367919921875, 3.57220458984375, 3.8076171875, 4.04302978515625, 4.2784423828125, 4.51385498046875, 4.749267578125, 4.98468017578125, 5.2200927734375, 5.45550537109375, 5.69091796875, 5.92633056640625, 6.1617431640625, 6.39715576171875, 6.632568359375, 6.86798095703125, 7.1033935546875, 7.33880615234375, 7.57421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 7.0, 9.0, 20.0, 23.0, 53.0, 82.0, 171.0, 319.0, 706.0, 1827.0, 5366.0, 19093.0, 89686.0, 619776.0, 249536.0, 45327.0, 10919.0, 3391.0, 1193.0, 551.0, 216.0, 103.0, 65.0, 44.0, 20.0, 11.0, 8.0, 13.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.29840087890625, -2.2237548828125, -2.14910888671875, -2.074462890625, -1.99981689453125, -1.9251708984375, -1.85052490234375, -1.77587890625, -1.70123291015625, -1.6265869140625, -1.55194091796875, -1.477294921875, -1.40264892578125, -1.3280029296875, -1.25335693359375, -1.1787109375, -1.10406494140625, -1.0294189453125, -0.95477294921875, -0.880126953125, -0.80548095703125, -0.7308349609375, -0.65618896484375, -0.58154296875, -0.50689697265625, -0.4322509765625, -0.35760498046875, -0.282958984375, -0.20831298828125, -0.1336669921875, -0.05902099609375, 0.015625, 0.09027099609375, 0.1649169921875, 0.23956298828125, 0.314208984375, 0.38885498046875, 0.4635009765625, 0.53814697265625, 0.61279296875, 0.68743896484375, 0.7620849609375, 0.83673095703125, 0.911376953125, 0.98602294921875, 1.0606689453125, 1.13531494140625, 1.2099609375, 1.28460693359375, 1.3592529296875, 1.43389892578125, 1.508544921875, 1.58319091796875, 1.6578369140625, 1.73248291015625, 1.80712890625, 1.88177490234375, 1.9564208984375, 2.03106689453125, 2.105712890625, 2.18035888671875, 2.2550048828125, 2.32965087890625, 2.404296875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 4.0, 10.0, 13.0, 13.0, 18.0, 29.0, 24.0, 46.0, 52.0, 55.0, 65.0, 88.0, 83.0, 90.0, 81.0, 65.0, 45.0, 53.0, 36.0, 19.0, 20.0, 15.0, 15.0, 9.0, 8.0, 9.0, 1.0, 3.0, 6.0, 3.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005435943603515625, -0.0005275383591651917, -0.0005114823579788208, -0.00049542635679245, -0.0004793703556060791, -0.00046331435441970825, -0.0004472583532333374, -0.00043120235204696655, -0.0004151463508605957, -0.00039909034967422485, -0.000383034348487854, -0.00036697834730148315, -0.0003509223461151123, -0.00033486634492874146, -0.0003188103437423706, -0.00030275434255599976, -0.0002866983413696289, -0.00027064234018325806, -0.0002545863389968872, -0.00023853033781051636, -0.0002224743366241455, -0.00020641833543777466, -0.0001903623342514038, -0.00017430633306503296, -0.0001582503318786621, -0.00014219433069229126, -0.0001261383295059204, -0.00011008232831954956, -9.402632713317871e-05, -7.797032594680786e-05, -6.191432476043701e-05, -4.585832357406616e-05, -2.9802322387695312e-05, -1.3746321201324463e-05, 2.3096799850463867e-06, 1.8365681171417236e-05, 3.4421682357788086e-05, 5.0477683544158936e-05, 6.653368473052979e-05, 8.258968591690063e-05, 9.864568710327148e-05, 0.00011470168828964233, 0.00013075768947601318, 0.00014681369066238403, 0.00016286969184875488, 0.00017892569303512573, 0.00019498169422149658, 0.00021103769540786743, 0.00022709369659423828, 0.00024314969778060913, 0.00025920569896698, 0.00027526170015335083, 0.0002913177013397217, 0.00030737370252609253, 0.0003234297037124634, 0.00033948570489883423, 0.0003555417060852051, 0.00037159770727157593, 0.0003876537084579468, 0.0004037097096443176, 0.0004197657108306885, 0.0004358217120170593, 0.0004518777132034302, 0.000467933714389801, 0.0004839897155761719]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 8.0, 10.0, 7.0, 17.0, 34.0, 44.0, 69.0, 131.0, 191.0, 380.0, 587.0, 1219.0, 2671.0, 6585.0, 18267.0, 57445.0, 202061.0, 550417.0, 143703.0, 41720.0, 13444.0, 5115.0, 2155.0, 1079.0, 460.0, 288.0, 141.0, 103.0, 71.0, 42.0, 20.0, 19.0, 13.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.98046875, -1.9228363037109375, -1.865203857421875, -1.8075714111328125, -1.74993896484375, -1.6923065185546875, -1.634674072265625, -1.5770416259765625, -1.5194091796875, -1.4617767333984375, -1.404144287109375, -1.3465118408203125, -1.28887939453125, -1.2312469482421875, -1.173614501953125, -1.1159820556640625, -1.058349609375, -1.0007171630859375, -0.943084716796875, -0.8854522705078125, -0.82781982421875, -0.7701873779296875, -0.712554931640625, -0.6549224853515625, -0.5972900390625, -0.5396575927734375, -0.482025146484375, -0.4243927001953125, -0.36676025390625, -0.3091278076171875, -0.251495361328125, -0.1938629150390625, -0.13623046875, -0.0785980224609375, -0.020965576171875, 0.0366668701171875, 0.09429931640625, 0.1519317626953125, 0.209564208984375, 0.2671966552734375, 0.3248291015625, 0.3824615478515625, 0.440093994140625, 0.4977264404296875, 0.55535888671875, 0.6129913330078125, 0.670623779296875, 0.7282562255859375, 0.785888671875, 0.8435211181640625, 0.901153564453125, 0.9587860107421875, 1.01641845703125, 1.0740509033203125, 1.131683349609375, 1.1893157958984375, 1.2469482421875, 1.3045806884765625, 1.362213134765625, 1.4198455810546875, 1.47747802734375, 1.5351104736328125, 1.592742919921875, 1.6503753662109375, 1.7080078125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 4.0, 3.0, 9.0, 16.0, 18.0, 33.0, 31.0, 26.0, 49.0, 57.0, 64.0, 72.0, 83.0, 68.0, 81.0, 69.0, 83.0, 64.0, 44.0, 25.0, 20.0, 22.0, 11.0, 11.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.466796875, -1.39849853515625, -1.3302001953125, -1.26190185546875, -1.193603515625, -1.12530517578125, -1.0570068359375, -0.98870849609375, -0.92041015625, -0.85211181640625, -0.7838134765625, -0.71551513671875, -0.647216796875, -0.57891845703125, -0.5106201171875, -0.44232177734375, -0.3740234375, -0.30572509765625, -0.2374267578125, -0.16912841796875, -0.100830078125, -0.03253173828125, 0.0357666015625, 0.10406494140625, 0.17236328125, 0.24066162109375, 0.3089599609375, 0.37725830078125, 0.445556640625, 0.51385498046875, 0.5821533203125, 0.65045166015625, 0.71875, 0.78704833984375, 0.8553466796875, 0.92364501953125, 0.991943359375, 1.06024169921875, 1.1285400390625, 1.19683837890625, 1.26513671875, 1.33343505859375, 1.4017333984375, 1.47003173828125, 1.538330078125, 1.60662841796875, 1.6749267578125, 1.74322509765625, 1.8115234375, 1.87982177734375, 1.9481201171875, 2.01641845703125, 2.084716796875, 2.15301513671875, 2.2213134765625, 2.28961181640625, 2.35791015625, 2.42620849609375, 2.4945068359375, 2.56280517578125, 2.631103515625, 2.69940185546875, 2.7677001953125, 2.83599853515625, 2.904296875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 39.0, 99.0, 319.0, 317.0, 134.0, 37.0, 19.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.30042266845703, -83.5133285522461, -80.72622680664062, -77.93913269042969, -75.15203094482422, -72.36493682861328, -69.57783508300781, -66.79074096679688, -64.00364685058594, -61.216548919677734, -58.42945098876953, -55.642356872558594, -52.855255126953125, -50.06816101074219, -47.281063079833984, -44.49396514892578, -41.70686340332031, -38.91976547241211, -36.132667541503906, -33.34557342529297, -30.558473587036133, -27.77137565612793, -24.98427963256836, -22.197181701660156, -19.410083770751953, -16.62298583984375, -13.835888862609863, -11.048791885375977, -8.261693954467773, -5.47459602355957, -2.6875, 0.09959793090820312, 2.8866958618164062, 5.673793315887451, 8.460890769958496, 11.247987747192383, 14.035085678100586, 16.82218360900879, 19.60927963256836, 22.396377563476562, 25.183475494384766, 27.97057342529297, 30.757671356201172, 33.544769287109375, 36.33186340332031, 39.11896514892578, 41.90605926513672, 44.69315719604492, 47.480255126953125, 50.26735305786133, 53.05445098876953, 55.84154510498047, 58.62864685058594, 61.415740966796875, 64.20283508300781, 66.98993682861328, 69.77703857421875, 72.56413269042969, 75.35123443603516, 78.1383285522461, 80.92543029785156, 83.7125244140625, 86.49961853027344, 89.2867202758789, 92.07381439208984]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 7.0, 9.0, 15.0, 13.0, 17.0, 20.0, 24.0, 20.0, 33.0, 42.0, 37.0, 46.0, 48.0, 67.0, 113.0, 76.0, 50.0, 48.0, 46.0, 37.0, 33.0, 36.0, 30.0, 12.0, 18.0, 15.0, 10.0, 13.0, 9.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.994064331054688, -27.902921676635742, -26.811779022216797, -25.72063636779785, -24.629493713378906, -23.538352966308594, -22.44721031188965, -21.356067657470703, -20.264925003051758, -19.173782348632812, -18.082639694213867, -16.991497039794922, -15.900355339050293, -14.809212684631348, -13.718070983886719, -12.626928329467773, -11.535785675048828, -10.444643020629883, -9.353500366210938, -8.262358665466309, -7.171216011047363, -6.080073356628418, -4.988931179046631, -3.8977890014648438, -2.8066463470458984, -1.7155039310455322, -0.624361515045166, 0.4667809009552002, 1.5579233169555664, 2.6490659713745117, 3.740208148956299, 4.831350326538086, 5.922492980957031, 7.013635635375977, 8.104778289794922, 9.19591999053955, 10.287062644958496, 11.378205299377441, 12.46934700012207, 13.560489654541016, 14.651632308959961, 15.742774963378906, 16.83391761779785, 17.925060272216797, 19.01620101928711, 20.107345581054688, 21.198486328125, 22.289628982543945, 23.38077163696289, 24.471914291381836, 25.56305694580078, 26.654199600219727, 27.745342254638672, 28.836483001708984, 29.92762565612793, 31.018768310546875, 32.10990905761719, 33.2010498046875, 34.29219436645508, 35.38333511352539, 36.47447967529297, 37.56562042236328, 38.65676498413086, 39.74790573120117, 40.83905029296875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 17.0, 12.0, 21.0, 45.0, 55.0, 66.0, 108.0, 162.0, 240.0, 333.0, 597.0, 977.0, 1822.0, 3570.0, 8715.0, 28005.0, 166226.0, 1491310.0, 2159570.0, 270677.0, 40279.0, 11343.0, 4765.0, 2251.0, 1158.0, 672.0, 426.0, 283.0, 185.0, 109.0, 82.0, 49.0, 39.0, 34.0, 20.0, 16.0, 15.0, 0.0, 3.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.556640625, -3.44232177734375, -3.3280029296875, -3.21368408203125, -3.099365234375, -2.98504638671875, -2.8707275390625, -2.75640869140625, -2.64208984375, -2.52777099609375, -2.4134521484375, -2.29913330078125, -2.184814453125, -2.07049560546875, -1.9561767578125, -1.84185791015625, -1.7275390625, -1.61322021484375, -1.4989013671875, -1.38458251953125, -1.270263671875, -1.15594482421875, -1.0416259765625, -0.92730712890625, -0.81298828125, -0.69866943359375, -0.5843505859375, -0.47003173828125, -0.355712890625, -0.24139404296875, -0.1270751953125, -0.01275634765625, 0.1015625, 0.21588134765625, 0.3302001953125, 0.44451904296875, 0.558837890625, 0.67315673828125, 0.7874755859375, 0.90179443359375, 1.01611328125, 1.13043212890625, 1.2447509765625, 1.35906982421875, 1.473388671875, 1.58770751953125, 1.7020263671875, 1.81634521484375, 1.9306640625, 2.04498291015625, 2.1593017578125, 2.27362060546875, 2.387939453125, 2.50225830078125, 2.6165771484375, 2.73089599609375, 2.84521484375, 2.95953369140625, 3.0738525390625, 3.18817138671875, 3.302490234375, 3.41680908203125, 3.5311279296875, 3.64544677734375, 3.759765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 15.0, 11.0, 13.0, 10.0, 27.0, 31.0, 29.0, 32.0, 52.0, 50.0, 48.0, 58.0, 60.0, 60.0, 56.0, 51.0, 49.0, 56.0, 37.0, 42.0, 34.0, 25.0, 27.0, 18.0, 24.0, 17.0, 14.0, 7.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.966796875, -2.884918212890625, -2.80303955078125, -2.721160888671875, -2.6392822265625, -2.557403564453125, -2.47552490234375, -2.393646240234375, -2.311767578125, -2.229888916015625, -2.14801025390625, -2.066131591796875, -1.9842529296875, -1.902374267578125, -1.82049560546875, -1.738616943359375, -1.65673828125, -1.574859619140625, -1.49298095703125, -1.411102294921875, -1.3292236328125, -1.247344970703125, -1.16546630859375, -1.083587646484375, -1.001708984375, -0.919830322265625, -0.83795166015625, -0.756072998046875, -0.6741943359375, -0.592315673828125, -0.51043701171875, -0.428558349609375, -0.3466796875, -0.264801025390625, -0.18292236328125, -0.101043701171875, -0.0191650390625, 0.062713623046875, 0.14459228515625, 0.226470947265625, 0.308349609375, 0.390228271484375, 0.47210693359375, 0.553985595703125, 0.6358642578125, 0.717742919921875, 0.79962158203125, 0.881500244140625, 0.96337890625, 1.045257568359375, 1.12713623046875, 1.209014892578125, 1.2908935546875, 1.372772216796875, 1.45465087890625, 1.536529541015625, 1.618408203125, 1.700286865234375, 1.78216552734375, 1.864044189453125, 1.9459228515625, 2.027801513671875, 2.10968017578125, 2.191558837890625, 2.2734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 10.0, 13.0, 19.0, 43.0, 71.0, 131.0, 324.0, 1018.0, 7686.0, 2091435.0, 2083892.0, 7984.0, 1068.0, 314.0, 133.0, 67.0, 45.0, 12.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4296875, -11.9324951171875, -11.435302734375, -10.9381103515625, -10.44091796875, -9.9437255859375, -9.446533203125, -8.9493408203125, -8.4521484375, -7.9549560546875, -7.457763671875, -6.9605712890625, -6.46337890625, -5.9661865234375, -5.468994140625, -4.9718017578125, -4.474609375, -3.9774169921875, -3.480224609375, -2.9830322265625, -2.48583984375, -1.9886474609375, -1.491455078125, -0.9942626953125, -0.4970703125, 0.0001220703125, 0.497314453125, 0.9945068359375, 1.49169921875, 1.9888916015625, 2.486083984375, 2.9832763671875, 3.48046875, 3.9776611328125, 4.474853515625, 4.9720458984375, 5.46923828125, 5.9664306640625, 6.463623046875, 6.9608154296875, 7.4580078125, 7.9552001953125, 8.452392578125, 8.9495849609375, 9.44677734375, 9.9439697265625, 10.441162109375, 10.9383544921875, 11.435546875, 11.9327392578125, 12.429931640625, 12.9271240234375, 13.42431640625, 13.9215087890625, 14.418701171875, 14.9158935546875, 15.4130859375, 15.9102783203125, 16.407470703125, 16.9046630859375, 17.40185546875, 17.8990478515625, 18.396240234375, 18.8934326171875, 19.390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 10.0, 20.0, 13.0, 29.0, 55.0, 69.0, 151.0, 268.0, 484.0, 669.0, 823.0, 604.0, 380.0, 186.0, 97.0, 82.0, 40.0, 23.0, 12.0, 8.0, 12.0, 11.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.67718505859375, -5.4832763671875, -5.28936767578125, -5.095458984375, -4.90155029296875, -4.7076416015625, -4.51373291015625, -4.31982421875, -4.12591552734375, -3.9320068359375, -3.73809814453125, -3.544189453125, -3.35028076171875, -3.1563720703125, -2.96246337890625, -2.7685546875, -2.57464599609375, -2.3807373046875, -2.18682861328125, -1.992919921875, -1.79901123046875, -1.6051025390625, -1.41119384765625, -1.21728515625, -1.02337646484375, -0.8294677734375, -0.63555908203125, -0.441650390625, -0.24774169921875, -0.0538330078125, 0.14007568359375, 0.333984375, 0.52789306640625, 0.7218017578125, 0.91571044921875, 1.109619140625, 1.30352783203125, 1.4974365234375, 1.69134521484375, 1.88525390625, 2.07916259765625, 2.2730712890625, 2.46697998046875, 2.660888671875, 2.85479736328125, 3.0487060546875, 3.24261474609375, 3.4365234375, 3.63043212890625, 3.8243408203125, 4.01824951171875, 4.212158203125, 4.40606689453125, 4.5999755859375, 4.79388427734375, 4.98779296875, 5.18170166015625, 5.3756103515625, 5.56951904296875, 5.763427734375, 5.95733642578125, 6.1512451171875, 6.34515380859375, 6.5390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 7.0, 11.0, 22.0, 26.0, 53.0, 100.0, 140.0, 171.0, 175.0, 107.0, 85.0, 51.0, 16.0, 11.0, 9.0, 6.0, 10.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.392005920410156, -28.772388458251953, -27.15277099609375, -25.533153533935547, -23.913536071777344, -22.29391860961914, -20.674299240112305, -19.0546817779541, -17.4350643157959, -15.815446853637695, -14.195829391479492, -12.576210975646973, -10.95659351348877, -9.336976051330566, -7.717357635498047, -6.097740173339844, -4.478122711181641, -2.8585050106048584, -1.2388873100280762, 0.38073062896728516, 2.0003480911254883, 3.6199655532836914, 5.239583969116211, 6.859201431274414, 8.478818893432617, 10.09843635559082, 11.718053817749023, 13.337672233581543, 14.957289695739746, 16.576908111572266, 18.19652557373047, 19.816143035888672, 21.435760498046875, 23.055377960205078, 24.67499542236328, 26.294612884521484, 27.914230346679688, 29.53384780883789, 31.153467178344727, 32.77308654785156, 34.3927001953125, 36.0123176574707, 37.631935119628906, 39.25155258178711, 40.87117004394531, 42.490787506103516, 44.11040496826172, 45.73002624511719, 47.34964370727539, 48.969261169433594, 50.5888786315918, 52.20849609375, 53.8281135559082, 55.447731018066406, 57.067352294921875, 58.68696594238281, 60.30658721923828, 61.926204681396484, 63.54582214355469, 65.16544342041016, 66.7850570678711, 68.40467834472656, 70.0242919921875, 71.64391326904297, 73.2635269165039]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 5.0, 10.0, 6.0, 10.0, 15.0, 15.0, 21.0, 24.0, 22.0, 33.0, 27.0, 36.0, 46.0, 33.0, 44.0, 49.0, 47.0, 51.0, 45.0, 47.0, 37.0, 41.0, 42.0, 37.0, 34.0, 32.0, 27.0, 24.0, 30.0, 9.0, 15.0, 19.0, 15.0, 7.0, 10.0, 8.0, 6.0, 2.0, 4.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.091201782226562, -21.4658203125, -20.840438842773438, -20.215059280395508, -19.589677810668945, -18.964296340942383, -18.338916778564453, -17.71353530883789, -17.088153839111328, -16.462772369384766, -15.83739185333252, -15.212011337280273, -14.586629867553711, -13.961248397827148, -13.335867881774902, -12.710487365722656, -12.085105895996094, -11.459724426269531, -10.834343910217285, -10.208963394165039, -9.583581924438477, -8.958200454711914, -8.332819938659668, -7.707438945770264, -7.082057952880859, -6.456676959991455, -5.831295967102051, -5.2059149742126465, -4.580533981323242, -3.955152988433838, -3.3297719955444336, -2.7043910026550293, -2.079008102416992, -1.453627109527588, -0.8282461166381836, -0.2028651237487793, 0.422515869140625, 1.0478968620300293, 1.6732778549194336, 2.298658847808838, 2.924039840698242, 3.5494208335876465, 4.174801826477051, 4.800182819366455, 5.425563812255859, 6.050944805145264, 6.676325798034668, 7.301706790924072, 7.927087783813477, 8.552469253540039, 9.177849769592285, 9.803230285644531, 10.428611755371094, 11.053993225097656, 11.679373741149902, 12.304754257202148, 12.930135726928711, 13.555517196655273, 14.18089771270752, 14.806278228759766, 15.431659698486328, 16.05704116821289, 16.682422637939453, 17.307802200317383, 17.933183670043945]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 30.0, 41.0, 92.0, 178.0, 362.0, 871.0, 2448.0, 7980.0, 32309.0, 189860.0, 623787.0, 152634.0, 27191.0, 6907.0, 2227.0, 833.0, 358.0, 190.0, 82.0, 48.0, 32.0, 19.0, 13.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.26141357421875, -5.0697021484375, -4.87799072265625, -4.686279296875, -4.49456787109375, -4.3028564453125, -4.11114501953125, -3.91943359375, -3.72772216796875, -3.5360107421875, -3.34429931640625, -3.152587890625, -2.96087646484375, -2.7691650390625, -2.57745361328125, -2.3857421875, -2.19403076171875, -2.0023193359375, -1.81060791015625, -1.618896484375, -1.42718505859375, -1.2354736328125, -1.04376220703125, -0.85205078125, -0.66033935546875, -0.4686279296875, -0.27691650390625, -0.085205078125, 0.10650634765625, 0.2982177734375, 0.48992919921875, 0.681640625, 0.87335205078125, 1.0650634765625, 1.25677490234375, 1.448486328125, 1.64019775390625, 1.8319091796875, 2.02362060546875, 2.21533203125, 2.40704345703125, 2.5987548828125, 2.79046630859375, 2.982177734375, 3.17388916015625, 3.3656005859375, 3.55731201171875, 3.7490234375, 3.94073486328125, 4.1324462890625, 4.32415771484375, 4.515869140625, 4.70758056640625, 4.8992919921875, 5.09100341796875, 5.28271484375, 5.47442626953125, 5.6661376953125, 5.85784912109375, 6.049560546875, 6.24127197265625, 6.4329833984375, 6.62469482421875, 6.81640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 7.0, 5.0, 12.0, 12.0, 13.0, 12.0, 11.0, 25.0, 24.0, 26.0, 19.0, 41.0, 43.0, 44.0, 46.0, 41.0, 42.0, 37.0, 47.0, 53.0, 40.0, 45.0, 33.0, 49.0, 36.0, 34.0, 36.0, 24.0, 22.0, 19.0, 20.0, 18.0, 10.0, 11.0, 8.0, 9.0, 9.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-2.65625, -2.5814208984375, -2.506591796875, -2.4317626953125, -2.35693359375, -2.2821044921875, -2.207275390625, -2.1324462890625, -2.0576171875, -1.9827880859375, -1.907958984375, -1.8331298828125, -1.75830078125, -1.6834716796875, -1.608642578125, -1.5338134765625, -1.458984375, -1.3841552734375, -1.309326171875, -1.2344970703125, -1.15966796875, -1.0848388671875, -1.010009765625, -0.9351806640625, -0.8603515625, -0.7855224609375, -0.710693359375, -0.6358642578125, -0.56103515625, -0.4862060546875, -0.411376953125, -0.3365478515625, -0.26171875, -0.1868896484375, -0.112060546875, -0.0372314453125, 0.03759765625, 0.1124267578125, 0.187255859375, 0.2620849609375, 0.3369140625, 0.4117431640625, 0.486572265625, 0.5614013671875, 0.63623046875, 0.7110595703125, 0.785888671875, 0.8607177734375, 0.935546875, 1.0103759765625, 1.085205078125, 1.1600341796875, 1.23486328125, 1.3096923828125, 1.384521484375, 1.4593505859375, 1.5341796875, 1.6090087890625, 1.683837890625, 1.7586669921875, 1.83349609375, 1.9083251953125, 1.983154296875, 2.0579833984375, 2.1328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 10.0, 14.0, 13.0, 24.0, 33.0, 38.0, 51.0, 98.0, 141.0, 193.0, 280.0, 435.0, 713.0, 1659.0, 4217.0, 14405.0, 76542.0, 697056.0, 209861.0, 30226.0, 7355.0, 2487.0, 1099.0, 549.0, 326.0, 208.0, 133.0, 106.0, 67.0, 43.0, 44.0, 29.0, 27.0, 15.0, 9.0, 9.0, 5.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.390625, -6.1954345703125, -6.000244140625, -5.8050537109375, -5.60986328125, -5.4146728515625, -5.219482421875, -5.0242919921875, -4.8291015625, -4.6339111328125, -4.438720703125, -4.2435302734375, -4.04833984375, -3.8531494140625, -3.657958984375, -3.4627685546875, -3.267578125, -3.0723876953125, -2.877197265625, -2.6820068359375, -2.48681640625, -2.2916259765625, -2.096435546875, -1.9012451171875, -1.7060546875, -1.5108642578125, -1.315673828125, -1.1204833984375, -0.92529296875, -0.7301025390625, -0.534912109375, -0.3397216796875, -0.14453125, 0.0506591796875, 0.245849609375, 0.4410400390625, 0.63623046875, 0.8314208984375, 1.026611328125, 1.2218017578125, 1.4169921875, 1.6121826171875, 1.807373046875, 2.0025634765625, 2.19775390625, 2.3929443359375, 2.588134765625, 2.7833251953125, 2.978515625, 3.1737060546875, 3.368896484375, 3.5640869140625, 3.75927734375, 3.9544677734375, 4.149658203125, 4.3448486328125, 4.5400390625, 4.7352294921875, 4.930419921875, 5.1256103515625, 5.32080078125, 5.5159912109375, 5.711181640625, 5.9063720703125, 6.1015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 11.0, 9.0, 9.0, 17.0, 23.0, 26.0, 16.0, 31.0, 37.0, 35.0, 48.0, 42.0, 51.0, 62.0, 53.0, 40.0, 49.0, 46.0, 41.0, 49.0, 48.0, 37.0, 32.0, 20.0, 21.0, 25.0, 14.0, 15.0, 17.0, 8.0, 8.0, 11.0, 3.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-9.7421875, -9.4744873046875, -9.206787109375, -8.9390869140625, -8.67138671875, -8.4036865234375, -8.135986328125, -7.8682861328125, -7.6005859375, -7.3328857421875, -7.065185546875, -6.7974853515625, -6.52978515625, -6.2620849609375, -5.994384765625, -5.7266845703125, -5.458984375, -5.1912841796875, -4.923583984375, -4.6558837890625, -4.38818359375, -4.1204833984375, -3.852783203125, -3.5850830078125, -3.3173828125, -3.0496826171875, -2.781982421875, -2.5142822265625, -2.24658203125, -1.9788818359375, -1.711181640625, -1.4434814453125, -1.17578125, -0.9080810546875, -0.640380859375, -0.3726806640625, -0.10498046875, 0.1627197265625, 0.430419921875, 0.6981201171875, 0.9658203125, 1.2335205078125, 1.501220703125, 1.7689208984375, 2.03662109375, 2.3043212890625, 2.572021484375, 2.8397216796875, 3.107421875, 3.3751220703125, 3.642822265625, 3.9105224609375, 4.17822265625, 4.4459228515625, 4.713623046875, 4.9813232421875, 5.2490234375, 5.5167236328125, 5.784423828125, 6.0521240234375, 6.31982421875, 6.5875244140625, 6.855224609375, 7.1229248046875, 7.390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 8.0, 11.0, 10.0, 14.0, 15.0, 30.0, 44.0, 58.0, 113.0, 185.0, 337.0, 706.0, 1625.0, 4068.0, 11560.0, 40578.0, 227265.0, 667478.0, 67443.0, 17093.0, 5717.0, 2261.0, 935.0, 432.0, 221.0, 123.0, 66.0, 51.0, 37.0, 17.0, 17.0, 9.0, 5.0, 1.0, 9.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.636138916015625, -2.55157470703125, -2.467010498046875, -2.3824462890625, -2.297882080078125, -2.21331787109375, -2.128753662109375, -2.044189453125, -1.959625244140625, -1.87506103515625, -1.790496826171875, -1.7059326171875, -1.621368408203125, -1.53680419921875, -1.452239990234375, -1.36767578125, -1.283111572265625, -1.19854736328125, -1.113983154296875, -1.0294189453125, -0.944854736328125, -0.86029052734375, -0.775726318359375, -0.691162109375, -0.606597900390625, -0.52203369140625, -0.437469482421875, -0.3529052734375, -0.268341064453125, -0.18377685546875, -0.099212646484375, -0.0146484375, 0.069915771484375, 0.15447998046875, 0.239044189453125, 0.3236083984375, 0.408172607421875, 0.49273681640625, 0.577301025390625, 0.661865234375, 0.746429443359375, 0.83099365234375, 0.915557861328125, 1.0001220703125, 1.084686279296875, 1.16925048828125, 1.253814697265625, 1.33837890625, 1.422943115234375, 1.50750732421875, 1.592071533203125, 1.6766357421875, 1.761199951171875, 1.84576416015625, 1.930328369140625, 2.014892578125, 2.099456787109375, 2.18402099609375, 2.268585205078125, 2.3531494140625, 2.437713623046875, 2.52227783203125, 2.606842041015625, 2.69140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 12.0, 14.0, 27.0, 26.0, 45.0, 59.0, 83.0, 107.0, 157.0, 117.0, 87.0, 66.0, 41.0, 36.0, 21.0, 18.0, 12.0, 9.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006699562072753906, -0.0006465092301368713, -0.000623062252998352, -0.0005996152758598328, -0.0005761682987213135, -0.0005527213215827942, -0.0005292743444442749, -0.0005058273673057556, -0.00048238039016723633, -0.00045893341302871704, -0.00043548643589019775, -0.00041203945875167847, -0.0003885924816131592, -0.0003651455044746399, -0.0003416985273361206, -0.0003182515501976013, -0.00029480457305908203, -0.00027135759592056274, -0.00024791061878204346, -0.00022446364164352417, -0.00020101666450500488, -0.0001775696873664856, -0.0001541227102279663, -0.00013067573308944702, -0.00010722875595092773, -8.378177881240845e-05, -6.033480167388916e-05, -3.688782453536987e-05, -1.3440847396850586e-05, 1.0006129741668701e-05, 3.345310688018799e-05, 5.6900084018707275e-05, 8.034706115722656e-05, 0.00010379403829574585, 0.00012724101543426514, 0.00015068799257278442, 0.0001741349697113037, 0.000197581946849823, 0.00022102892398834229, 0.00024447590112686157, 0.00026792287826538086, 0.00029136985540390015, 0.00031481683254241943, 0.0003382638096809387, 0.000361710786819458, 0.0003851577639579773, 0.0004086047410964966, 0.00043205171823501587, 0.00045549869537353516, 0.00047894567251205444, 0.0005023926496505737, 0.000525839626789093, 0.0005492866039276123, 0.0005727335810661316, 0.0005961805582046509, 0.0006196275353431702, 0.0006430745124816895, 0.0006665214896202087, 0.000689968466758728, 0.0007134154438972473, 0.0007368624210357666, 0.0007603093981742859, 0.0007837563753128052, 0.0008072033524513245, 0.0008306503295898438]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 7.0, 9.0, 21.0, 16.0, 33.0, 55.0, 86.0, 141.0, 245.0, 425.0, 777.0, 1742.0, 4324.0, 12758.0, 51346.0, 591119.0, 321395.0, 45016.0, 11615.0, 4049.0, 1624.0, 787.0, 402.0, 212.0, 127.0, 77.0, 47.0, 24.0, 20.0, 14.0, 15.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.291015625, -3.196868896484375, -3.10272216796875, -3.008575439453125, -2.9144287109375, -2.820281982421875, -2.72613525390625, -2.631988525390625, -2.537841796875, -2.443695068359375, -2.34954833984375, -2.255401611328125, -2.1612548828125, -2.067108154296875, -1.97296142578125, -1.878814697265625, -1.78466796875, -1.690521240234375, -1.59637451171875, -1.502227783203125, -1.4080810546875, -1.313934326171875, -1.21978759765625, -1.125640869140625, -1.031494140625, -0.937347412109375, -0.84320068359375, -0.749053955078125, -0.6549072265625, -0.560760498046875, -0.46661376953125, -0.372467041015625, -0.2783203125, -0.184173583984375, -0.09002685546875, 0.004119873046875, 0.0982666015625, 0.192413330078125, 0.28656005859375, 0.380706787109375, 0.474853515625, 0.569000244140625, 0.66314697265625, 0.757293701171875, 0.8514404296875, 0.945587158203125, 1.03973388671875, 1.133880615234375, 1.22802734375, 1.322174072265625, 1.41632080078125, 1.510467529296875, 1.6046142578125, 1.698760986328125, 1.79290771484375, 1.887054443359375, 1.981201171875, 2.075347900390625, 2.16949462890625, 2.263641357421875, 2.3577880859375, 2.451934814453125, 2.54608154296875, 2.640228271484375, 2.734375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 18.0, 12.0, 13.0, 22.0, 17.0, 38.0, 46.0, 59.0, 93.0, 101.0, 117.0, 80.0, 71.0, 71.0, 44.0, 40.0, 29.0, 20.0, 12.0, 16.0, 10.0, 13.0, 6.0, 5.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.576171875, -2.50152587890625, -2.4268798828125, -2.35223388671875, -2.277587890625, -2.20294189453125, -2.1282958984375, -2.05364990234375, -1.97900390625, -1.90435791015625, -1.8297119140625, -1.75506591796875, -1.680419921875, -1.60577392578125, -1.5311279296875, -1.45648193359375, -1.3818359375, -1.30718994140625, -1.2325439453125, -1.15789794921875, -1.083251953125, -1.00860595703125, -0.9339599609375, -0.85931396484375, -0.78466796875, -0.71002197265625, -0.6353759765625, -0.56072998046875, -0.486083984375, -0.41143798828125, -0.3367919921875, -0.26214599609375, -0.1875, -0.11285400390625, -0.0382080078125, 0.03643798828125, 0.111083984375, 0.18572998046875, 0.2603759765625, 0.33502197265625, 0.40966796875, 0.48431396484375, 0.5589599609375, 0.63360595703125, 0.708251953125, 0.78289794921875, 0.8575439453125, 0.93218994140625, 1.0068359375, 1.08148193359375, 1.1561279296875, 1.23077392578125, 1.305419921875, 1.38006591796875, 1.4547119140625, 1.52935791015625, 1.60400390625, 1.67864990234375, 1.7532958984375, 1.82794189453125, 1.902587890625, 1.97723388671875, 2.0518798828125, 2.12652587890625, 2.201171875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 13.0, 12.0, 30.0, 56.0, 98.0, 251.0, 302.0, 128.0, 53.0, 23.0, 9.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.20618438720703, -60.06856155395508, -57.930938720703125, -55.79331588745117, -53.65569305419922, -51.518070220947266, -49.38044738769531, -47.242820739746094, -45.105201721191406, -42.96757888793945, -40.8299560546875, -38.69233322143555, -36.554710388183594, -34.41708755493164, -32.27946472167969, -30.1418399810791, -28.004215240478516, -25.866592407226562, -23.72896957397461, -21.591346740722656, -19.453723907470703, -17.31610107421875, -15.178476333618164, -13.040853500366211, -10.903230667114258, -8.765607833862305, -6.627984523773193, -4.490361213684082, -2.352738380432129, -0.21511554718017578, 1.9225082397460938, 4.060131072998047, 6.19775390625, 8.335376739501953, 10.472999572753906, 12.610623359680176, 14.748246192932129, 16.885868072509766, 19.02349281311035, 21.161115646362305, 23.298738479614258, 25.43636131286621, 27.573984146118164, 29.71160888671875, 31.849231719970703, 33.986854553222656, 36.12447738647461, 38.26210021972656, 40.399723052978516, 42.53734588623047, 44.67496871948242, 46.812591552734375, 48.95021438598633, 51.08783721923828, 53.2254638671875, 55.36308288574219, 57.500709533691406, 59.63833236694336, 61.77595520019531, 63.913578033447266, 66.05120086669922, 68.18882751464844, 70.32644653320312, 72.46407318115234, 74.60169219970703]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 3.0, 14.0, 10.0, 13.0, 17.0, 16.0, 22.0, 16.0, 21.0, 21.0, 30.0, 25.0, 32.0, 39.0, 34.0, 67.0, 89.0, 92.0, 61.0, 39.0, 41.0, 36.0, 22.0, 32.0, 22.0, 25.0, 26.0, 24.0, 18.0, 10.0, 14.0, 8.0, 4.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0], "bins": [-32.371185302734375, -31.395626068115234, -30.420066833496094, -29.444507598876953, -28.468948364257812, -27.493389129638672, -26.51782989501953, -25.54227066040039, -24.56671142578125, -23.59115219116211, -22.61559295654297, -21.640033721923828, -20.664474487304688, -19.688915252685547, -18.713356018066406, -17.737796783447266, -16.762237548828125, -15.786678314208984, -14.811119079589844, -13.835559844970703, -12.860000610351562, -11.884441375732422, -10.908882141113281, -9.93332290649414, -8.957763671875, -7.982204437255859, -7.006645202636719, -6.031085968017578, -5.0555267333984375, -4.079967498779297, -3.1044082641601562, -2.1288490295410156, -1.153289794921875, -0.17773056030273438, 0.7978286743164062, 1.7733879089355469, 2.7489471435546875, 3.724506378173828, 4.700065612792969, 5.675624847412109, 6.65118408203125, 7.626743316650391, 8.602302551269531, 9.577861785888672, 10.553421020507812, 11.528980255126953, 12.504539489746094, 13.480098724365234, 14.455657958984375, 15.431217193603516, 16.406776428222656, 17.382335662841797, 18.357894897460938, 19.333454132080078, 20.30901336669922, 21.28457260131836, 22.2601318359375, 23.23569107055664, 24.21125030517578, 25.186809539794922, 26.162368774414062, 27.137928009033203, 28.113487243652344, 29.089046478271484, 30.064605712890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 22.0, 13.0, 19.0, 44.0, 42.0, 69.0, 100.0, 132.0, 208.0, 323.0, 501.0, 836.0, 1558.0, 3293.0, 8176.0, 26517.0, 160971.0, 1465604.0, 2192267.0, 276147.0, 38440.0, 10315.0, 3989.0, 1886.0, 1027.0, 568.0, 386.0, 227.0, 139.0, 117.0, 84.0, 67.0, 45.0, 39.0, 25.0, 22.0, 14.0, 7.0, 7.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.0609130859375, -3.930419921875, -3.7999267578125, -3.66943359375, -3.5389404296875, -3.408447265625, -3.2779541015625, -3.1474609375, -3.0169677734375, -2.886474609375, -2.7559814453125, -2.62548828125, -2.4949951171875, -2.364501953125, -2.2340087890625, -2.103515625, -1.9730224609375, -1.842529296875, -1.7120361328125, -1.58154296875, -1.4510498046875, -1.320556640625, -1.1900634765625, -1.0595703125, -0.9290771484375, -0.798583984375, -0.6680908203125, -0.53759765625, -0.4071044921875, -0.276611328125, -0.1461181640625, -0.015625, 0.1148681640625, 0.245361328125, 0.3758544921875, 0.50634765625, 0.6368408203125, 0.767333984375, 0.8978271484375, 1.0283203125, 1.1588134765625, 1.289306640625, 1.4197998046875, 1.55029296875, 1.6807861328125, 1.811279296875, 1.9417724609375, 2.072265625, 2.2027587890625, 2.333251953125, 2.4637451171875, 2.59423828125, 2.7247314453125, 2.855224609375, 2.9857177734375, 3.1162109375, 3.2467041015625, 3.377197265625, 3.5076904296875, 3.63818359375, 3.7686767578125, 3.899169921875, 4.0296630859375, 4.16015625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 11.0, 9.0, 16.0, 23.0, 21.0, 32.0, 36.0, 45.0, 44.0, 48.0, 51.0, 53.0, 67.0, 48.0, 46.0, 44.0, 38.0, 63.0, 42.0, 43.0, 30.0, 22.0, 33.0, 27.0, 24.0, 10.0, 16.0, 11.0, 12.0, 2.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.791015625, -2.706878662109375, -2.62274169921875, -2.538604736328125, -2.4544677734375, -2.370330810546875, -2.28619384765625, -2.202056884765625, -2.117919921875, -2.033782958984375, -1.94964599609375, -1.865509033203125, -1.7813720703125, -1.697235107421875, -1.61309814453125, -1.528961181640625, -1.44482421875, -1.360687255859375, -1.27655029296875, -1.192413330078125, -1.1082763671875, -1.024139404296875, -0.94000244140625, -0.855865478515625, -0.771728515625, -0.687591552734375, -0.60345458984375, -0.519317626953125, -0.4351806640625, -0.351043701171875, -0.26690673828125, -0.182769775390625, -0.0986328125, -0.014495849609375, 0.06964111328125, 0.153778076171875, 0.2379150390625, 0.322052001953125, 0.40618896484375, 0.490325927734375, 0.574462890625, 0.658599853515625, 0.74273681640625, 0.826873779296875, 0.9110107421875, 0.995147705078125, 1.07928466796875, 1.163421630859375, 1.24755859375, 1.331695556640625, 1.41583251953125, 1.499969482421875, 1.5841064453125, 1.668243408203125, 1.75238037109375, 1.836517333984375, 1.920654296875, 2.004791259765625, 2.08892822265625, 2.173065185546875, 2.2572021484375, 2.341339111328125, 2.42547607421875, 2.509613037109375, 2.59375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 13.0, 19.0, 33.0, 80.0, 102.0, 273.0, 739.0, 4391.0, 833510.0, 3346764.0, 6930.0, 834.0, 290.0, 136.0, 91.0, 32.0, 20.0, 16.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -10.971435546875, -10.36474609375, -9.758056640625, -9.1513671875, -8.544677734375, -7.93798828125, -7.331298828125, -6.724609375, -6.117919921875, -5.51123046875, -4.904541015625, -4.2978515625, -3.691162109375, -3.08447265625, -2.477783203125, -1.87109375, -1.264404296875, -0.65771484375, -0.051025390625, 0.5556640625, 1.162353515625, 1.76904296875, 2.375732421875, 2.982421875, 3.589111328125, 4.19580078125, 4.802490234375, 5.4091796875, 6.015869140625, 6.62255859375, 7.229248046875, 7.8359375, 8.442626953125, 9.04931640625, 9.656005859375, 10.2626953125, 10.869384765625, 11.47607421875, 12.082763671875, 12.689453125, 13.296142578125, 13.90283203125, 14.509521484375, 15.1162109375, 15.722900390625, 16.32958984375, 16.936279296875, 17.54296875, 18.149658203125, 18.75634765625, 19.363037109375, 19.9697265625, 20.576416015625, 21.18310546875, 21.789794921875, 22.396484375, 23.003173828125, 23.60986328125, 24.216552734375, 24.8232421875, 25.429931640625, 26.03662109375, 26.643310546875, 27.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 8.0, 16.0, 17.0, 35.0, 40.0, 83.0, 138.0, 208.0, 371.0, 604.0, 773.0, 723.0, 435.0, 230.0, 139.0, 87.0, 51.0, 35.0, 22.0, 15.0, 13.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.640625, -8.42236328125, -8.2041015625, -7.98583984375, -7.767578125, -7.54931640625, -7.3310546875, -7.11279296875, -6.89453125, -6.67626953125, -6.4580078125, -6.23974609375, -6.021484375, -5.80322265625, -5.5849609375, -5.36669921875, -5.1484375, -4.93017578125, -4.7119140625, -4.49365234375, -4.275390625, -4.05712890625, -3.8388671875, -3.62060546875, -3.40234375, -3.18408203125, -2.9658203125, -2.74755859375, -2.529296875, -2.31103515625, -2.0927734375, -1.87451171875, -1.65625, -1.43798828125, -1.2197265625, -1.00146484375, -0.783203125, -0.56494140625, -0.3466796875, -0.12841796875, 0.08984375, 0.30810546875, 0.5263671875, 0.74462890625, 0.962890625, 1.18115234375, 1.3994140625, 1.61767578125, 1.8359375, 2.05419921875, 2.2724609375, 2.49072265625, 2.708984375, 2.92724609375, 3.1455078125, 3.36376953125, 3.58203125, 3.80029296875, 4.0185546875, 4.23681640625, 4.455078125, 4.67333984375, 4.8916015625, 5.10986328125, 5.328125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 20.0, 15.0, 25.0, 44.0, 70.0, 117.0, 137.0, 146.0, 131.0, 98.0, 73.0, 40.0, 24.0, 15.0, 5.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.90744400024414, -55.34212875366211, -53.77681350708008, -52.21149444580078, -50.64617919921875, -49.08086395263672, -47.51554870605469, -45.950233459472656, -44.384918212890625, -42.819602966308594, -41.25428771972656, -39.68897247314453, -38.123653411865234, -36.5583381652832, -34.99302291870117, -33.42770767211914, -31.862388610839844, -30.297073364257812, -28.73175621032715, -27.166440963745117, -25.601123809814453, -24.035808563232422, -22.47049331665039, -20.90517807006836, -19.339860916137695, -17.774545669555664, -16.209228515625, -14.643913269042969, -13.078597068786621, -11.513280868530273, -9.947965621948242, -8.382649421691895, -6.8173370361328125, -5.252020835876465, -3.6867051124572754, -2.121389389038086, -0.5560731887817383, 1.0092430114746094, 2.5745582580566406, 4.139874458312988, 5.705190658569336, 7.270506858825684, 8.835823059082031, 10.401138305664062, 11.96645450592041, 13.531770706176758, 15.097085952758789, 16.662403106689453, 18.227718353271484, 19.793033599853516, 21.35835075378418, 22.92366600036621, 24.488983154296875, 26.054298400878906, 27.619613647460938, 29.18492889404297, 30.750246047973633, 32.3155632019043, 33.88087844848633, 35.44619369506836, 37.01150894165039, 38.57682800292969, 40.14214324951172, 41.70745849609375, 43.27277374267578]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 11.0, 6.0, 7.0, 8.0, 11.0, 13.0, 10.0, 20.0, 23.0, 16.0, 19.0, 33.0, 36.0, 32.0, 37.0, 40.0, 38.0, 56.0, 58.0, 57.0, 54.0, 45.0, 31.0, 39.0, 41.0, 28.0, 27.0, 28.0, 23.0, 20.0, 28.0, 21.0, 14.0, 12.0, 7.0, 10.0, 11.0, 8.0, 8.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.80084800720215, -22.054649353027344, -21.30845069885254, -20.562252044677734, -19.816055297851562, -19.069856643676758, -18.323657989501953, -17.57745933532715, -16.831260681152344, -16.08506202697754, -15.33886432647705, -14.592665672302246, -13.846467971801758, -13.100269317626953, -12.354070663452148, -11.607872009277344, -10.861675262451172, -10.115476608276367, -9.369278907775879, -8.623080253601074, -7.876882076263428, -7.130683898925781, -6.384485244750977, -5.63828706741333, -4.892088890075684, -4.145890712738037, -3.3996922969818115, -2.653493881225586, -1.9072957038879395, -1.161097526550293, -0.4148988723754883, 0.3312993049621582, 1.0774955749511719, 1.823693871498108, 2.569892168045044, 3.3160905838012695, 4.062288761138916, 4.8084869384765625, 5.554685592651367, 6.300883769989014, 7.04708194732666, 7.793280124664307, 8.539478302001953, 9.285676956176758, 10.031875610351562, 10.77807331085205, 11.524271965026855, 12.270469665527344, 13.016668319702148, 13.762866973876953, 14.509064674377441, 15.255263328552246, 16.001461029052734, 16.74765968322754, 17.493858337402344, 18.24005699157715, 18.986255645751953, 19.732454299926758, 20.478652954101562, 21.224849700927734, 21.97104835510254, 22.717247009277344, 23.46344566345215, 24.209644317626953, 24.955841064453125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 14.0, 18.0, 25.0, 40.0, 98.0, 172.0, 427.0, 879.0, 2023.0, 5179.0, 14270.0, 45586.0, 191520.0, 542507.0, 179920.0, 43569.0, 13847.0, 4887.0, 1935.0, 841.0, 385.0, 188.0, 86.0, 61.0, 21.0, 15.0, 11.0, 9.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.984375, -5.82470703125, -5.6650390625, -5.50537109375, -5.345703125, -5.18603515625, -5.0263671875, -4.86669921875, -4.70703125, -4.54736328125, -4.3876953125, -4.22802734375, -4.068359375, -3.90869140625, -3.7490234375, -3.58935546875, -3.4296875, -3.27001953125, -3.1103515625, -2.95068359375, -2.791015625, -2.63134765625, -2.4716796875, -2.31201171875, -2.15234375, -1.99267578125, -1.8330078125, -1.67333984375, -1.513671875, -1.35400390625, -1.1943359375, -1.03466796875, -0.875, -0.71533203125, -0.5556640625, -0.39599609375, -0.236328125, -0.07666015625, 0.0830078125, 0.24267578125, 0.40234375, 0.56201171875, 0.7216796875, 0.88134765625, 1.041015625, 1.20068359375, 1.3603515625, 1.52001953125, 1.6796875, 1.83935546875, 1.9990234375, 2.15869140625, 2.318359375, 2.47802734375, 2.6376953125, 2.79736328125, 2.95703125, 3.11669921875, 3.2763671875, 3.43603515625, 3.595703125, 3.75537109375, 3.9150390625, 4.07470703125, 4.234375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 8.0, 17.0, 12.0, 18.0, 21.0, 17.0, 28.0, 30.0, 55.0, 41.0, 57.0, 41.0, 45.0, 57.0, 44.0, 47.0, 30.0, 38.0, 41.0, 37.0, 48.0, 34.0, 25.0, 28.0, 26.0, 19.0, 17.0, 20.0, 14.0, 10.0, 11.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.82421875, -2.74139404296875, -2.6585693359375, -2.57574462890625, -2.492919921875, -2.41009521484375, -2.3272705078125, -2.24444580078125, -2.16162109375, -2.07879638671875, -1.9959716796875, -1.91314697265625, -1.830322265625, -1.74749755859375, -1.6646728515625, -1.58184814453125, -1.4990234375, -1.41619873046875, -1.3333740234375, -1.25054931640625, -1.167724609375, -1.08489990234375, -1.0020751953125, -0.91925048828125, -0.83642578125, -0.75360107421875, -0.6707763671875, -0.58795166015625, -0.505126953125, -0.42230224609375, -0.3394775390625, -0.25665283203125, -0.173828125, -0.09100341796875, -0.0081787109375, 0.07464599609375, 0.157470703125, 0.24029541015625, 0.3231201171875, 0.40594482421875, 0.48876953125, 0.57159423828125, 0.6544189453125, 0.73724365234375, 0.820068359375, 0.90289306640625, 0.9857177734375, 1.06854248046875, 1.1513671875, 1.23419189453125, 1.3170166015625, 1.39984130859375, 1.482666015625, 1.56549072265625, 1.6483154296875, 1.73114013671875, 1.81396484375, 1.89678955078125, 1.9796142578125, 2.06243896484375, 2.145263671875, 2.22808837890625, 2.3109130859375, 2.39373779296875, 2.4765625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 6.0, 6.0, 7.0, 15.0, 12.0, 25.0, 17.0, 36.0, 63.0, 77.0, 130.0, 172.0, 262.0, 493.0, 1005.0, 2533.0, 11717.0, 142580.0, 841189.0, 39413.0, 5507.0, 1612.0, 666.0, 354.0, 224.0, 150.0, 82.0, 56.0, 47.0, 31.0, 19.0, 20.0, 9.0, 5.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -6.976806640625, -6.64892578125, -6.321044921875, -5.9931640625, -5.665283203125, -5.33740234375, -5.009521484375, -4.681640625, -4.353759765625, -4.02587890625, -3.697998046875, -3.3701171875, -3.042236328125, -2.71435546875, -2.386474609375, -2.05859375, -1.730712890625, -1.40283203125, -1.074951171875, -0.7470703125, -0.419189453125, -0.09130859375, 0.236572265625, 0.564453125, 0.892333984375, 1.22021484375, 1.548095703125, 1.8759765625, 2.203857421875, 2.53173828125, 2.859619140625, 3.1875, 3.515380859375, 3.84326171875, 4.171142578125, 4.4990234375, 4.826904296875, 5.15478515625, 5.482666015625, 5.810546875, 6.138427734375, 6.46630859375, 6.794189453125, 7.1220703125, 7.449951171875, 7.77783203125, 8.105712890625, 8.43359375, 8.761474609375, 9.08935546875, 9.417236328125, 9.7451171875, 10.072998046875, 10.40087890625, 10.728759765625, 11.056640625, 11.384521484375, 11.71240234375, 12.040283203125, 12.3681640625, 12.696044921875, 13.02392578125, 13.351806640625, 13.6796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 2.0, 9.0, 9.0, 8.0, 11.0, 22.0, 32.0, 24.0, 31.0, 27.0, 60.0, 57.0, 63.0, 51.0, 64.0, 66.0, 64.0, 53.0, 46.0, 40.0, 38.0, 37.0, 38.0, 37.0, 14.0, 12.0, 15.0, 14.0, 16.0, 10.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.875, -10.493896484375, -10.11279296875, -9.731689453125, -9.3505859375, -8.969482421875, -8.58837890625, -8.207275390625, -7.826171875, -7.445068359375, -7.06396484375, -6.682861328125, -6.3017578125, -5.920654296875, -5.53955078125, -5.158447265625, -4.77734375, -4.396240234375, -4.01513671875, -3.634033203125, -3.2529296875, -2.871826171875, -2.49072265625, -2.109619140625, -1.728515625, -1.347412109375, -0.96630859375, -0.585205078125, -0.2041015625, 0.177001953125, 0.55810546875, 0.939208984375, 1.3203125, 1.701416015625, 2.08251953125, 2.463623046875, 2.8447265625, 3.225830078125, 3.60693359375, 3.988037109375, 4.369140625, 4.750244140625, 5.13134765625, 5.512451171875, 5.8935546875, 6.274658203125, 6.65576171875, 7.036865234375, 7.41796875, 7.799072265625, 8.18017578125, 8.561279296875, 8.9423828125, 9.323486328125, 9.70458984375, 10.085693359375, 10.466796875, 10.847900390625, 11.22900390625, 11.610107421875, 11.9912109375, 12.372314453125, 12.75341796875, 13.134521484375, 13.515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 8.0, 17.0, 12.0, 13.0, 28.0, 44.0, 79.0, 141.0, 250.0, 560.0, 1470.0, 5305.0, 27883.0, 680295.0, 301480.0, 23785.0, 4808.0, 1308.0, 501.0, 251.0, 126.0, 65.0, 43.0, 21.0, 11.0, 17.0, 13.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.98077392578125, -3.8521728515625, -3.72357177734375, -3.594970703125, -3.46636962890625, -3.3377685546875, -3.20916748046875, -3.08056640625, -2.95196533203125, -2.8233642578125, -2.69476318359375, -2.566162109375, -2.43756103515625, -2.3089599609375, -2.18035888671875, -2.0517578125, -1.92315673828125, -1.7945556640625, -1.66595458984375, -1.537353515625, -1.40875244140625, -1.2801513671875, -1.15155029296875, -1.02294921875, -0.89434814453125, -0.7657470703125, -0.63714599609375, -0.508544921875, -0.37994384765625, -0.2513427734375, -0.12274169921875, 0.005859375, 0.13446044921875, 0.2630615234375, 0.39166259765625, 0.520263671875, 0.64886474609375, 0.7774658203125, 0.90606689453125, 1.03466796875, 1.16326904296875, 1.2918701171875, 1.42047119140625, 1.549072265625, 1.67767333984375, 1.8062744140625, 1.93487548828125, 2.0634765625, 2.19207763671875, 2.3206787109375, 2.44927978515625, 2.577880859375, 2.70648193359375, 2.8350830078125, 2.96368408203125, 3.09228515625, 3.22088623046875, 3.3494873046875, 3.47808837890625, 3.606689453125, 3.73529052734375, 3.8638916015625, 3.99249267578125, 4.12109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 7.0, 9.0, 15.0, 27.0, 35.0, 89.0, 208.0, 269.0, 142.0, 60.0, 27.0, 32.0, 16.0, 14.0, 9.0, 12.0, 3.0, 1.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010128021240234375, -0.0009672492742538452, -0.0009216964244842529, -0.0008761435747146606, -0.0008305907249450684, -0.0007850378751754761, -0.0007394850254058838, -0.0006939321756362915, -0.0006483793258666992, -0.0006028264760971069, -0.0005572736263275146, -0.0005117207765579224, -0.0004661679267883301, -0.0004206150770187378, -0.0003750622272491455, -0.0003295093774795532, -0.00028395652770996094, -0.00023840367794036865, -0.00019285082817077637, -0.00014729797840118408, -0.0001017451286315918, -5.619227886199951e-05, -1.0639429092407227e-05, 3.491342067718506e-05, 8.046627044677734e-05, 0.00012601912021636963, 0.00017157196998596191, 0.0002171248197555542, 0.0002626776695251465, 0.00030823051929473877, 0.00035378336906433105, 0.00039933621883392334, 0.0004448890686035156, 0.0004904419183731079, 0.0005359947681427002, 0.0005815476179122925, 0.0006271004676818848, 0.000672653317451477, 0.0007182061672210693, 0.0007637590169906616, 0.0008093118667602539, 0.0008548647165298462, 0.0009004175662994385, 0.0009459704160690308, 0.000991523265838623, 0.0010370761156082153, 0.0010826289653778076, 0.0011281818151474, 0.0011737346649169922, 0.0012192875146865845, 0.0012648403644561768, 0.001310393214225769, 0.0013559460639953613, 0.0014014989137649536, 0.001447051763534546, 0.0014926046133041382, 0.0015381574630737305, 0.0015837103128433228, 0.001629263162612915, 0.0016748160123825073, 0.0017203688621520996, 0.001765921711921692, 0.0018114745616912842, 0.0018570274114608765, 0.0019025802612304688]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 20.0, 20.0, 33.0, 51.0, 85.0, 121.0, 181.0, 284.0, 596.0, 1232.0, 3033.0, 9596.0, 43192.0, 657578.0, 285107.0, 34192.0, 8020.0, 2675.0, 1189.0, 560.0, 261.0, 163.0, 97.0, 67.0, 44.0, 36.0, 31.0, 17.0, 8.0, 4.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.967742919921875, -2.86517333984375, -2.762603759765625, -2.6600341796875, -2.557464599609375, -2.45489501953125, -2.352325439453125, -2.249755859375, -2.147186279296875, -2.04461669921875, -1.942047119140625, -1.8394775390625, -1.736907958984375, -1.63433837890625, -1.531768798828125, -1.42919921875, -1.326629638671875, -1.22406005859375, -1.121490478515625, -1.0189208984375, -0.916351318359375, -0.81378173828125, -0.711212158203125, -0.608642578125, -0.506072998046875, -0.40350341796875, -0.300933837890625, -0.1983642578125, -0.095794677734375, 0.00677490234375, 0.109344482421875, 0.2119140625, 0.314483642578125, 0.41705322265625, 0.519622802734375, 0.6221923828125, 0.724761962890625, 0.82733154296875, 0.929901123046875, 1.032470703125, 1.135040283203125, 1.23760986328125, 1.340179443359375, 1.4427490234375, 1.545318603515625, 1.64788818359375, 1.750457763671875, 1.85302734375, 1.955596923828125, 2.05816650390625, 2.160736083984375, 2.2633056640625, 2.365875244140625, 2.46844482421875, 2.571014404296875, 2.673583984375, 2.776153564453125, 2.87872314453125, 2.981292724609375, 3.0838623046875, 3.186431884765625, 3.28900146484375, 3.391571044921875, 3.494140625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 8.0, 6.0, 10.0, 8.0, 4.0, 10.0, 16.0, 20.0, 34.0, 35.0, 48.0, 68.0, 91.0, 76.0, 104.0, 86.0, 70.0, 67.0, 57.0, 37.0, 32.0, 20.0, 16.0, 15.0, 8.0, 14.0, 8.0, 10.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.33984375, -2.268035888671875, -2.19622802734375, -2.124420166015625, -2.0526123046875, -1.980804443359375, -1.90899658203125, -1.837188720703125, -1.765380859375, -1.693572998046875, -1.62176513671875, -1.549957275390625, -1.4781494140625, -1.406341552734375, -1.33453369140625, -1.262725830078125, -1.19091796875, -1.119110107421875, -1.04730224609375, -0.975494384765625, -0.9036865234375, -0.831878662109375, -0.76007080078125, -0.688262939453125, -0.616455078125, -0.544647216796875, -0.47283935546875, -0.401031494140625, -0.3292236328125, -0.257415771484375, -0.18560791015625, -0.113800048828125, -0.0419921875, 0.029815673828125, 0.10162353515625, 0.173431396484375, 0.2452392578125, 0.317047119140625, 0.38885498046875, 0.460662841796875, 0.532470703125, 0.604278564453125, 0.67608642578125, 0.747894287109375, 0.8197021484375, 0.891510009765625, 0.96331787109375, 1.035125732421875, 1.10693359375, 1.178741455078125, 1.25054931640625, 1.322357177734375, 1.3941650390625, 1.465972900390625, 1.53778076171875, 1.609588623046875, 1.681396484375, 1.753204345703125, 1.82501220703125, 1.896820068359375, 1.9686279296875, 2.040435791015625, 2.11224365234375, 2.184051513671875, 2.255859375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 31.0, 86.0, 228.0, 424.0, 114.0, 55.0, 17.0, 9.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.10440826416016, -74.27012634277344, -71.43583679199219, -68.60155487060547, -65.76727294921875, -62.9329833984375, -60.09870147705078, -57.2644157409668, -54.43013000488281, -51.59584426879883, -48.761558532714844, -45.927276611328125, -43.09299087524414, -40.258705139160156, -37.42442321777344, -34.59013748168945, -31.75585174560547, -28.921566009521484, -26.087282180786133, -23.25299835205078, -20.418712615966797, -17.584426879882812, -14.750143051147461, -11.91585922241211, -9.081573486328125, -6.247288703918457, -3.413003921508789, -0.5787191390991211, 2.255565643310547, 5.089850425720215, 7.924135208129883, 10.758419036865234, 13.59271240234375, 16.426998138427734, 19.261281967163086, 22.095565795898438, 24.929851531982422, 27.764137268066406, 30.598421096801758, 33.43270492553711, 36.266990661621094, 39.10127639770508, 41.93556213378906, 44.76984405517578, 47.604129791259766, 50.43841552734375, 53.27269744873047, 56.10698318481445, 58.94126892089844, 61.77555465698242, 64.6098403930664, 67.44412231445312, 70.27841186523438, 73.1126937866211, 75.94697570800781, 78.78126525878906, 81.61554718017578, 84.4498291015625, 87.28411865234375, 90.11840057373047, 92.95268249511719, 95.78697204589844, 98.62125396728516, 101.45553588867188, 104.28982543945312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 3.0, 9.0, 15.0, 7.0, 6.0, 17.0, 8.0, 12.0, 15.0, 21.0, 16.0, 21.0, 25.0, 35.0, 30.0, 39.0, 57.0, 121.0, 142.0, 64.0, 45.0, 39.0, 38.0, 27.0, 23.0, 26.0, 23.0, 16.0, 13.0, 16.0, 10.0, 10.0, 10.0, 10.0, 6.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-48.115516662597656, -46.81957244873047, -45.52363204956055, -44.227691650390625, -42.93174743652344, -41.63580322265625, -40.33986282348633, -39.043922424316406, -37.74797821044922, -36.45203399658203, -35.15609359741211, -33.86015319824219, -32.564208984375, -31.268266677856445, -29.97232437133789, -28.676382064819336, -27.38043975830078, -26.084497451782227, -24.788555145263672, -23.492612838745117, -22.196670532226562, -20.900728225708008, -19.604785919189453, -18.3088436126709, -17.012901306152344, -15.716958999633789, -14.421016693115234, -13.12507438659668, -11.829132080078125, -10.53318977355957, -9.237247467041016, -7.941305160522461, -6.645366668701172, -5.349424362182617, -4.0534820556640625, -2.757539749145508, -1.4615974426269531, -0.16565513610839844, 1.1302871704101562, 2.426229476928711, 3.7221717834472656, 5.01811408996582, 6.314056396484375, 7.60999870300293, 8.905941009521484, 10.201883316040039, 11.497825622558594, 12.793767929077148, 14.089710235595703, 15.385652542114258, 16.681594848632812, 17.977537155151367, 19.273479461669922, 20.569421768188477, 21.86536407470703, 23.161306381225586, 24.45724868774414, 25.753190994262695, 27.04913330078125, 28.345075607299805, 29.64101791381836, 30.936960220336914, 32.23290252685547, 33.528846740722656, 34.82478713989258]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 8.0, 15.0, 5.0, 19.0, 37.0, 50.0, 68.0, 112.0, 182.0, 264.0, 473.0, 753.0, 1254.0, 2263.0, 4576.0, 9822.0, 25710.0, 96687.0, 497537.0, 1798628.0, 1351741.0, 305684.0, 63342.0, 18941.0, 7723.0, 3608.0, 1888.0, 1074.0, 672.0, 399.0, 247.0, 172.0, 92.0, 73.0, 37.0, 34.0, 20.0, 15.0, 17.0, 10.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.625, -4.47979736328125, -4.3345947265625, -4.18939208984375, -4.044189453125, -3.89898681640625, -3.7537841796875, -3.60858154296875, -3.46337890625, -3.31817626953125, -3.1729736328125, -3.02777099609375, -2.882568359375, -2.73736572265625, -2.5921630859375, -2.44696044921875, -2.3017578125, -2.15655517578125, -2.0113525390625, -1.86614990234375, -1.720947265625, -1.57574462890625, -1.4305419921875, -1.28533935546875, -1.14013671875, -0.99493408203125, -0.8497314453125, -0.70452880859375, -0.559326171875, -0.41412353515625, -0.2689208984375, -0.12371826171875, 0.021484375, 0.16668701171875, 0.3118896484375, 0.45709228515625, 0.602294921875, 0.74749755859375, 0.8927001953125, 1.03790283203125, 1.18310546875, 1.32830810546875, 1.4735107421875, 1.61871337890625, 1.763916015625, 1.90911865234375, 2.0543212890625, 2.19952392578125, 2.3447265625, 2.48992919921875, 2.6351318359375, 2.78033447265625, 2.925537109375, 3.07073974609375, 3.2159423828125, 3.36114501953125, 3.50634765625, 3.65155029296875, 3.7967529296875, 3.94195556640625, 4.087158203125, 4.23236083984375, 4.3775634765625, 4.52276611328125, 4.66796875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 10.0, 14.0, 16.0, 19.0, 13.0, 17.0, 29.0, 19.0, 32.0, 47.0, 28.0, 48.0, 53.0, 58.0, 43.0, 63.0, 57.0, 51.0, 43.0, 42.0, 27.0, 39.0, 42.0, 34.0, 23.0, 18.0, 31.0, 21.0, 15.0, 14.0, 6.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.868316650390625, -2.77764892578125, -2.686981201171875, -2.5963134765625, -2.505645751953125, -2.41497802734375, -2.324310302734375, -2.233642578125, -2.142974853515625, -2.05230712890625, -1.961639404296875, -1.8709716796875, -1.780303955078125, -1.68963623046875, -1.598968505859375, -1.50830078125, -1.417633056640625, -1.32696533203125, -1.236297607421875, -1.1456298828125, -1.054962158203125, -0.96429443359375, -0.873626708984375, -0.782958984375, -0.692291259765625, -0.60162353515625, -0.510955810546875, -0.4202880859375, -0.329620361328125, -0.23895263671875, -0.148284912109375, -0.0576171875, 0.033050537109375, 0.12371826171875, 0.214385986328125, 0.3050537109375, 0.395721435546875, 0.48638916015625, 0.577056884765625, 0.667724609375, 0.758392333984375, 0.84906005859375, 0.939727783203125, 1.0303955078125, 1.121063232421875, 1.21173095703125, 1.302398681640625, 1.39306640625, 1.483734130859375, 1.57440185546875, 1.665069580078125, 1.7557373046875, 1.846405029296875, 1.93707275390625, 2.027740478515625, 2.118408203125, 2.209075927734375, 2.29974365234375, 2.390411376953125, 2.4810791015625, 2.571746826171875, 2.66241455078125, 2.753082275390625, 2.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 14.0, 24.0, 44.0, 71.0, 185.0, 389.0, 1512.0, 18968.0, 4162834.0, 8436.0, 1218.0, 330.0, 115.0, 64.0, 29.0, 13.0, 15.0, 8.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.15625, -47.5390625, -45.921875, -44.3046875, -42.6875, -41.0703125, -39.453125, -37.8359375, -36.21875, -34.6015625, -32.984375, -31.3671875, -29.75, -28.1328125, -26.515625, -24.8984375, -23.28125, -21.6640625, -20.046875, -18.4296875, -16.8125, -15.1953125, -13.578125, -11.9609375, -10.34375, -8.7265625, -7.109375, -5.4921875, -3.875, -2.2578125, -0.640625, 0.9765625, 2.59375, 4.2109375, 5.828125, 7.4453125, 9.0625, 10.6796875, 12.296875, 13.9140625, 15.53125, 17.1484375, 18.765625, 20.3828125, 22.0, 23.6171875, 25.234375, 26.8515625, 28.46875, 30.0859375, 31.703125, 33.3203125, 34.9375, 36.5546875, 38.171875, 39.7890625, 41.40625, 43.0234375, 44.640625, 46.2578125, 47.875, 49.4921875, 51.109375, 52.7265625, 54.34375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 10.0, 34.0, 74.0, 156.0, 269.0, 566.0, 1004.0, 908.0, 499.0, 251.0, 113.0, 91.0, 41.0, 24.0, 12.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.7734375, -15.2071533203125, -14.640869140625, -14.0745849609375, -13.50830078125, -12.9420166015625, -12.375732421875, -11.8094482421875, -11.2431640625, -10.6768798828125, -10.110595703125, -9.5443115234375, -8.97802734375, -8.4117431640625, -7.845458984375, -7.2791748046875, -6.712890625, -6.1466064453125, -5.580322265625, -5.0140380859375, -4.44775390625, -3.8814697265625, -3.315185546875, -2.7489013671875, -2.1826171875, -1.6163330078125, -1.050048828125, -0.4837646484375, 0.08251953125, 0.6488037109375, 1.215087890625, 1.7813720703125, 2.34765625, 2.9139404296875, 3.480224609375, 4.0465087890625, 4.61279296875, 5.1790771484375, 5.745361328125, 6.3116455078125, 6.8779296875, 7.4442138671875, 8.010498046875, 8.5767822265625, 9.14306640625, 9.7093505859375, 10.275634765625, 10.8419189453125, 11.408203125, 11.9744873046875, 12.540771484375, 13.1070556640625, 13.67333984375, 14.2396240234375, 14.805908203125, 15.3721923828125, 15.9384765625, 16.5047607421875, 17.071044921875, 17.6373291015625, 18.20361328125, 18.7698974609375, 19.336181640625, 19.9024658203125, 20.46875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 12.0, 40.0, 92.0, 242.0, 257.0, 172.0, 84.0, 40.0, 14.0, 5.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.33010864257812, -143.35935974121094, -137.3886260986328, -131.41787719726562, -125.44713592529297, -119.47639465332031, -113.50564575195312, -107.53490447998047, -101.56416320800781, -95.59342193603516, -89.6226806640625, -83.65193176269531, -77.68119049072266, -71.71044921875, -65.73970031738281, -59.768959045410156, -53.7982177734375, -47.827476501464844, -41.85673141479492, -35.885986328125, -29.915245056152344, -23.944501876831055, -17.973758697509766, -12.003013610839844, -6.0322723388671875, -0.06152915954589844, 5.909214019775391, 11.87995719909668, 17.85070037841797, 23.821443557739258, 29.792186737060547, 35.76293182373047, 41.733673095703125, 47.70441436767578, 53.6751594543457, 59.645904541015625, 65.61664581298828, 71.58738708496094, 77.55813598632812, 83.52887725830078, 89.49961853027344, 95.4703598022461, 101.44110107421875, 107.41184997558594, 113.3825912475586, 119.35333251953125, 125.32408142089844, 131.29483032226562, 137.26556396484375, 143.23631286621094, 149.20704650878906, 155.17779541015625, 161.14852905273438, 167.11927795410156, 173.09002685546875, 179.06076049804688, 185.03150939941406, 191.00225830078125, 196.97299194335938, 202.94374084472656, 208.91448974609375, 214.88522338867188, 220.85597229003906, 226.82672119140625, 232.79745483398438]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 11.0, 14.0, 15.0, 22.0, 33.0, 30.0, 34.0, 45.0, 62.0, 55.0, 67.0, 68.0, 91.0, 71.0, 72.0, 58.0, 50.0, 46.0, 39.0, 32.0, 19.0, 23.0, 14.0, 3.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.39311981201172, -70.87631225585938, -68.3594970703125, -65.84268951416016, -63.32587432861328, -60.80906295776367, -58.29225158691406, -55.77544403076172, -53.258628845214844, -50.741817474365234, -48.225006103515625, -45.708194732666016, -43.191383361816406, -40.6745719909668, -38.15776062011719, -35.640953063964844, -33.124141693115234, -30.607330322265625, -28.090518951416016, -25.573707580566406, -23.056896209716797, -20.540084838867188, -18.02327537536621, -15.506464004516602, -12.989652633666992, -10.472841262817383, -7.956030368804932, -5.4392194747924805, -2.922408103942871, -0.4055967330932617, 2.1112136840820312, 4.628025054931641, 7.14483642578125, 9.66164779663086, 12.178459167480469, 14.695269584655762, 17.212081909179688, 19.728893280029297, 22.245702743530273, 24.762514114379883, 27.279325485229492, 29.7961368560791, 32.31294631958008, 34.82975769042969, 37.3465690612793, 39.863380432128906, 42.380191802978516, 44.897003173828125, 47.413814544677734, 49.930625915527344, 52.44743728637695, 54.96424865722656, 57.48106002807617, 59.99787139892578, 62.514678955078125, 65.031494140625, 67.54830169677734, 70.06510925292969, 72.58192443847656, 75.0987319946289, 77.61554718017578, 80.13235473632812, 82.649169921875, 85.16597747802734, 87.68279266357422]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 8.0, 11.0, 11.0, 22.0, 28.0, 48.0, 57.0, 114.0, 152.0, 248.0, 457.0, 817.0, 1625.0, 3405.0, 8132.0, 26376.0, 136898.0, 706073.0, 124744.0, 24816.0, 7833.0, 3228.0, 1584.0, 776.0, 442.0, 246.0, 145.0, 73.0, 52.0, 42.0, 29.0, 13.0, 13.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.59893798828125, -6.3892822265625, -6.17962646484375, -5.969970703125, -5.76031494140625, -5.5506591796875, -5.34100341796875, -5.13134765625, -4.92169189453125, -4.7120361328125, -4.50238037109375, -4.292724609375, -4.08306884765625, -3.8734130859375, -3.66375732421875, -3.4541015625, -3.24444580078125, -3.0347900390625, -2.82513427734375, -2.615478515625, -2.40582275390625, -2.1961669921875, -1.98651123046875, -1.77685546875, -1.56719970703125, -1.3575439453125, -1.14788818359375, -0.938232421875, -0.72857666015625, -0.5189208984375, -0.30926513671875, -0.099609375, 0.11004638671875, 0.3197021484375, 0.52935791015625, 0.739013671875, 0.94866943359375, 1.1583251953125, 1.36798095703125, 1.57763671875, 1.78729248046875, 1.9969482421875, 2.20660400390625, 2.416259765625, 2.62591552734375, 2.8355712890625, 3.04522705078125, 3.2548828125, 3.46453857421875, 3.6741943359375, 3.88385009765625, 4.093505859375, 4.30316162109375, 4.5128173828125, 4.72247314453125, 4.93212890625, 5.14178466796875, 5.3514404296875, 5.56109619140625, 5.770751953125, 5.98040771484375, 6.1900634765625, 6.39971923828125, 6.609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 9.0, 13.0, 21.0, 19.0, 35.0, 27.0, 38.0, 57.0, 49.0, 48.0, 67.0, 55.0, 65.0, 50.0, 61.0, 64.0, 50.0, 37.0, 46.0, 40.0, 29.0, 25.0, 15.0, 15.0, 15.0, 10.0, 4.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.60516357421875, -4.4603271484375, -4.31549072265625, -4.170654296875, -4.02581787109375, -3.8809814453125, -3.73614501953125, -3.59130859375, -3.44647216796875, -3.3016357421875, -3.15679931640625, -3.011962890625, -2.86712646484375, -2.7222900390625, -2.57745361328125, -2.4326171875, -2.28778076171875, -2.1429443359375, -1.99810791015625, -1.853271484375, -1.70843505859375, -1.5635986328125, -1.41876220703125, -1.27392578125, -1.12908935546875, -0.9842529296875, -0.83941650390625, -0.694580078125, -0.54974365234375, -0.4049072265625, -0.26007080078125, -0.115234375, 0.02960205078125, 0.1744384765625, 0.31927490234375, 0.464111328125, 0.60894775390625, 0.7537841796875, 0.89862060546875, 1.04345703125, 1.18829345703125, 1.3331298828125, 1.47796630859375, 1.622802734375, 1.76763916015625, 1.9124755859375, 2.05731201171875, 2.2021484375, 2.34698486328125, 2.4918212890625, 2.63665771484375, 2.781494140625, 2.92633056640625, 3.0711669921875, 3.21600341796875, 3.36083984375, 3.50567626953125, 3.6505126953125, 3.79534912109375, 3.940185546875, 4.08502197265625, 4.2298583984375, 4.37469482421875, 4.51953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 8.0, 10.0, 9.0, 17.0, 21.0, 27.0, 39.0, 66.0, 87.0, 122.0, 300.0, 588.0, 1564.0, 6857.0, 76798.0, 929357.0, 26756.0, 3752.0, 1127.0, 408.0, 215.0, 128.0, 94.0, 51.0, 38.0, 25.0, 14.0, 14.0, 15.0, 9.0, 7.0, 6.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.942138671875, -9.60302734375, -9.263916015625, -8.9248046875, -8.585693359375, -8.24658203125, -7.907470703125, -7.568359375, -7.229248046875, -6.89013671875, -6.551025390625, -6.2119140625, -5.872802734375, -5.53369140625, -5.194580078125, -4.85546875, -4.516357421875, -4.17724609375, -3.838134765625, -3.4990234375, -3.159912109375, -2.82080078125, -2.481689453125, -2.142578125, -1.803466796875, -1.46435546875, -1.125244140625, -0.7861328125, -0.447021484375, -0.10791015625, 0.231201171875, 0.5703125, 0.909423828125, 1.24853515625, 1.587646484375, 1.9267578125, 2.265869140625, 2.60498046875, 2.944091796875, 3.283203125, 3.622314453125, 3.96142578125, 4.300537109375, 4.6396484375, 4.978759765625, 5.31787109375, 5.656982421875, 5.99609375, 6.335205078125, 6.67431640625, 7.013427734375, 7.3525390625, 7.691650390625, 8.03076171875, 8.369873046875, 8.708984375, 9.048095703125, 9.38720703125, 9.726318359375, 10.0654296875, 10.404541015625, 10.74365234375, 11.082763671875, 11.421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 7.0, 4.0, 11.0, 6.0, 13.0, 15.0, 14.0, 21.0, 23.0, 23.0, 27.0, 41.0, 45.0, 36.0, 69.0, 91.0, 80.0, 75.0, 65.0, 53.0, 53.0, 38.0, 32.0, 21.0, 24.0, 14.0, 16.0, 15.0, 10.0, 10.0, 14.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.9296875, -15.4547119140625, -14.979736328125, -14.5047607421875, -14.02978515625, -13.5548095703125, -13.079833984375, -12.6048583984375, -12.1298828125, -11.6549072265625, -11.179931640625, -10.7049560546875, -10.22998046875, -9.7550048828125, -9.280029296875, -8.8050537109375, -8.330078125, -7.8551025390625, -7.380126953125, -6.9051513671875, -6.43017578125, -5.9552001953125, -5.480224609375, -5.0052490234375, -4.5302734375, -4.0552978515625, -3.580322265625, -3.1053466796875, -2.63037109375, -2.1553955078125, -1.680419921875, -1.2054443359375, -0.73046875, -0.2554931640625, 0.219482421875, 0.6944580078125, 1.16943359375, 1.6444091796875, 2.119384765625, 2.5943603515625, 3.0693359375, 3.5443115234375, 4.019287109375, 4.4942626953125, 4.96923828125, 5.4442138671875, 5.919189453125, 6.3941650390625, 6.869140625, 7.3441162109375, 7.819091796875, 8.2940673828125, 8.76904296875, 9.2440185546875, 9.718994140625, 10.1939697265625, 10.6689453125, 11.1439208984375, 11.618896484375, 12.0938720703125, 12.56884765625, 13.0438232421875, 13.518798828125, 13.9937744140625, 14.46875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 6.0, 8.0, 12.0, 20.0, 26.0, 34.0, 57.0, 106.0, 168.0, 272.0, 551.0, 1405.0, 4246.0, 18770.0, 782029.0, 219379.0, 15350.0, 3598.0, 1256.0, 538.0, 277.0, 156.0, 96.0, 61.0, 35.0, 21.0, 19.0, 20.0, 11.0, 6.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9833984375, -1.9213104248046875, -1.859222412109375, -1.7971343994140625, -1.73504638671875, -1.6729583740234375, -1.610870361328125, -1.5487823486328125, -1.4866943359375, -1.4246063232421875, -1.362518310546875, -1.3004302978515625, -1.23834228515625, -1.1762542724609375, -1.114166259765625, -1.0520782470703125, -0.989990234375, -0.9279022216796875, -0.865814208984375, -0.8037261962890625, -0.74163818359375, -0.6795501708984375, -0.617462158203125, -0.5553741455078125, -0.4932861328125, -0.4311981201171875, -0.369110107421875, -0.3070220947265625, -0.24493408203125, -0.1828460693359375, -0.120758056640625, -0.0586700439453125, 0.00341796875, 0.0655059814453125, 0.127593994140625, 0.1896820068359375, 0.25177001953125, 0.3138580322265625, 0.375946044921875, 0.4380340576171875, 0.5001220703125, 0.5622100830078125, 0.624298095703125, 0.6863861083984375, 0.74847412109375, 0.8105621337890625, 0.872650146484375, 0.9347381591796875, 0.996826171875, 1.0589141845703125, 1.121002197265625, 1.1830902099609375, 1.24517822265625, 1.3072662353515625, 1.369354248046875, 1.4314422607421875, 1.4935302734375, 1.5556182861328125, 1.617706298828125, 1.6797943115234375, 1.74188232421875, 1.8039703369140625, 1.866058349609375, 1.9281463623046875, 1.990234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 11.0, 7.0, 16.0, 21.0, 31.0, 53.0, 81.0, 141.0, 209.0, 134.0, 91.0, 59.0, 28.0, 18.0, 13.0, 18.0, 6.0, 5.0, 5.0, 4.0, 2.0, 5.0, 7.0, 2.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00047135353088378906, -0.00045420601963996887, -0.0004370585083961487, -0.0004199109971523285, -0.0004027634859085083, -0.0003856159746646881, -0.0003684684634208679, -0.00035132095217704773, -0.00033417344093322754, -0.00031702592968940735, -0.00029987841844558716, -0.00028273090720176697, -0.0002655833959579468, -0.0002484358847141266, -0.0002312883734703064, -0.0002141408622264862, -0.00019699335098266602, -0.00017984583973884583, -0.00016269832849502563, -0.00014555081725120544, -0.00012840330600738525, -0.00011125579476356506, -9.410828351974487e-05, -7.696077227592468e-05, -5.981326103210449e-05, -4.26657497882843e-05, -2.551823854446411e-05, -8.370727300643921e-06, 8.77678394317627e-06, 2.592429518699646e-05, 4.307180643081665e-05, 6.021931767463684e-05, 7.736682891845703e-05, 9.451434016227722e-05, 0.00011166185140609741, 0.0001288093626499176, 0.0001459568738937378, 0.00016310438513755798, 0.00018025189638137817, 0.00019739940762519836, 0.00021454691886901855, 0.00023169443011283875, 0.00024884194135665894, 0.0002659894526004791, 0.0002831369638442993, 0.0003002844750881195, 0.0003174319863319397, 0.0003345794975757599, 0.0003517270088195801, 0.00036887452006340027, 0.00038602203130722046, 0.00040316954255104065, 0.00042031705379486084, 0.00043746456503868103, 0.0004546120762825012, 0.0004717595875263214, 0.0004889070987701416, 0.0005060546100139618, 0.000523202121257782, 0.0005403496325016022, 0.0005574971437454224, 0.0005746446549892426, 0.0005917921662330627, 0.0006089396774768829, 0.0006260871887207031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 13.0, 18.0, 12.0, 22.0, 30.0, 46.0, 65.0, 100.0, 177.0, 247.0, 430.0, 786.0, 1488.0, 2946.0, 7233.0, 20771.0, 104571.0, 825771.0, 58469.0, 14652.0, 5396.0, 2429.0, 1228.0, 658.0, 343.0, 221.0, 131.0, 99.0, 51.0, 44.0, 30.0, 15.0, 12.0, 11.0, 7.0, 4.0, 7.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4365234375, -1.3958892822265625, -1.355255126953125, -1.3146209716796875, -1.27398681640625, -1.2333526611328125, -1.192718505859375, -1.1520843505859375, -1.1114501953125, -1.0708160400390625, -1.030181884765625, -0.9895477294921875, -0.94891357421875, -0.9082794189453125, -0.867645263671875, -0.8270111083984375, -0.786376953125, -0.7457427978515625, -0.705108642578125, -0.6644744873046875, -0.62384033203125, -0.5832061767578125, -0.542572021484375, -0.5019378662109375, -0.4613037109375, -0.4206695556640625, -0.380035400390625, -0.3394012451171875, -0.29876708984375, -0.2581329345703125, -0.217498779296875, -0.1768646240234375, -0.13623046875, -0.0955963134765625, -0.054962158203125, -0.0143280029296875, 0.02630615234375, 0.0669403076171875, 0.107574462890625, 0.1482086181640625, 0.1888427734375, 0.2294769287109375, 0.270111083984375, 0.3107452392578125, 0.35137939453125, 0.3920135498046875, 0.432647705078125, 0.4732818603515625, 0.513916015625, 0.5545501708984375, 0.595184326171875, 0.6358184814453125, 0.67645263671875, 0.7170867919921875, 0.757720947265625, 0.7983551025390625, 0.8389892578125, 0.8796234130859375, 0.920257568359375, 0.9608917236328125, 1.00152587890625, 1.0421600341796875, 1.082794189453125, 1.1234283447265625, 1.1640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 10.0, 9.0, 19.0, 16.0, 23.0, 36.0, 32.0, 43.0, 58.0, 67.0, 82.0, 76.0, 95.0, 93.0, 66.0, 47.0, 33.0, 32.0, 25.0, 16.0, 13.0, 9.0, 7.0, 2.0, 8.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.97802734375, -0.9470596313476562, -0.9160919189453125, -0.8851242065429688, -0.854156494140625, -0.8231887817382812, -0.7922210693359375, -0.7612533569335938, -0.73028564453125, -0.6993179321289062, -0.6683502197265625, -0.6373825073242188, -0.606414794921875, -0.5754470825195312, -0.5444793701171875, -0.5135116577148438, -0.4825439453125, -0.45157623291015625, -0.4206085205078125, -0.38964080810546875, -0.358673095703125, -0.32770538330078125, -0.2967376708984375, -0.26576995849609375, -0.23480224609375, -0.20383453369140625, -0.1728668212890625, -0.14189910888671875, -0.110931396484375, -0.07996368408203125, -0.0489959716796875, -0.01802825927734375, 0.012939453125, 0.04390716552734375, 0.0748748779296875, 0.10584259033203125, 0.136810302734375, 0.16777801513671875, 0.1987457275390625, 0.22971343994140625, 0.26068115234375, 0.29164886474609375, 0.3226165771484375, 0.35358428955078125, 0.384552001953125, 0.41551971435546875, 0.4464874267578125, 0.47745513916015625, 0.5084228515625, 0.5393905639648438, 0.5703582763671875, 0.6013259887695312, 0.632293701171875, 0.6632614135742188, 0.6942291259765625, 0.7251968383789062, 0.75616455078125, 0.7871322631835938, 0.8180999755859375, 0.8490676879882812, 0.880035400390625, 0.9110031127929688, 0.9419708251953125, 0.9729385375976562, 1.00390625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 19.0, 49.0, 214.0, 581.0, 90.0, 29.0, 9.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.48039245605469, -68.4775619506836, -64.4747314453125, -60.47189712524414, -56.46906661987305, -52.46623611450195, -48.463401794433594, -44.4605712890625, -40.457740783691406, -36.45491027832031, -32.45207977294922, -28.44924545288086, -24.446414947509766, -20.443584442138672, -16.440752029418945, -12.437919616699219, -8.435089111328125, -4.432257652282715, -0.4294261932373047, 3.5734052658081055, 7.576236724853516, 11.57906723022461, 15.581899642944336, 19.584732055664062, 23.587562561035156, 27.59039306640625, 31.593225479125977, 35.5960578918457, 39.5988883972168, 43.60171890258789, 47.60455322265625, 51.607383728027344, 55.6102294921875, 59.613059997558594, 63.61589050292969, 67.61872100830078, 71.62155151367188, 75.6243896484375, 79.6272201538086, 83.63005065917969, 87.63288116455078, 91.63571166992188, 95.63854217529297, 99.64137268066406, 103.64421081542969, 107.64703369140625, 111.64987182617188, 115.65270233154297, 119.65553283691406, 123.65836334228516, 127.66119384765625, 131.66403198242188, 135.66685485839844, 139.66969299316406, 143.67251586914062, 147.67535400390625, 151.67819213867188, 155.6810302734375, 159.68385314941406, 163.6866912841797, 167.68951416015625, 171.69235229492188, 175.69517517089844, 179.69801330566406, 183.70083618164062]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 5.0, 7.0, 11.0, 6.0, 12.0, 17.0, 18.0, 19.0, 25.0, 30.0, 19.0, 23.0, 30.0, 53.0, 303.0, 158.0, 37.0, 37.0, 29.0, 19.0, 27.0, 21.0, 17.0, 19.0, 9.0, 11.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.92304992675781, -50.28929138183594, -48.65553283691406, -47.02177429199219, -45.38801574707031, -43.75425720214844, -42.12049865722656, -40.48674011230469, -38.85298156738281, -37.21922302246094, -35.58546447753906, -33.95170593261719, -32.31794738769531, -30.684188842773438, -29.05042839050293, -27.416669845581055, -25.782909393310547, -24.149150848388672, -22.515392303466797, -20.881633758544922, -19.247875213623047, -17.614116668701172, -15.980356216430664, -14.346597671508789, -12.712839126586914, -11.079080581665039, -9.445322036743164, -7.811562538146973, -6.177803993225098, -4.544045448303223, -2.9102859497070312, -1.2765274047851562, 0.35723114013671875, 1.9909899234771729, 3.624748706817627, 5.25850772857666, 6.892266273498535, 8.52602481842041, 10.159784317016602, 11.793542861938477, 13.427301406860352, 15.061059951782227, 16.6948184967041, 18.32857894897461, 19.962337493896484, 21.59609603881836, 23.229854583740234, 24.86361312866211, 26.497371673583984, 28.13113021850586, 29.764888763427734, 31.39864730834961, 33.032405853271484, 34.66616439819336, 36.2999267578125, 37.933685302734375, 39.56744384765625, 41.201202392578125, 42.8349609375, 44.468719482421875, 46.10247802734375, 47.736236572265625, 49.3699951171875, 51.003753662109375, 52.63751220703125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 14.0, 17.0, 18.0, 20.0, 33.0, 32.0, 45.0, 50.0, 59.0, 173.0, 198.0, 72.0, 59.0, 37.0, 39.0, 28.0, 25.0, 22.0, 11.0, 8.0, 6.0, 9.0, 7.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0234375, -5.86114501953125, -5.6988525390625, -5.53656005859375, -5.374267578125, -5.21197509765625, -5.0496826171875, -4.88739013671875, -4.72509765625, -4.56280517578125, -4.4005126953125, -4.23822021484375, -4.075927734375, -3.91363525390625, -3.7513427734375, -3.58905029296875, -3.4267578125, -3.26446533203125, -3.1021728515625, -2.93988037109375, -2.777587890625, -2.61529541015625, -2.4530029296875, -2.29071044921875, -2.12841796875, -1.96612548828125, -1.8038330078125, -1.64154052734375, -1.479248046875, -1.31695556640625, -1.1546630859375, -0.99237060546875, -0.830078125, -0.66778564453125, -0.5054931640625, -0.34320068359375, -0.180908203125, -0.01861572265625, 0.1436767578125, 0.30596923828125, 0.46826171875, 0.63055419921875, 0.7928466796875, 0.95513916015625, 1.117431640625, 1.27972412109375, 1.4420166015625, 1.60430908203125, 1.7666015625, 1.92889404296875, 2.0911865234375, 2.25347900390625, 2.415771484375, 2.57806396484375, 2.7403564453125, 2.90264892578125, 3.06494140625, 3.22723388671875, 3.3895263671875, 3.55181884765625, 3.714111328125, 3.87640380859375, 4.0386962890625, 4.20098876953125, 4.36328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 3.0, 6.0, 14.0, 16.0, 25.0, 42.0, 31.0, 63.0, 130.0, 221.0, 594.0, 2069.0, 15244.0, 8357033.0, 10467.0, 1565.0, 507.0, 210.0, 118.0, 60.0, 38.0, 30.0, 25.0, 25.0, 10.0, 11.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.689971923828125, -58.05156326293945, -56.41315460205078, -54.77474594116211, -53.13633728027344, -51.497928619384766, -49.859519958496094, -48.22111511230469, -46.58270263671875, -44.94429397583008, -43.305885314941406, -41.667476654052734, -40.02906799316406, -38.39065933227539, -36.75225067138672, -35.11384582519531, -33.47543716430664, -31.83702850341797, -30.198619842529297, -28.560211181640625, -26.921802520751953, -25.28339385986328, -23.644987106323242, -22.00657844543457, -20.3681697845459, -18.729761123657227, -17.091352462768555, -15.4529447555542, -13.814536094665527, -12.176127433776855, -10.5377197265625, -8.899311065673828, -7.260902404785156, -5.622493743896484, -3.9840855598449707, -2.345677375793457, -0.7072687149047852, 0.9311399459838867, 2.569547653198242, 4.207956314086914, 5.846364974975586, 7.484773635864258, 9.12318229675293, 10.761590003967285, 12.399998664855957, 14.038407325744629, 15.676815032958984, 17.315223693847656, 18.953632354736328, 20.592041015625, 22.230449676513672, 23.868858337402344, 25.507266998291016, 27.145675659179688, 28.784082412719727, 30.4224910736084, 32.06089782714844, 33.69930648803711, 35.33771514892578, 36.97612380981445, 38.614532470703125, 40.2529411315918, 41.89134979248047, 43.529754638671875, 45.16816711425781]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 1.0, 3.0, 5.0, 11.0, 5.0, 6.0, 3.0, 5.0, 9.0, 4.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.11027526855469, -63.181297302246094, -61.252315521240234, -59.32333755493164, -57.39435958862305, -55.46537780761719, -53.536399841308594, -51.607421875, -49.67844009399414, -47.74946212768555, -45.82048034667969, -43.891502380371094, -41.9625244140625, -40.03354263305664, -38.10456466674805, -36.17558288574219, -34.246604919433594, -32.317626953125, -30.388647079467773, -28.459667205810547, -26.53068733215332, -24.601707458496094, -22.6727294921875, -20.743749618530273, -18.814773559570312, -16.885793685913086, -14.956814765930176, -13.027835845947266, -11.098855972290039, -9.169877052307129, -7.240898132324219, -5.311918258666992, -3.3829383850097656, -1.4539591073989868, 0.475020170211792, 2.4039993286132812, 4.33297872543335, 6.261958122253418, 8.190937042236328, 10.119916915893555, 12.048895835876465, 13.977874755859375, 15.906854629516602, 17.835834503173828, 19.764812469482422, 21.69379234313965, 23.622772216796875, 25.55175018310547, 27.480730056762695, 29.409709930419922, 31.338687896728516, 33.267669677734375, 35.19664764404297, 37.12562561035156, 39.054603576660156, 40.983585357666016, 42.91256332397461, 44.8415412902832, 46.77052307128906, 48.699501037597656, 50.62847900390625, 52.55746078491211, 54.4864387512207, 56.41542053222656, 58.344398498535156]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 4.0, 8.0, 7.0, 13.0, 18.0, 18.0, 38.0, 42.0, 37.0, 43.0, 72.0, 71.0, 84.0, 102.0, 78.0, 70.0, 72.0, 50.0, 44.0, 21.0, 29.0, 22.0, 17.0, 14.0, 6.0, 4.0, 4.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-3.029296875, -2.95526123046875, -2.8812255859375, -2.80718994140625, -2.733154296875, -2.65911865234375, -2.5850830078125, -2.51104736328125, -2.43701171875, -2.36297607421875, -2.2889404296875, -2.21490478515625, -2.140869140625, -2.06683349609375, -1.9927978515625, -1.91876220703125, -1.8447265625, -1.77069091796875, -1.6966552734375, -1.62261962890625, -1.548583984375, -1.47454833984375, -1.4005126953125, -1.32647705078125, -1.25244140625, -1.17840576171875, -1.1043701171875, -1.03033447265625, -0.956298828125, -0.88226318359375, -0.8082275390625, -0.73419189453125, -0.66015625, -0.58612060546875, -0.5120849609375, -0.43804931640625, -0.364013671875, -0.28997802734375, -0.2159423828125, -0.14190673828125, -0.06787109375, 0.00616455078125, 0.0802001953125, 0.15423583984375, 0.228271484375, 0.30230712890625, 0.3763427734375, 0.45037841796875, 0.5244140625, 0.59844970703125, 0.6724853515625, 0.74652099609375, 0.820556640625, 0.89459228515625, 0.9686279296875, 1.04266357421875, 1.11669921875, 1.19073486328125, 1.2647705078125, 1.33880615234375, 1.412841796875, 1.48687744140625, 1.5609130859375, 1.63494873046875, 1.708984375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 14.0, 23.0, 25.0, 47.0, 65.0, 105.0, 150.0, 312.0, 591.0, 1248.0, 2663.0, 7037.0, 21889.0, 84213.0, 235570.0, 123293.0, 31050.0, 9183.0, 3414.0, 1496.0, 785.0, 399.0, 231.0, 154.0, 98.0, 59.0, 41.0, 26.0, 23.0, 14.0, 14.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.328125, -26.302490234375, -25.27685546875, -24.251220703125, -23.2255859375, -22.199951171875, -21.17431640625, -20.148681640625, -19.123046875, -18.097412109375, -17.07177734375, -16.046142578125, -15.0205078125, -13.994873046875, -12.96923828125, -11.943603515625, -10.91796875, -9.892333984375, -8.86669921875, -7.841064453125, -6.8154296875, -5.789794921875, -4.76416015625, -3.738525390625, -2.712890625, -1.687255859375, -0.66162109375, 0.364013671875, 1.3896484375, 2.415283203125, 3.44091796875, 4.466552734375, 5.4921875, 6.517822265625, 7.54345703125, 8.569091796875, 9.5947265625, 10.620361328125, 11.64599609375, 12.671630859375, 13.697265625, 14.722900390625, 15.74853515625, 16.774169921875, 17.7998046875, 18.825439453125, 19.85107421875, 20.876708984375, 21.90234375, 22.927978515625, 23.95361328125, 24.979248046875, 26.0048828125, 27.030517578125, 28.05615234375, 29.081787109375, 30.107421875, 31.133056640625, 32.15869140625, 33.184326171875, 34.2099609375, 35.235595703125, 36.26123046875, 37.286865234375, 38.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 5.0, 7.0, 6.0, 10.0, 12.0, 25.0, 13.0, 26.0, 35.0, 29.0, 41.0, 59.0, 53.0, 68.0, 54.0, 58.0, 65.0, 67.0, 39.0, 53.0, 49.0, 51.0, 35.0, 24.0, 24.0, 13.0, 21.0, 8.0, 16.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.659515380859375, -3.53192138671875, -3.404327392578125, -3.2767333984375, -3.149139404296875, -3.02154541015625, -2.893951416015625, -2.766357421875, -2.638763427734375, -2.51116943359375, -2.383575439453125, -2.2559814453125, -2.128387451171875, -2.00079345703125, -1.873199462890625, -1.74560546875, -1.618011474609375, -1.49041748046875, -1.362823486328125, -1.2352294921875, -1.107635498046875, -0.98004150390625, -0.852447509765625, -0.724853515625, -0.597259521484375, -0.46966552734375, -0.342071533203125, -0.2144775390625, -0.086883544921875, 0.04071044921875, 0.168304443359375, 0.2958984375, 0.423492431640625, 0.55108642578125, 0.678680419921875, 0.8062744140625, 0.933868408203125, 1.06146240234375, 1.189056396484375, 1.316650390625, 1.444244384765625, 1.57183837890625, 1.699432373046875, 1.8270263671875, 1.954620361328125, 2.08221435546875, 2.209808349609375, 2.33740234375, 2.464996337890625, 2.59259033203125, 2.720184326171875, 2.8477783203125, 2.975372314453125, 3.10296630859375, 3.230560302734375, 3.358154296875, 3.485748291015625, 3.61334228515625, 3.740936279296875, 3.8685302734375, 3.996124267578125, 4.12371826171875, 4.251312255859375, 4.37890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 12.0, 10.0, 21.0, 32.0, 81.0, 137.0, 89.0, 41.0, 24.0, 6.0, 9.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-71.03413391113281, -69.43814086914062, -67.8421401977539, -66.24614715576172, -64.650146484375, -63.05415344238281, -61.45815658569336, -59.862159729003906, -58.26616668701172, -56.670169830322266, -55.07417297363281, -53.478179931640625, -51.88218307495117, -50.28618621826172, -48.690189361572266, -47.09419250488281, -45.49819564819336, -43.902198791503906, -42.30620193481445, -40.710205078125, -39.11421203613281, -37.51821517944336, -35.922218322753906, -34.32622146606445, -32.730224609375, -31.134227752685547, -29.538232803344727, -27.942235946655273, -26.346240997314453, -24.750244140625, -23.154247283935547, -21.558250427246094, -19.962257385253906, -18.366260528564453, -16.770265579223633, -15.17426872253418, -13.578272819519043, -11.982276916503906, -10.386280059814453, -8.790284156799316, -7.19428825378418, -5.598292350769043, -4.002295970916748, -2.406299591064453, -0.8103036880493164, 0.7856922149658203, 2.3816890716552734, 3.97768497467041, 5.573680877685547, 7.169676780700684, 8.76567268371582, 10.361669540405273, 11.95766544342041, 13.553661346435547, 15.149658203125, 16.745655059814453, 18.341650009155273, 19.937646865844727, 21.533641815185547, 23.129638671875, 24.725635528564453, 26.321630477905273, 27.917627334594727, 29.513622283935547, 31.109619140625]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 8.0, 3.0, 4.0, 6.0, 5.0, 8.0, 10.0, 16.0, 28.0, 46.0, 49.0, 80.0, 61.0, 49.0, 32.0, 14.0, 10.0, 7.0, 9.0, 5.0, 4.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.81552505493164, -22.24567222595215, -21.675819396972656, -21.105968475341797, -20.536115646362305, -19.966262817382812, -19.39640998840332, -18.826557159423828, -18.25670623779297, -17.686853408813477, -17.117000579833984, -16.547149658203125, -15.977296829223633, -15.40744400024414, -14.837591171264648, -14.267738342285156, -13.697885513305664, -13.128032684326172, -12.558180809020996, -11.988327980041504, -11.418476104736328, -10.848623275756836, -10.278770446777344, -9.708917617797852, -9.139065742492676, -8.569212913513184, -7.999361038208008, -7.429508209228516, -6.859655857086182, -6.289803504943848, -5.7199506759643555, -5.1500983238220215, -4.5802459716796875, -4.0103936195373535, -3.4405410289764404, -2.8706884384155273, -2.3008360862731934, -1.7309837341308594, -1.1611311435699463, -0.5912785530090332, -0.02142620086669922, 0.5484262704849243, 1.1182787418365479, 1.6881312131881714, 2.257983684539795, 2.827836036682129, 3.397688627243042, 3.967541217803955, 4.537393569946289, 5.107245922088623, 5.677098274230957, 6.246951103210449, 6.816803455352783, 7.386655807495117, 7.956508636474609, 8.526361465454102, 9.096213340759277, 9.66606616973877, 10.235918045043945, 10.805770874023438, 11.37562370300293, 11.945475578308105, 12.515328407287598, 13.085180282592773, 13.655033111572266]}, "eval/loss": 6.049000263214111, "eval/wer": 1.1433359777865926, "eval/runtime": 744.98, "eval/samples_per_second": 3.546, "eval/steps_per_second": 0.444} \ No newline at end of file